In [22]:
import pandas as pd
import requests
import json
import time  
from tqdm import tqdm

import re
import nltk
from nltk.corpus import stopwords
from nltk.stem import WordNetLemmatizer
import string
from unidecode import unidecode

In [23]:
API_KEY = "AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU"

def analyze_text(text, language="pt"):
    default_scores = {
        "toxicity": None,
        "insult": None,
        "threat": None,
        "profanity": None,
        "identity_attack": None
    }

    if pd.isna(text) or not str(text).strip():
        print("Texto vazio ou NaN. Pulando.")
        return default_scores
    
    url = f"https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key={API_KEY}"
    data = {
        "comment": {"text": text},
        "languages": [language],
        "requestedAttributes": {
            "TOXICITY": {},
            "INSULT": {},
            "THREAT": {},
            "PROFANITY": {},
            "IDENTITY_ATTACK": {}
        }
    }

    try:
        response = requests.post(url, data=json.dumps(data))
        response.raise_for_status()
        result = response.json()

        scores = {
            "toxicity": result['attributeScores']['TOXICITY']['summaryScore']['value'],
            "insult": result['attributeScores']['INSULT']['summaryScore']['value'],
            "threat": result['attributeScores']['THREAT']['summaryScore']['value'],
            "profanity": result['attributeScores']['PROFANITY']['summaryScore']['value'],
            "identity_attack": result['attributeScores']['IDENTITY_ATTACK']['summaryScore']['value']
        }

        return scores
    except Exception as e:
        print(f"Erro com texto: {text[:40]}...\nErro: {e}")
        return default_scores



In [24]:

nltk.download('punkt')
nltk.download('stopwords')
nltk.download('wordnet')

lemmatizer = WordNetLemmatizer()
stop_words = set(stopwords.words('portuguese'))

custom_stopwords = {
    't', 'be', 'nao', 'youtu', 'vai', 'av', 'ja', 'to', 'the', 'this', 'i', 'and', 
    'you', 'y', 'www', 'sao', 'pois', 'contra', 'user', 'ai', 'so', 'gente', 'voce', 'of', 
    'ola', 'gift', 'card', 'kwaivideo', 'r', 'bom', 'q', 'vc', 'vcs', 'pra','ta', 'phone', 'ok', 'la',
    'sera', 'ha', 'aqui', 'ate', 'dia', 'mc', 'im', 'tmj', 'pix', 'g', 'diz', 'ti', 'etc', 'tudo', 
    'todo', 'toda', 'youtube', 'g1', 'm', 'instagram', 'fb', 'in', 'link', 'was', 'blocked', 'kk'
}

stop_words.update(custom_stopwords)

def preprocess_text(text):

    # Fun√ß√£o para extrair e substituir o dom√≠nio da URL
    def substituir_dominios(texto):
        # Fun√ß√£o para extrair e substituir o dom√≠nio da URL
        def extrair_dominio(url):
            # Remove o protocolo (http://, https://, etc.) e o "www." se presente
            dominio = re.sub(r'^https?://(?:www\.)?|www\.', '', url)
            # Remove o caminho e par√¢metros da URL
            dominio = re.split(r'[/?#]', dominio)[0]
            # Retorna a parte principal do dom√≠nio (antes do primeiro ponto)
            return dominio.split('.')[0]

        # Substitui URLs por seus dom√≠nios principais
        return re.sub(r'https?://(?:www\.)?\S+|www\.\S+', lambda match: extrair_dominio(match.group(0)), texto)

    # Substituir dom√≠nios
    text = substituir_dominios(text)

    # Converte para min√∫sculas
    text = text.lower()

    # Remove acentos
    text = unidecode(text)

    #Remover Pontua√ß√£o
    text = text.translate(str.maketrans('', '', string.punctuation))

    # Remove URLs e men√ß√µes
    #text = re.sub(r'http\S+|www\S+|https\S+|@\w+', '', text)

    # Substitui emojis repetidos por apenas um
    text = re.sub(r'([\U00010000-\U0010FFFF])\1+', r'\1', text)
    text = re.sub(r'([\U0001F600-\U0001F64F]|[\U0001F300-\U0001F5FF]|[\U0001F680-\U0001F6FF]|[\U0001F700-\U0001F77F]|[\U0001F780-\U0001F7FF]|[\U0001F800-\U0001F8FF]|[\U0001F900-\U0001F9FF]|[\U0001FA00-\U0001FA6F]|[\U0001FA70-\U0001FAFF])\1+', r'\1', text)


    # Remove espa√ßos em branco extras (in√≠cio ou final) e m√∫ltiplos espa√ßos no meio do texto
    text = re.sub(r'\s+', ' ', text).strip()

    # Remove pontua√ß√µes e caracteres especiais
    #text = re.sub(r'[^\w\s]', '', text)

    # Ajusta risadas "kkk" ou mais para "kk"
    text = re.sub(r'k{2,}|K{2,}', 'kk', text)

    # Ajusta risadas "haha" ou mais para "haha"
    text = re.sub(r'(ha){2,}', 'haha', text, flags=re.IGNORECASE)

    # Ajusta risadas "kaka" ou mais para "kaka"
    text = re.sub(r'(ka){2,}', 'kaka', text, flags=re.IGNORECASE)

    # Remove as stopwords
    text = ' '.join([word for word in text.split() if word not in stop_words])


    return text


[nltk_data] Downloading package punkt to C:\Users\Melissa
[nltk_data]     Felipe\AppData\Roaming\nltk_data...
[nltk_data]   Package punkt is already up-to-date!
[nltk_data] Downloading package stopwords to C:\Users\Melissa
[nltk_data]     Felipe\AppData\Roaming\nltk_data...
[nltk_data]   Package stopwords is already up-to-date!
[nltk_data] Downloading package wordnet to C:\Users\Melissa
[nltk_data]     Felipe\AppData\Roaming\nltk_data...
[nltk_data]   Package wordnet is already up-to-date!


## Telegram

In [25]:
df_telegram = pd.read_csv('../datasets/fakeTelegram.BR_2022.csv')
df_telegram.head()

Unnamed: 0,date_message,id_member_anonymous,id_group_anonymous,media,media_type,media_url,has_media,has_media_url,trava_zap,text_content_anonymous,dataset_info_id,date_system,score_sentiment,score_misinformation,id_message,id_persona,message_type,messenger,media_name,media_md5
0,2022-10-05 06:25:04,1078cc958f0febe28f4d03207660715f,12283e08a2eb5789201e105b34489ee7,,,,False,False,False,Ent√£o √© Fato Renato o √°udio que eu ouvi no wha...,5,2022-10-05 06:25:28.863641,0.0,,16385,Wanda Silva,Texto,telegram,,
1,2022-10-05 06:25:08,,12283e08a2eb5789201e105b34489ee7,,,,False,False,False,"Saiu no YouTube do presidente a 8 horas atr√°s,...",5,2022-10-05 06:25:28.926311,0.0644,,16386,Wanda Silva,Texto,telegram,,
2,2022-10-05 06:26:28,92a2d8fd7144074f659d1d29dc3751da,9f2d7394334eb224c061c9740b5748fc,,,,False,False,False,"√â isso, nossa parte j√° foi quase toda feita. N...",5,2022-10-05 06:26:29.361949,-0.3551,0.157242,16366,Wanda Silva,Texto,telegram,,
3,2022-10-05 06:27:28,d60aa38f62b4977426b70944af4aff72,c8f2de56550ed0bf85249608b7ead93d,94dca4cda503100ebfda7ce2bcc060eb.jpg,image/jpg,,True,False,False,GENTE ACHEI ELES EM UMA SEITA MA√áON√ÅRICA,5,2022-10-05 06:27:29.935624,0.0,,19281,Wanda Silva,Imagem,telegram,,94dca4cda503100ebfda7ce2bcc060eb
4,2022-10-05 06:27:44,cd6979b0b5265f08468fa1689b6300ce,e56ec342fc599ebb4ed89655eb6f03aa,5ad5c8bbe9da93a37fecf3e5aa5b0637.jpg,image/jpg,,True,False,False,,5,2022-10-05 06:28:29.316325,,,507185,Wanda Silva,Imagem,telegram,,5ad5c8bbe9da93a37fecf3e5aa5b0637


In [26]:
ids_para_remover = ['b73c0b674b28d87375d78dcae2f1a21f','62b3aa83e4df122e48cb1f97583e403f',
                    '893874da7344daaa00b8b5b3dc295b59','38737f3c7a07586c4efbfa39aa345705',
                    'da4cbbc1b7b1192ad83bcdae613ac2c3', 'bf66a467459264e0d33e4c8518a82827',
                    '46e009035e6150d656d0c194db88fb07','811541f6ce49347d1798e8dd2d3cbf83',
                    '1d2a0a63333d12ad188e9e6f7f2e0419','7c379613d4da713fe959d8c7ddc11ce2',
                    'debe17fd10d504076d2df8682f63bfc6','e9713ae04a02a810d6f33dd956f42794',
                    'd6c77928db26721ce46aca2d549780f0','8e53464d3b01eea3e39d07e51ecbb1b4',
                    'bacd40da04dd7d13f646993bdcf8e79d','2273d1167a6212812d95dc8fadbae78e',
                    'cd3bb1bdf75be7595e6373171a5c2225','add8c1ba533c5e5450d92c061a5ee7bf',
                    'e198f90df1995528531dd43db0c935ea', '06dc9ac55ed64caab2bd97e9ab717302',
                    'c0110feb539d212836605b66192722dd','f71912700ac5331415408ce229681359',
                    '2ee692357a9c948351c43a9540e859ae', '25b66278176dabe814dfc25a405a2470',
                    '08b21cb1e7de74ef5fe1085230075523']

In [27]:
# Filtrar o DataFrame para remover as linhas com esses IDs
df_filtrado_telegram = df_telegram[~df_telegram['id_member_anonymous'].isin(ids_para_remover)]
df_filtrado_telegram

Unnamed: 0,date_message,id_member_anonymous,id_group_anonymous,media,media_type,media_url,has_media,has_media_url,trava_zap,text_content_anonymous,dataset_info_id,date_system,score_sentiment,score_misinformation,id_message,id_persona,message_type,messenger,media_name,media_md5
0,2022-10-05 06:25:04,1078cc958f0febe28f4d03207660715f,12283e08a2eb5789201e105b34489ee7,,,,False,False,False,Ent√£o √© Fato Renato o √°udio que eu ouvi no wha...,5,2022-10-05 06:25:28.863641,0.0000,,16385,Wanda Silva,Texto,telegram,,
1,2022-10-05 06:25:08,,12283e08a2eb5789201e105b34489ee7,,,,False,False,False,"Saiu no YouTube do presidente a 8 horas atr√°s,...",5,2022-10-05 06:25:28.926311,0.0644,,16386,Wanda Silva,Texto,telegram,,
2,2022-10-05 06:26:28,92a2d8fd7144074f659d1d29dc3751da,9f2d7394334eb224c061c9740b5748fc,,,,False,False,False,"√â isso, nossa parte j√° foi quase toda feita. N...",5,2022-10-05 06:26:29.361949,-0.3551,0.157242,16366,Wanda Silva,Texto,telegram,,
3,2022-10-05 06:27:28,d60aa38f62b4977426b70944af4aff72,c8f2de56550ed0bf85249608b7ead93d,94dca4cda503100ebfda7ce2bcc060eb.jpg,image/jpg,,True,False,False,GENTE ACHEI ELES EM UMA SEITA MA√áON√ÅRICA,5,2022-10-05 06:27:29.935624,0.0000,,19281,Wanda Silva,Imagem,telegram,,94dca4cda503100ebfda7ce2bcc060eb
4,2022-10-05 06:27:44,cd6979b0b5265f08468fa1689b6300ce,e56ec342fc599ebb4ed89655eb6f03aa,5ad5c8bbe9da93a37fecf3e5aa5b0637.jpg,image/jpg,,True,False,False,,5,2022-10-05 06:28:29.316325,,,507185,Wanda Silva,Imagem,telegram,,5ad5c8bbe9da93a37fecf3e5aa5b0637
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
557581,2022-11-11 12:06:15,333e9869f23dbd4682d1be382d9c1e59,e56ec342fc599ebb4ed89655eb6f03aa,25e43b6a58b848c43ad5b5f9e979822a.jpg,url,https://terrabrasilnoticias.com/2022/11/bndes-...,True,True,False,"BNDES tem lucro de R$ 9,6 bilh√µes no terceiro ...",5,2022-11-16 14:49:39.146502,0.1027,,575796,Wanda Silva,Url,telegram,,25e43b6a58b848c43ad5b5f9e979822a
557582,2022-11-11 12:09:08,,5b10d7739171149be6d9961e3350c071,657949d03e4088f6b332e2686ccd3221.jpg,url,https://youtu.be/8g1Vz9_0xVk,True,True,False,https://youtu.be/8g1Vz9_0xVk,5,2022-11-16 14:49:39.847434,0.0000,,1286443,Wanda Silva,Url,telegram,,657949d03e4088f6b332e2686ccd3221
557583,2022-11-11 12:09:47,,1590a03f43b5ba4b6147a1c5e1dd357b,a21848a61045380a6483866daed0ca0e.jpg,image/jpg,https://t.me/vemprasruas,True,True,False,"Empres√°rios, demitam os petistas primeiro.\n\n...",5,2022-11-16 14:49:39.922279,0.0000,,13294,Wanda Silva,Imagem,telegram,,a21848a61045380a6483866daed0ca0e
557584,2022-11-11 12:09:46,,5b10d7739171149be6d9961e3350c071,a21848a61045380a6483866daed0ca0e.jpg,image/jpg,https://t.me/vemprasruas,True,True,False,"Empres√°rios, demitam os petistas primeiro.\n\n...",5,2022-11-16 14:49:39.992932,0.0000,,1286444,Wanda Silva,Imagem,telegram,,a21848a61045380a6483866daed0ca0e


In [28]:
# Removendo linhas com valores NaN na coluna 'text_content_anonymous'
df_filtrado_telegram = df_filtrado_telegram.dropna(subset=['text_content_anonymous'])

# Removendo trava_zap
df_filtrado_telegram = df_filtrado_telegram[df_filtrado_telegram['trava_zap'] == False]


len(df_filtrado_telegram)

443759

In [29]:

df_geral_telegram = df_filtrado_telegram.copy()

# Aplicar o pr√©-processamento √† coluna de texto
df_geral_telegram['text_processed'] = df_geral_telegram['text_content_anonymous'].apply(preprocess_text)

In [30]:
df_geral_telegram.head()

Unnamed: 0,date_message,id_member_anonymous,id_group_anonymous,media,media_type,media_url,has_media,has_media_url,trava_zap,text_content_anonymous,...,date_system,score_sentiment,score_misinformation,id_message,id_persona,message_type,messenger,media_name,media_md5,text_processed
0,2022-10-05 06:25:04,1078cc958f0febe28f4d03207660715f,12283e08a2eb5789201e105b34489ee7,,,,False,False,False,Ent√£o √© Fato Renato o √°udio que eu ouvi no wha...,...,2022-10-05 06:25:28.863641,0.0,,16385,Wanda Silva,Texto,telegram,,,entao fato renato audio ouvi whatsapp ocorreu ...
1,2022-10-05 06:25:08,,12283e08a2eb5789201e105b34489ee7,,,,False,False,False,"Saiu no YouTube do presidente a 8 horas atr√°s,...",...,2022-10-05 06:25:28.926311,0.0644,,16386,Wanda Silva,Texto,telegram,,,saiu presidente 8 horas atras infelizmente con...
2,2022-10-05 06:26:28,92a2d8fd7144074f659d1d29dc3751da,9f2d7394334eb224c061c9740b5748fc,,,,False,False,False,"√â isso, nossa parte j√° foi quase toda feita. N...",...,2022-10-05 06:26:29.361949,-0.3551,0.157242,16366,Wanda Silva,Texto,telegram,,,parte quase feita segundo turno completamos pa...
3,2022-10-05 06:27:28,d60aa38f62b4977426b70944af4aff72,c8f2de56550ed0bf85249608b7ead93d,94dca4cda503100ebfda7ce2bcc060eb.jpg,image/jpg,,True,False,False,GENTE ACHEI ELES EM UMA SEITA MA√áON√ÅRICA,...,2022-10-05 06:27:29.935624,0.0,,19281,Wanda Silva,Imagem,telegram,,94dca4cda503100ebfda7ce2bcc060eb,achei seita maconarica
5,2022-10-05 06:28:30,,b52442a5fbc459ae590dca0d215e32f9,,,,False,False,False,Kƒ∑kkkkk to rindo at√© agora....Quem disse q ia ...,...,2022-10-05 06:29:29.046694,0.7003,0.197813,2735,Wanda Silva,Texto,telegram,,,rindo agoraquem disse ia fazer acordo diabo pr...


In [31]:
df_geral_telegram.shape

(443759, 21)

In [32]:
palavras_religiosas = [
    "deus", "jesus", "misericordia", "davi",
    "salomao", "reino", "templo", "conservador",
    "pentecostal", "rcc", "renovacao", "carismatic",
    "paulo ricardo", "bernardo kuster", "herege", "ateu",
    "jerico", "heresia"
]

# Fun√ß√£o para verificar se uma palavra est√° relacionada √† religi√£o
def relacionada_religiao(word):
    word_lower = word.lower()
    palavras_religiosas_lower = [palavra.lower() for palavra in palavras_religiosas]

    # Verificando se alguma palavra da lista de palavras religiosas est√° presente
    return any(palavra in word_lower for palavra in palavras_religiosas_lower)


df_religiao_telegram = df_geral_telegram[df_geral_telegram['text_processed'].apply(lambda x: relacionada_religiao(x))]


In [33]:
palavras_politicas = [ "lula", "bolsonaro", "pt", "pl", "stf", "patria", "55", "22", "13", "senadores", "lulaladrao",
                       "urnas", "alexandre", "moraes", "comunismo", "eleicao", "eleicoes", "esquerda", "direita",
                         "presidente", "tse", "fraude", "voto", "turno", "ministro"]

def retirar_mensagens_com_palavras_politicas(word):
    word_lower = word.lower()
    palavras_politica_lower = [palavra.lower() for palavra in palavras_politicas]

    return any(palavra in word_lower for palavra in palavras_politica_lower)


df_politico_telegram = df_religiao_telegram[~df_religiao_telegram['text_processed'].apply(lambda x: retirar_mensagens_com_palavras_politicas(x))]

In [34]:

# Ativa barra de progresso no Pandas
tqdm.pandas()

# Lista para armazenar os resultados
results = []

# La√ßo com barra de progresso
for i, row in tqdm(df_politico_telegram.iterrows(), total=len(df_politico_telegram), desc="Analisando textos"):
    text = row['text_content_anonymous']
    scores = analyze_text(text)
    results.append(scores)
    time.sleep(1)  # opcional

# Transformar resultados em DataFrame
scores_df = pd.DataFrame(results)

# Concatenar com o DataFrame original
df_final_telegram = pd.concat([df_politico_telegram.reset_index(drop=True), scores_df], axis=1)

# Ver o resultado final
df_final_telegram.head()


Analisando textos:   1%|‚ñè         | 107/8526 [03:37<3:56:12,  1.68s/it]

Erro com texto: Tudo isso √© montagem e de p√©ssima qualid...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:   1%|‚ñè         | 108/8526 [03:38<3:49:22,  1.63s/it]

Erro com texto: O pr√≥prio nome dessa senhora serva de sa...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:   1%|‚ñè         | 109/8526 [03:40<4:10:11,  1.78s/it]

Erro com texto: Domingo aben√ßoado a todas mulheres linda...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:   3%|‚ñé         | 257/8526 [08:38<4:36:35,  2.01s/it]

Erro com texto: √â pra rir ou pra chorar?! üò∞
Tem Miseric√≥...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:   4%|‚ñç         | 348/8526 [11:38<4:36:26,  2.03s/it]

Erro com texto: MATEUS 7 1:5
N√ÉO OLHA PARA OS JULGAMENTO...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:   4%|‚ñç         | 350/8526 [11:42<4:40:58,  2.06s/it]

Erro com texto: Eles servem a satan√°s e n√£o sabem o que ...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:   5%|‚ñç         | 409/8526 [13:38<4:16:20,  1.89s/it]

Erro com texto: Bom dia irmaos paz pe√ßo a aten√ß√£o dos ir...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:   5%|‚ñç         | 412/8526 [13:44<4:31:14,  2.01s/it]

Erro com texto: Que ben√ß√£o,Deus est√° no controle do Bras...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:   5%|‚ñå         | 440/8526 [14:38<4:36:50,  2.05s/it]

Erro com texto: Exato, minha fam√≠lia √© toda do time do 9...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  11%|‚ñà         | 955/8526 [32:38<4:29:51,  2.14s/it] 

Erro com texto: Eu disse, no sentido do Cristianismo. O ...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  11%|‚ñà         | 956/8526 [32:40<4:06:49,  1.96s/it]

Erro com texto: üî¥ Assista, informe-se e ajude a comparti...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  15%|‚ñà‚ñå        | 1302/8526 [44:26<3:52:39,  1.93s/it]

Erro com texto: Dia 30 √© dia de jejum por nossa na√ß√£o e ...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  16%|‚ñà‚ñå        | 1353/8526 [46:06<3:55:00,  1.97s/it]

Erro com texto: meu Deus censuram o canal do Renato Barr...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  17%|‚ñà‚ñã        | 1432/8526 [48:41<4:03:23,  2.06s/it]

Erro com texto: miseric√≥rdia, qtas pessoas parecem zumbi...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  18%|‚ñà‚ñä        | 1524/8526 [51:45<3:49:21,  1.97s/it]

Erro com texto: Deus queira que isso n√£o aconte√ßa... Vam...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  18%|‚ñà‚ñä        | 1552/8526 [52:38<3:23:56,  1.75s/it]

Erro com texto: N√£o cumprimenta ningu√©m, nem o seu vice,...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  18%|‚ñà‚ñä        | 1556/8526 [52:47<4:06:11,  2.12s/it]

Erro com texto: Esse √© o v√≠deo que mostra bem no come√ßo ...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  19%|‚ñà‚ñâ        | 1599/8526 [54:10<3:52:40,  2.02s/it]

Erro com texto: Miseric√≥rdia que absurdo falar assim de ...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  21%|‚ñà‚ñà        | 1794/8526 [1:00:34<3:09:06,  1.69s/it]

Erro com texto: Censura ü§¨ pra n√≥s !!
Pinga pro molusco ü¶ë...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  21%|‚ñà‚ñà        | 1802/8526 [1:00:49<3:26:32,  1.84s/it]

Erro com texto: "...para as sociedades medievais e do in...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  21%|‚ñà‚ñà‚ñè       | 1832/8526 [1:01:45<3:19:48,  1.79s/it]

Erro com texto: Vejam isso! Meu Deus! Virou uma ditadura...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  22%|‚ñà‚ñà‚ñè       | 1859/8526 [1:02:34<3:11:27,  1.72s/it]

Erro com texto: V√≠deo de ,Jesus Cristo Vai Voltar,...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  22%|‚ñà‚ñà‚ñè       | 1876/8526 [1:03:03<2:59:02,  1.62s/it]

Erro com texto: _______

Est√° escrito na palavra de Deus...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  22%|‚ñà‚ñà‚ñè       | 1877/8526 [1:03:05<2:54:30,  1.57s/it]

Erro com texto: . 
‚ö†Ô∏è‚ö†Ô∏èüëÄ
‚ö°Ô∏è üá¨üáß

üî¥ üëâ EBS no Reino Unido üá¨...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  22%|‚ñà‚ñà‚ñè       | 1879/8526 [1:03:08<2:53:19,  1.56s/it]

Erro com texto: ‚ùóÔ∏èDrop 4429‚ùóÔ∏è

A Armadura de Deus
Seja f...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  22%|‚ñà‚ñà‚ñè       | 1880/8526 [1:03:10<3:13:08,  1.74s/it]

Erro com texto: Covarde... Confessar com boca somente aq...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  22%|‚ñà‚ñà‚ñè       | 1888/8526 [1:03:24<3:11:36,  1.73s/it]

Erro com texto: Bom acho que teremos que ir para as ruas...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  22%|‚ñà‚ñà‚ñè       | 1911/8526 [1:04:05<3:23:57,  1.85s/it]

Erro com texto: üá¨üáß - Liz Truss torna-se a primeira-minis...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  22%|‚ñà‚ñà‚ñè       | 1913/8526 [1:04:08<3:10:42,  1.73s/it]

Erro com texto: Bom dia!! Desejamos boas-vindas e que vo...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  22%|‚ñà‚ñà‚ñè       | 1916/8526 [1:04:13<3:00:13,  1.64s/it]

Erro com texto: üü°  Rea√ß√£o √† ren√∫ncia de Truss

Emmanuel ...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  22%|‚ñà‚ñà‚ñè       | 1917/8526 [1:04:15<3:18:43,  1.80s/it]

Erro com texto: Liz Truss renuncia ao cargo de primeira-...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  23%|‚ñà‚ñà‚ñé       | 1920/8526 [1:04:20<3:24:19,  1.86s/it]

Erro com texto: Muito obrigado pelo seu feedback, parab√©...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  23%|‚ñà‚ñà‚ñé       | 1929/8526 [1:04:37<3:22:39,  1.84s/it]

Erro com texto: Nossa Esperan√ßa √© Sua Vinda, o Rei dos r...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  24%|‚ñà‚ñà‚ñé       | 2008/8526 [1:07:12<3:30:50,  1.94s/it]

Erro com texto: Meu amigo, se prepare, fale enquanto pod...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  24%|‚ñà‚ñà‚ñç       | 2052/8526 [1:08:36<3:18:34,  1.84s/it]

Erro com texto: V√≠deo de Cleonice Deus √â  Fiel...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  24%|‚ñà‚ñà‚ñç       | 2054/8526 [1:08:39<3:02:45,  1.69s/it]

Erro com texto: Quero falar de um grupo de babacas que n...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  24%|‚ñà‚ñà‚ñç       | 2060/8526 [1:08:50<3:10:55,  1.77s/it]

Erro com texto: V√≠deo de Derci Amo ‚ù§Ô∏èJesusüôèüèºüåπ...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  25%|‚ñà‚ñà‚ñç       | 2101/8526 [1:10:14<4:13:43,  2.37s/it]

Erro com texto: minha hist√≥ria de vida hoje teria sido d...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  25%|‚ñà‚ñà‚ñå       | 2148/8526 [1:11:42<3:49:38,  2.16s/it]

Erro com texto: Quando voc√™ v√™ um √™xodo em massa de jude...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  25%|‚ñà‚ñà‚ñå       | 2149/8526 [1:11:44<3:49:17,  2.16s/it]

Erro com texto: https://www.correiobraziliense.com.br/po...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  28%|‚ñà‚ñà‚ñä       | 2416/8526 [1:20:38<3:01:24,  1.78s/it]

Erro com texto: ‚ö†Ô∏èüáßüá∑ "‚ÄúV√ÉO ENCONTRAR PROVAS‚Äù DEUS AVISOU...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  28%|‚ñà‚ñà‚ñä       | 2420/8526 [1:20:48<3:49:47,  2.26s/it]

Erro com texto: Irm√£os isso tudo √© verdade? estou em des...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  29%|‚ñà‚ñà‚ñâ       | 2507/8526 [1:23:40<3:27:40,  2.07s/it]

Erro com texto: MENAGEM AOS CRIST√ÉO DE TODAS AS DENOMINA...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  30%|‚ñà‚ñà‚ñâ       | 2536/8526 [1:24:36<3:32:33,  2.13s/it]

Erro com texto: gente o mourao adora o gmail ‚ùì‚ùì‚ùì‚ùì o baph...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  31%|‚ñà‚ñà‚ñà‚ñè      | 2670/8526 [1:29:07<2:56:45,  1.81s/it]

Erro com texto: ‚òëÔ∏è‚òëÔ∏è‚òëÔ∏è‚òëÔ∏è‚òëÔ∏è‚òëÔ∏èüåπüåπüåπüåπ
 Bom Dia Caros Assinant...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  31%|‚ñà‚ñà‚ñà‚ñè      | 2671/8526 [1:29:09<2:47:12,  1.71s/it]

Erro com texto: üå©

By Pepe 

O mundo est√° despertando.
D...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  32%|‚ñà‚ñà‚ñà‚ñè      | 2746/8526 [1:31:39<3:24:44,  2.13s/it]

Erro com texto: üå©

üè¶ üá¨üáß O Banco da Inglaterra estende ai...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  33%|‚ñà‚ñà‚ñà‚ñé      | 2795/8526 [1:33:15<2:59:00,  1.87s/it]

Erro com texto: 2019 - Denunciou Jo√£o de Deus...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  34%|‚ñà‚ñà‚ñà‚ñç      | 2911/8526 [1:37:07<3:00:52,  1.93s/it]

Erro com texto: O governo da Argentina est√° pedindo ao C...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos:  34%|‚ñà‚ñà‚ñà‚ñç      | 2918/8526 [1:37:21<3:19:30,  2.13s/it]

Erro com texto: Estas pessoas n√£o servem o nosso Deus ,n...
Erro: 429 Client Error: Too Many Requests for url: https://commentanalyzer.googleapis.com/v1alpha1/comments:analyze?key=AIzaSyCQXBfvKoDxM0m0Fd8Yc3kMVajQCe0uAiU


Analisando textos: 100%|‚ñà‚ñà‚ñà‚ñà‚ñà‚ñà‚ñà‚ñà‚ñà‚ñà| 8526/8526 [4:40:03<00:00,  1.97s/it]  


Unnamed: 0,date_message,id_member_anonymous,id_group_anonymous,media,media_type,media_url,has_media,has_media_url,trava_zap,text_content_anonymous,...,message_type,messenger,media_name,media_md5,text_processed,toxicity,insult,threat,profanity,identity_attack
0,2022-10-05 06:43:51,,99561fb8c30a84c837927176b102d5d5,b9cf0b8950c9c0cf18c62f1904472cc1.jpg,image/jpg,,True,False,False,"Feedback de Mateus Alves\n29 anos. Brasil, Par...",...,Imagem,telegram,,6a72ad1e5a9c7d7caf41ccaeddc35e52,feedback mateus alves 29 anos brasil parana po...,0.016022,0.009565,0.006842,0.019622,0.003404
1,2022-10-05 08:56:25,d87aad01c33013334c184d741b3986ad,b11f2df64ac19aad47a50accf32052d6,,,,False,False,False,"O Senhor, quando lembrou a Jac√≥ que, o nome de...",...,Texto,telegram,,,senhor lembrou jaco nome jaco jaco sim israel ...,0.049832,0.020515,0.006926,0.016172,0.034816
2,2022-10-05 08:56:24,d87aad01c33013334c184d741b3986ad,b11f2df64ac19aad47a50accf32052d6,4ac8be9d59dea0e35ff866eb4d752db1.jpg,image/jpg,,True,False,False,JAC√ì LUTOU COM DEUS E VENCEU - AS DUAS CASAS D...,...,Imagem,telegram,,4ac8be9d59dea0e35ff866eb4d752db1,jaco lutou deus venceu duas casas israel prome...,0.017341,0.008444,0.006512,0.010382,0.008768
3,2022-10-05 09:00:36,83f03c843a33c1933b0caf9252d97527,e3988dfe85b2ba2fa0499a428dd8a20a,,,,False,False,False,"BOM DIA\n\n""MANTER A ESPERAN√áA""\n\nS√≥ quem man...",...,Texto,telegram,,,manter esperanca mantem caridade mantem tambem...,0.013571,0.009565,0.005952,0.010638,0.004699
4,2022-10-05 09:07:29,,43da8c10b93fb7c9078577a567f68ebc,bf38cc385ba2ab65d4facb176ef50c0b.jpg,image/jpg,,True,False,False,"Muito obrigado pelo seu feedback, parab√©ns, co...",...,Imagem,telegram,,bf38cc385ba2ab65d4facb176ef50c0b,obrigado feedback parabens continue fazendo ne...,0.010179,0.007304,0.007055,0.015147,0.003441


In [35]:
df_final_telegram.to_csv('./resultado_api_perspective/faKeTelegram_API_Perspective.BR_2022.csv')