In [75]:
import pandas as pd
import os
import json
import datetime as dt
from dateutil import parser 
import re
from concurrent.futures import ThreadPoolExecutor
from utilities.preprocessors import normalize_and_clean, extract_keys_values, clean_and_split_data
from utilities.loaders import read_doc_files, read_rtf_files

%load_ext autoreload
%autoreload 2

The autoreload extension is already loaded. To reload it, use:
  %reload_ext autoreload


In [76]:
# Folder containing the raw .docx / .rtf dataset files, relative to the working directory.
input_dir = './rain input'
# os.listdir makes no ordering guarantee; sort the names so the listing (and every
# downstream step that iterates over `files`) is reproducible across runs and machines.
files = sorted(os.listdir(input_dir))
files

['Dataset#5405November 21 2024 kaidro AMA.docx',
 'Dataset#540911252024 kaidro game features.docx',
 'Dataset#5445WF Community Round Overview.rtf',
 'Dataset#5446alpha LLS test.rtf']

In [77]:
# Keep only the Word documents from the directory listing, then load them with the
# project loader. Judging by the output below, the result is a dict keyed by file name
# (extension dropped) whose values are lists of text lines.
docs_files = list(filter(lambda fname: fname.endswith('.docx'), files))
docs = read_doc_files(
    input_dir=input_dir,
    files=docs_files,
)
docs

{'Dataset#5405November 21 2024 kaidro AMA': ['Kaidro information center',
  '\nAnimation development will intensify next year, producer roles will kick in as we get a Pilot leaderboard',
  'small OPEN beta - January 2025',
  'bigger OPEN beta - Steam next fest; we already applied. February 5, 2025',
  'game launch - April 2025',
  'alpha mobile - April 2025',
  '',
  '2⃣ BURNING EVENT ',
  'November 28 to December 5',
  ' Adepts and Runners are involved',
  ' Reduce supply, get extra aKDR before TGE 👀',
  ' Limit for each category, check announcements',
  ' No limit for journals',
  ' Leaderboard will show you how many aKDR you earned from burning',
  " update on aKDR for burn, initially it's 50 but they listened to the community and it will be higher. Details next week. ",
  '',
  '3⃣ SYNERGY NUMBERS 🎰',
  ' coming out early next week',
  '',
  '4⃣ TOKEN GENERATION EVENT ($KDR) 🪙',
  ' DATE: mid-December',
  'TGE and Kaidro cinematic will be dropped on the same day. ',
  ' the cinemat

In [78]:
# Keep only the RTF files from the directory listing, then load them with the project
# loader. Judging by the output below, the result has the same shape as `docs`: a dict
# of file name (extension dropped) -> list of text lines.
rtf_files = list(filter(lambda fname: fname.endswith('.rtf'), files))
rtfs = read_rtf_files(
    input_dir=input_dir,
    files=rtf_files,
)
rtfs

{'Dataset#5445WF Community Round Overview': ['',
  '',
  '',
  ' Community Round Overview',
  'The Community Round token sale will take place on\xa0Impossible finance. Please ensure that you complete the KYC process beforehand, as it’s required for all.',
  'Token Sale Information:',
  'Token:\xa0$WF',
  'Supply:\xa044M tokens',
  'Price:\xa0$0.045 per token (FDV: $45M)',
  'Vesting:\xa020% available at TGE, 1 month lock, 5 months vesting',
  "Note:\xa0Please, due to current listing partner negotiations, we're under an embargo for revealing full tokenomics until early next week ",
  '',
  ' Structure of the Community Round',
  'The Community Round will have two main stages:',
  'ROUND 1️ – December 3, 2024',
  'Reserved for Ronin stakers, KOLs (Key Opinion Leaders), and the Impossible Finance community.',
  'Ronin Stakers:\xa0$500k',
  'KOLs: $400k',
  'Impossible Finance community: $100k',
  'ROUND 2️ – December 5, 2024',
  'Open to the entire Wild Forest community with specific alloc

In [79]:
# Destination folder for the cleaned output, relative to the working directory.
output_dir = './Rain output'

# Run every loaded .docx document through the cleaning/splitting helper, using
# normalize_and_clean as the per-line cleaner. The cleaned text printed below is
# emitted while this loop runs.
for doc_name, doc_lines in docs.items():
    clean_and_split_data(
        doc_name,
        doc_lines,
        output_dir=output_dir,
        cleaner=normalize_and_clean,
    )

kaidro information center
animation development will intensify next year, producer roles will kick in as we get a pilot leaderboard
small open beta january 2025
bigger open beta steam next fest; we already applied. february 5, 2025
game launch april 2025
alpha mobile april 2025
2 burning event
november 28 to december 5
adepts and runners are involved
reduce supply, get extra akdr before tge
limit for each category, check announcements
no limit for journals
leaderboard will show you how many akdr you earned from burning
update on akdr for burn, initially it is 50 but they listened to the community and it will be higher. details next week.
3 synergy numbers
coming out early next week
4 token generation event kdr
date: mid december
tge and kaidro cinematic will be dropped on the same day.
the cinematic will show the final quality of the animation. youtube and x it will run for 2 mins. paid ad will be deployed.
additional airdrops to nft holders may be before or after tge.
5 kaidro merch
h

In [80]:
# Same cleaning/splitting pass as for the .docx documents, applied to the loaded RTF
# files; results go to the same `output_dir`.
for rtf_name, rtf_lines in rtfs.items():
    clean_and_split_data(
        rtf_name,
        rtf_lines,
        output_dir=output_dir,
        cleaner=normalize_and_clean,
    )

community round overview
the community round token sale will take place on impossible finance. please ensure that you complete the kyc process beforehand, as it is required for all.
token sale information:
token: wf
supply: 44m tokens
price: 0.045 per token fdv: 45m
vesting: 20 percent available at tge, 1 month lock, 5 months vesting
note: please, due to current listing partner negotiations, we are under an embargo for revealing full tokenomics until early next week
structure of the community round
the community round will have two main stages:
round 1 december 3, 2024
reserved for ronin stakers, kols key opinion leaders , and the impossible finance community.
ronin stakers: 500000
kols: 400000
impossible finance community: 100000
round 2 december 5, 2024
open to the entire wild forest community with specific allocation pools for nft holders:
lord stakers: 600000 for 90 day staking participants
legendary unit nft holders: 150000
epic and legendary skin nft holders: 150000
lord soft sta

In [None]:
# NOTE(review): this cell has no execution count, yet the next cell calls read_files.
# On a fresh kernel it must be run first; consider moving this import into the
# import cell at the top of the notebook so Restart & Run All works.
from utilities.loaders import read_files

In [86]:
# Load every file in the listing through the combined loader. The output below shows
# the same dict shape as `docs` / `rtfs` (file name -> list of text lines).
# NOTE(review): presumably read_files dispatches on file extension — confirm in utilities.loaders.
loaded_files = read_files(input_dir, files)
loaded_files

{'Dataset#5405November 21 2024 kaidro AMA': ['Kaidro information center',
  '\nAnimation development will intensify next year, producer roles will kick in as we get a Pilot leaderboard',
  'small OPEN beta - January 2025',
  'bigger OPEN beta - Steam next fest; we already applied. February 5, 2025',
  'game launch - April 2025',
  'alpha mobile - April 2025',
  '',
  '2⃣ BURNING EVENT ',
  'November 28 to December 5',
  ' Adepts and Runners are involved',
  ' Reduce supply, get extra aKDR before TGE 👀',
  ' Limit for each category, check announcements',
  ' No limit for journals',
  ' Leaderboard will show you how many aKDR you earned from burning',
  " update on aKDR for burn, initially it's 50 but they listened to the community and it will be higher. Details next week. ",
  '',
  '3⃣ SYNERGY NUMBERS 🎰',
  ' coming out early next week',
  '',
  '4⃣ TOKEN GENERATION EVENT ($KDR) 🪙',
  ' DATE: mid-December',
  'TGE and Kaidro cinematic will be dropped on the same day. ',
  ' the cinemat

In [87]:
# Inspect the (file name, lines) pairs of the loaded data.
# NOTE(review): this prints the full contents of every file; consider previewing a
# slice instead to keep the notebook output small.
loaded_files.items()

dict_items([('Dataset#5405November 21 2024 kaidro AMA', ['Kaidro information center', '\nAnimation development will intensify next year, producer roles will kick in as we get a Pilot leaderboard', 'small OPEN beta - January 2025', 'bigger OPEN beta - Steam next fest; we already applied. February 5, 2025', 'game launch - April 2025', 'alpha mobile - April 2025', '', '2⃣ BURNING EVENT ', 'November 28 to December 5', ' Adepts and Runners are involved', ' Reduce supply, get extra aKDR before TGE 👀', ' Limit for each category, check announcements', ' No limit for journals', ' Leaderboard will show you how many aKDR you earned from burning', " update on aKDR for burn, initially it's 50 but they listened to the community and it will be higher. Details next week. ", '', '3⃣ SYNERGY NUMBERS 🎰', ' coming out early next week', '', '4⃣ TOKEN GENERATION EVENT ($KDR) 🪙', ' DATE: mid-December', 'TGE and Kaidro cinematic will be dropped on the same day. ', ' the cinematic will show the final quality o

In [88]:
from utilities.utilities import rename_all

In [89]:
# Derive the target folder from `output_dir` (set in the cleaning cell) instead of a
# machine-specific absolute path, so the notebook runs from any checkout location.
# NOTE(review): assumes the working directory is the project root that contains
# 'Rain output' — confirm. rename_all is a project helper; its renaming rules are
# not visible here.
rename_all(os.path.abspath(output_dir))