In [1]:
# Adjusting current working directory to parent directory
from pathlib import Path
from os import chdir
from platform import system

# Switch the working directory once per kernel session.
# `current_directory` doubles as the "already initialised" marker: it survives
# between executions of this cell, so re-running the cell does not climb
# another directory level. Presumably this makes the `src.*` imports and the
# relative CSV paths below resolve from the project root - confirm.
try:
    current_directory
except NameError:  # First run - initialize current_directory
    current_directory = Path.cwd()
    on_colab = False
    if system() == "Linux":  # Possibly Colab - confirm by importing its helper
        try:
            from google.colab import drive
            on_colab = True
        except ImportError:
            # Ordinary Linux machine: treat it like any other local checkout
            # instead of crashing on the missing Colab package.
            pass
    if on_colab:
        drive.mount('/content/drive')
        # Built with Path joins so the variable is a Path on every platform
        # (the resulting location is the same as the former f-string).
        current_directory = current_directory / "drive" / "MyDrive" / "Colab Notebooks" / "RecTour2024Challenge"
    else:
        current_directory = current_directory.parent

# Runs on every execution; after the first run it simply re-enters the
# directory chosen above.
chdir(current_directory)



# External imports
import pandas as pd
import numpy as np


# Internal imports
from src.data.csv_tools import csv_to_dataframe, dataframe_to_csv, save_submission
from src.data.pickle_tools import save_to_pickle, load_pickle
from src.data.keras_tools import save_keras_model, load_keras_model
from src.utils.preprocessing_tools import *

In [2]:
# Stitch the partial submission files SubmissionPart0.csv .. SubmissionPart19.csv
# back into a single frame, renumbering the rows from 0.
file_prefix = "SubmissionPart"

part_paths = [f"{file_prefix}{part_number}.csv" for part_number in range(20)]
dfs_list = list(map(pd.read_csv, part_paths))

concatenated_df = pd.concat(dfs_list, ignore_index=True)

In [4]:
# Sanity check: show (rows, columns) of the stitched frame.
concatenated_df.shape

(199138, 12)

In [5]:
# Hand the stitched frame to the project's submission writer.
# NOTE(review): output location and format are decided inside
# src.data.csv_tools.save_submission - not visible here, confirm.
save_submission(concatenated_df)

In [36]:
# Load the submission file from the out/ folder for inspection
# (presumably the file produced by save_submission - confirm).
# A forward slash is used because "\s" is an invalid string escape and a
# backslash separator only resolves on Windows; "/" works on Windows, Linux
# and Colab alike.
before_df = pd.read_csv("out/submission.csv")

In [37]:
# Display the loaded submission (pandas truncates the middle rows).
before_df

Unnamed: 0,ID,accommodation_id,user_id,review_1,review_2,review_3,review_4,review_5,review_6,review_7,review_8,review_9,review_10
0,1,2086452554,5f83c2ae-d803-4b4c-9d25-1226f90297ce,c2728aa2-bb2a-4213-83f3-9d222d0e8ee7,bef6e9c8-6684-4342-a90a-aabe33842034,7ecf0ac8-5ca5-4c37-9684-d941e2e25de4,a32fb7d0-0094-487a-979d-cf2a1477ef8e,4b5e6c8a-022c-4d4c-a48b-20ec834147fe,475cc7ad-814c-4a1f-908d-f84d3157a09e,5169c480-02af-4f20-b1a8-43e3c60aa54e,3d60e063-62ab-449e-943a-1df52dfb50ae,f6ffc11a-72c3-435c-b979-0adfca785734,102d0b69-9ddd-4325-82ae-56cd6dcf6e3b
1,2,-202362622,a194a2ef-9487-4cf0-8828-dd5803c8b9d1,da7c0021-f1d6-46a9-ad92-2e12ab0ac532,0e783796-c266-49cc-8a32-a5810cd974d4,ee634d44-e8bc-4025-a6fd-56eb582139e9,8dae5a9b-a7ec-4832-8268-705a988804b1,062cf4d0-96f2-4829-aac6-8e856ddd0675,c4d1101a-48ba-41ea-9792-a5c35e791741,8a08383a-b898-4d52-a4e2-e0ccc9857c5b,9737170f-7a42-4ec4-b61f-b5fd0eb75297,2390ba16-ad0a-4e55-ad88-896644b556f3,5331a5d3-761b-4b2c-bc92-6be1ffa97be4
2,3,-1390928232,cfb878d0-af56-4b0d-90ff-87095b1a56d6,7d76a628-cc4e-4878-b635-717000955191,37233246-2c25-4587-98d2-226810e2beb0,2dc633a9-41ed-4baf-a6f3-06bc4b63028f,a076c0fb-3eb9-4af3-86e9-5ab7e4563209,d423dac5-24f7-45c8-9121-a86af413faa0,b0a15004-66f4-4f00-b842-4d53ac944f7b,def0b28b-b2d0-44e5-b569-1d1407505a06,dbae01e2-627f-4e53-9d9e-05499b21e203,2b439689-e779-4f6e-bc20-0b1fb1490b74,d0f1cbfa-e137-4ba7-a411-828422b650c7
3,4,1007230055,19ffcbff-8500-482a-b5af-c55cb4235259,b3c1453c-441f-4295-accd-9a1e5c7281f8,b4e6ec65-11ed-4c4e-85c1-5542cb11e88a,7d2c70ab-05e3-4286-b6df-da37df928991,19b225e9-52c0-49e0-afd0-81ca0b47179e,264c7b34-12f4-4db3-bc6a-2940a3574746,4d1193bb-8875-4cc8-8757-6e125a709007,0a6db562-e884-4e8c-a31c-e847f9538280,c110d4e5-7b28-4d07-9d28-5914daa611b5,0ac123d1-b4f0-4836-b4e5-b10ba3508598,645e97b0-7adc-4812-b74a-6d5ec61df8b4
4,5,135365139,98d6a06b-131c-464d-86e7-b74dd4894ae2,f25d1abd-9f50-456d-92b3-52535b81cb82,4d8dc561-8628-413a-b696-a4c9aa752891,566ccbd5-ffad-41bd-8cd2-7b14c7007903,18485a5a-bf27-452f-9ec4-3f9be25dc9a2,dec68244-d0cb-4877-afbb-c7d0d54d1174,21bda358-dbaa-4ff5-ae04-9eea794be314,58817e53-35c7-4e90-aecc-03fc3bdb471a,d0cd3e25-685d-42bd-a7d8-c8e12a67e8e1,89cf2c04-56e2-4e35-ae4b-197033cf0291,e319c691-9e9a-4b08-9e23-3fc2178d9423
...,...,...,...,...,...,...,...,...,...,...,...,...,...
199133,199134,-1289007108,51bd5a4a-d30c-44bd-ac92-2547f04c0eb2,797d0343-f426-4060-96da-210898c77f2b,81e8f60a-f88a-4ee5-b613-a56e2a93ddcb,ab6cb8e6-0683-4494-b589-d5ce09db2dea,407fad0e-54ba-41c2-bdf6-2ce4f3c61104,d94fc74a-64b4-4a44-9cc3-bf6973dcd06c,db48d143-aac1-4ace-b1f5-75e2cc4bae48,cfdbea99-2262-4a92-b2cd-7a2ccd00b992,9a84228c-bc75-4267-aa4c-9aaa303b4bdd,06e1c1e1-2f44-4488-aa28-3b9c8dadbaac,5e642baf-b719-432e-b01c-c48705801477
199134,199135,1899287801,34eea0b9-90d4-43c9-bb87-72636cf866b7,ab52a870-b60b-495d-b115-985c3de89229,e633fefe-1e1d-4e70-816d-4d925ea2e404,34b81853-4d65-49e4-baff-aeacc3b809ab,d1cea374-3c7d-47ca-84ef-c6efb45552aa,13f831e2-29a0-4325-be8d-643c1df5dd5c,d0354f90-801a-4773-94f2-501d0430566b,3343a155-e3a3-41a6-8ff9-6d451554610c,bb405834-5ab4-42d1-8102-02246bb073e2,9d2cba08-51e2-47ec-8ed4-9afa3a5e1aea,c83eebfb-f7ad-41ce-a8de-a1500e38c294
199135,199136,-525864996,ee2fe24a-68f8-4633-8e5e-dd3eda402a65,be377698-eb69-42e7-a5bf-a61bc9e09772,29f81d7c-307f-429b-8bb0-212b8bea3ad7,8a75ea34-26cb-42e9-90df-e9539758bdb7,25a83b75-c5f1-42c4-b570-1ccaf0a484da,a4f600fe-af84-491b-8546-4fc7d9adfd2b,cdb5b392-8fe6-436c-9de4-dede80e6a82a,d3e1db39-6d33-4db3-889e-46ae02976cc2,78b1d072-3568-46a0-b363-20ef919c02f6,24737cd6-ecca-4b8c-9e94-07eb25d5da99,b1fc2354-9af6-4867-b404-ea8a782e268d
199136,199137,1007230055,3cbfa9e0-90bd-4414-ae0a-3d9777316a45,b4e6ec65-11ed-4c4e-85c1-5542cb11e88a,c110d4e5-7b28-4d07-9d28-5914daa611b5,1f127d8f-2ac9-4b76-8910-c8781855cfeb,f60bfcda-5abe-4954-aefb-e20f2b5fe8dc,12663a04-cf45-43ff-b03b-1f9d3852ea7a,45539ceb-4d7a-4b3b-a324-8e7e07c6967f,03e6ff55-ba6a-435b-9a4b-e87a8ded099e,4dc32edd-3fb9-4f48-932a-bb053c71e3e7,264c7b34-12f4-4db3-bc6a-2940a3574746,3b73a8ce-1c5b-437b-bce6-31f7ae25081e


In [32]:
# Reverse the order of the review columns (review_10 first, review_1 last)
# while keeping the two identifier columns in front.
# NOTE(review): sub_df is not created in any visible cell - confirm where it
# comes from before relying on Restart & Run All.
reversed_review_columns = [f"review_{rank}" for rank in range(10, 0, -1)]
sub_df = sub_df[["accommodation_id", "user_id", *reversed_review_columns]]

In [34]:
# Relabel the columns positionally as review_1 .. review_10 after the two
# identifier columns; the data stays where it is, only the headers change.
sub_df.columns = ["accommodation_id", "user_id"] + [f"review_{rank}" for rank in range(1, 11)]

In [38]:
# Write the relabelled frame through the project's submission writer.
# NOTE(review): presumably this overwrites the previously saved submission -
# confirm against src.data.csv_tools.save_submission.
save_submission(sub_df)