In [1]:
# 기본 라이브러리
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
import seaborn as sns

# 그래프 기본 테마 설정
sns.set()

# 그래프 기본 설정
plt.rcParams['font.family'] = 'Malgun Gothic'
plt.rcParams['figure.figsize'] = 12, 6
plt.rcParams['font.size'] = 14
plt.rcParams['axes.unicode_minus'] = False

# 복잡한 통계 처리를 위한 라이브러리
from scipy import stats

In [2]:
d2023 = pd.read_csv('data/2023.csv', encoding='cp949')
d2024 = pd.read_csv('data/2024.csv', encoding='utf-8')

d2023.info() # 16195 row * 365 columns
d2024.info() # 16216 row * 402 columns


  d2023 = pd.read_csv('data/2023.csv', encoding='cp949')


<class 'pandas.core.frame.DataFrame'>
RangeIndex: 16196 entries, 0 to 16195
Columns: 365 entries, pnid to weight
dtypes: float64(293), int64(71), object(1)
memory usage: 45.1+ MB
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 16216 entries, 0 to 16215
Columns: 402 entries, pnid to weight
dtypes: float64(348), int64(54)
memory usage: 49.7 MB


In [3]:
# 연도별 데이터에 year 컬럼 추기
d2023['year'] = 2023
d2024['year'] = 2024

In [4]:
# 2023
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.width', 1000)

# print(d2023.isna().sum())

# null값이 포함된 항목 중 제외 가능한 항목 넣기
keep = [
    "pnid",
    "RVIT",
    "Q11",
    "Q12a01", "Q12a02", "Q12a03", "Q12a04", "Q12a05", "Q12a06", "Q12a07", "Q12a08", "Q12a09", "Q12a10",
    "Q12a11", "Q12a12", "Q12a13", "Q12a14", "Q12a15", "Q12a16", "Q12a17", "Q12a18", "Q12a19", "Q12a20",
    "Q12a21", "Q12a22", "Q12a23", "Q12a24", "Q12a25", "Q12a26",
    "Q13", "Q14",
    "D_MON", "D_BUN", "D_NAT", "D_SEX", "D_AGE", "D_MOK",
    "weight",
    "여행사1인대체", "가이드1인대체", "숙박비1인대체", "음식점1인대체", "식음료1인대체", "한국한국1인대체", "한국국외1인대체", "한국수상1인대체",
    "한국철도1인대체", "한국도로1인대체", "대여서1인대체", "유류비1인대체", "문화서1인대체", "오락및1인대체",
    "쇼핑비1인대체", "데이터1인대체", "치료및1인대체", "미용서1인대체", "기타비1인대체", "총액1인TOT2",
    "M박HAP", "M일HAP",
    "Q9_2a01", "Q9_2a02", "Q9_2a03", "Q9_2a04", "Q9_2a05", "Q9_2a06", "Q9_2a07", "Q9_2a08",
    "Q9_2a09", "Q9_2a10", "Q9_2a11", "Q9_2a12", "Q9_2a13", "Q9_2a14", "Q9_2a15", "Q9_2a16", "Q9_2a17",
    "Q9_1_1",
    "Q8a01", "Q8a02", "Q8a03", "Q8a04", "Q8a05", "Q8a06", "Q8a07", "Q8a08", "Q8a09", "Q8a10",
    "Q8a11", "Q8a12", "Q8a13", "Q8a14", "Q8a15", "Q8a16", "Q8a17", "Q8a18", "Q8a19", "Q7A",
    "Q4_2a1", "Q4_2a2", "Q4_2a3", "Q4_2a_dk", "Q4_1a1", "Q4a1",
    "Q3_2a1", "Q3_1a1",
    "TYP", "Q1", "Q1_1a1", "Q1_1a2", "Q1_1a3", "year"
]

d23 = d2023[keep]
d23.head()
d23.info() # 117 columns

new_name = {
    "pnid": "id",
    "RVIT": "revisit_num",
    "Q11": "satis_overall",
    "Q12a01": "satis_food",
    "Q12a02": "satis_shop",
    "Q12a03": "satis_nature",
    "Q12a04": "satis_history",
    "Q12a05": "satis_tradition",
    "Q12a06": "satis_gallery",
    "Q12a07": "satis_kpop",
    "Q12a08": "satis_performance",
    "Q12a09": "satis_festival",
    "Q12a10": "satis_fun",
    "Q12a11": "satis_entertainment",
    "Q12a12": "satis_beauty",
    "Q12a13": "satis_heal",
    "Q12a14": "satis_sport_view",
    "Q12a15": "satis_sport_part",
    "Q12a16": "satis_immigration",
    "Q12a17": "satis_safe",
    "Q12a18": "satis_expense",
    "Q12a19": "satis_sleep",
    "Q12a20": "satis_transport",
    "Q12a21": "satis_map",
    "Q12a22": "satis_guide_public",
    "Q12a23": "satis_mobile",
    "Q12a24": "satis_other",
    "Q12a25": "satis_guide_digital",
    "Q12a26": "satis_guide_private",
    "Q13": "revisit_think",
    "Q14": "recommend_think",
    "D_MON": "month",
    "D_BUN": "quarter",
    "D_NAT": "nationality",
    "D_SEX": "sex",
    "D_AGE": "age",
    "D_MOK": "purpose",
    "D_NUM": "duration",
    "D_GUB": "group_type",
    "weight": "weight",
    "여행사1인대체": "money_agency",
    "가이드1인대체": "money_guide",
    "숙박비1인대체": "money_stay",
    "음식점1인대체": "money_food",
    "식음료1인대체": "money_cafe",
    "국제한국1인대체": "money_airport_int_korea",
    "국제국외1인대체": "money_airport_int_foreign",
    "국제수상1인대체": "money_ship_foreign",
    "한국한국1인대체": "money_airplane_high",
    "한국국외1인대체": "money_airplane_low",
    "한국수상1인대체": "money_ship",
    "한국철도1인대체": "money_train",
    "한국도로1인대체": "money_road",
    "대여서1인대체": "money_rent",
    "유류비1인대체": "money_oil",
    "문화서1인대체": "money_culture",
    "오락및1인대체": "money_entertainment",
    "쇼핑비1인대체": "money_shop",
    "데이터1인대체": "money_lte",
    "치료및1인대체": "money_heal",
    "미용서1인대체": "money_beauty",
    "기타비1인대체": "money_etc",
    "총액1인TOT2": "money_total",
    "M박HAP": "stay_night",
    "M일HAP": "stay_total",
    "Q9_2a01": "seoul",
    "Q9_2a02": "gyeonggi",
    "Q9_2a03": "incheon",
    "Q9_2a04": "gangwon",
    "Q9_2a05": "daejeon",
    "Q9_2a06": "chungbuk",
    "Q9_2a07": "chungnam",
    "Q9_2a08": "sejong",
    "Q9_2a09": "gyeongbuk",
    "Q9_2a10": "gyeongnam",
    "Q9_2a11": "daegu",
    "Q9_2a12": "ulsan",
    "Q9_2a13": "busan",
    "Q9_2a14": "gwangju",
    "Q9_2a15": "jeonbuk",
    "Q9_2a16": "jeonnam",
    "Q9_2a17": "jeju",
    "Q9_1_1": "favorite_place",
    "Q8a01": "part_food",
    "Q8a02": "part_shop",
    "Q8a03": "part_nature",
    "Q8a04": "part_history",
    "Q8a05": "part_tradition",
    "Q8a06": "part_gallery",
    "Q8a07": "part_kpop",
    "Q8a08": "part_performance",
    "Q8a09": "part_festival",
    "Q8a10": "part_fun",
    "Q8a11": "part_entertainment",
    "Q8a12": "part_beauty",
    "Q8a13": "part_heal",
    "Q8a14": "part_sport_view",
    "Q8a15": "part_sport_part",
    "Q8a16": "part_conference",
    "Q8a17": "part_business",
    "Q8a18": "part_study",
    "Q8a19": "part_etc",
    "MQ7_1": "group_size",
    "Q7A": "companion",
    "Q4_2a1": "lack_info1",
    "Q4_2a2": "lack_info2",
    "Q4_2a3": "lack_info3",
    "Q4_2a_dk": "lack_info_unknown",
    "Q4_1a1": "collect_site",
    "Q4a1": "info_collect",
    "Q3_2a1": "infra",
    "Q3_1a1": "activity",
    "TYP": "type",
    "Q1": "main_purpose",
    "Q1_1a1": "interest1",
    "Q1_1a2": "interest2",
    "Q1_1a3": "interest3",
    "year" : "year"
}

d23 = d23.rename(columns=new_name)
d23.head()


<class 'pandas.core.frame.DataFrame'>
RangeIndex: 16196 entries, 0 to 16195
Columns: 112 entries, pnid to year
dtypes: float64(83), int64(29)
memory usage: 13.8 MB


Unnamed: 0,id,revisit_num,satis_overall,satis_food,satis_shop,satis_nature,satis_history,satis_tradition,satis_gallery,satis_kpop,satis_performance,satis_festival,satis_fun,satis_entertainment,satis_beauty,satis_heal,satis_sport_view,satis_sport_part,satis_immigration,satis_safe,satis_expense,satis_sleep,satis_transport,satis_map,satis_guide_public,satis_mobile,satis_other,satis_guide_digital,satis_guide_private,revisit_think,recommend_think,month,quarter,nationality,sex,age,purpose,weight,money_agency,money_guide,money_stay,money_food,money_cafe,money_airplane_high,money_airplane_low,money_ship,money_train,money_road,money_rent,money_oil,money_culture,money_entertainment,money_shop,money_lte,money_heal,money_beauty,money_etc,money_total,stay_night,stay_total,seoul,gyeonggi,incheon,gangwon,daejeon,chungbuk,chungnam,sejong,gyeongbuk,gyeongnam,daegu,ulsan,busan,gwangju,jeonbuk,jeonnam,jeju,favorite_place,part_food,part_shop,part_nature,part_history,part_tradition,part_gallery,part_kpop,part_performance,part_festival,part_fun,part_entertainment,part_beauty,part_heal,part_sport_view,part_sport_part,part_conference,part_business,part_study,part_etc,companion,lack_info1,lack_info2,lack_info3,lack_info_unknown,collect_site,info_collect,infra,activity,type,main_purpose,interest1,interest2,interest3,year
0,6,4,5,5.0,5.0,,,,,,5.0,,,,,,,,5,5,5,5,5,5,5,5,5,5,,5,5,1,1,3,2,2,1,866.099893,0.0,0.0,123.53,308.82,46.32,0.0,0,0.0,54.04,77.2,0.0,0.0,23.16,0.0,386.02,20.07,54.04,0.0,0.0,1633.64,26,27,1.0,,,4.0,,,,,,,,,,,,,,11040,1.0,2.0,,,,,,8.0,,,,,,,,,,,,1,8.0,6.0,,,2.0,1.0,6.0,1.0,1,1,2.0,3.0,4.0,2023
1,7,4,5,,5.0,5.0,,,,,,,,5.0,,,,,5,5,5,5,5,5,5,5,5,5,,5,5,1,1,1,1,3,2,191.333757,0.0,0.0,0.0,772.04,0.0,0.0,0,0.0,0.0,0.0,0.0,77.2,0.0,0.0,772.04,0.0,0.0,0.0,0.0,2007.3,6,7,1.0,,,,,,,,,,,,,,,,,11521,,2.0,3.0,,,,,,,,11.0,,,,,,,,,1,,,,11.0,6.0,3.0,3.0,3.0,1,2,2.0,9.0,7.0,2023
2,8,2,5,5.0,,,,,,,,,,,,,,,5,4,4,5,5,5,5,5,5,5,,5,5,1,1,4,2,1,5,244.838755,0.0,0.0,100.0,50.0,0.0,0.0,0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1650.0,1,2,,,3.0,,,,,,,,,,,,,,,28003,1.0,,,,,,,,,,,,,,,,,,,1,5.0,,,,,4.0,,,1,5,,,,2023
3,10,1,5,,,,5.0,,,,,,,,,,,5.0,5,5,5,5,5,4,5,9,5,5,,4,4,1,1,5,1,5,3,555.272342,0.0,0.0,1921.5,640.5,0.0,0.0,0,0.0,0.0,256.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3586.8,7,8,1.0,,,,,,,,,,,,,,,,,11071,,,,4.0,,,,,,,,,,,15.0,16.0,,,,1,,,,11.0,,4.0,,,1,3,,,,2023
4,11,3,4,5.0,5.0,,5.0,,,,,,,,,,,,5,5,5,5,5,5,5,5,5,5,,5,5,1,1,1,2,4,2,193.434506,0.0,0.0,0.0,433.2,0.0,0.0,0,0.0,0.0,14.44,0.0,0.0,0.0,0.0,1155.2,43.32,0.0,0.0,0.0,2151.56,70,71,1.0,,3.0,,,,,,,,,,,,,,,11012,1.0,2.0,,4.0,,,,,,,,,,,,,,,,1,,,,11.0,,4.0,3.0,2.0,1,2,8.0,3.0,7.0,2023


In [5]:
# 2024
pd.set_option('display.max_columns', None)
pd.set_option('display.max_rows', None)
pd.set_option('display.width', 1000)

# null값이 포함된 항목 중 제외 가능한 항목 넣기
keep = [
    "pnid",
    "RVIT",
    "Q11",
    "Q12a01", "Q12a02", "Q12a03", "Q12a04", "Q12a05", "Q12a06", "Q12a07", "Q12a08", "Q12a09", "Q12a10",
    "Q12a11", "Q12a12", "Q12a13", "Q12a14", "Q12a15", "Q12a16", "Q12a17", "Q12a18", "Q12a19", "Q12a20",
    "Q12a21", "Q12a22", "Q12a23", "Q12a24", "Q12a25", "Q12a26",
    "Q13", "Q14",
    "D_MON", "D_BUN", "D_NAT", "D_SEX", "D_AGE", "D_MOK",
    "weight",
    "여행사1인대체", "가이드1인대체", "숙박비1인대체", "음식점1인대체", "식음료1인대체", "한국한국1인대체", "한국국외1인대체", "한국수상1인대체",
    "한국철도1인대체", "한국도로1인대체", "대여서1인대체", "유류비1인대체", "문화서1인대체", "오락및1인대체",
    "쇼핑비1인대체", "데이터1인대체", "치료및1인대체", "미용서1인대체", "기타비1인대체", "총액1인TOT2",
    "M박HAP", "M일HAP",
    "Q9_2a01", "Q9_2a02", "Q9_2a03", "Q9_2a04", "Q9_2a05", "Q9_2a06", "Q9_2a07", "Q9_2a08",
    "Q9_2a09", "Q9_2a10", "Q9_2a11", "Q9_2a12", "Q9_2a13", "Q9_2a14", "Q9_2a15", "Q9_2a16", "Q9_2a17",
    "Q9_1_1",
    "Q8a01", "Q8a02", "Q8a03", "Q8a04", "Q8a05", "Q8a06", "Q8a07", "Q8a08", "Q8a09", "Q8a10",
    "Q8a11", "Q8a12", "Q8a13", "Q8a14", "Q8a15", "Q8a16", "Q8a17", "Q8a18", "Q8a19", "Q7A",
    "Q4_2a1", "Q4_2a2", "Q4_2a3", "Q4_2a_dk", "Q4_1a1", "Q4a1",
    "Q3_2a1", "Q3_1a1",
    "TYP", "Q1", "Q1_1a1", "Q1_1a2", "Q1_1a3", "year"
]

d24 = d2024[keep]
d24.head()
d24.info() # 117 columns

new_name = {
    "pnid": "id",
    "RVIT": "revisit_num",
    "Q11": "satis_overall",
    "Q12a01": "satis_food",
    "Q12a02": "satis_shop",
    "Q12a03": "satis_nature",
    "Q12a04": "satis_history",
    "Q12a05": "satis_tradition",
    "Q12a06": "satis_gallery",
    "Q12a07": "satis_kpop",
    "Q12a08": "satis_performance",
    "Q12a09": "satis_festival",
    "Q12a10": "satis_fun",
    "Q12a11": "satis_entertainment",
    "Q12a12": "satis_beauty",
    "Q12a13": "satis_heal",
    "Q12a14": "satis_sport_view",
    "Q12a15": "satis_sport_part",
    "Q12a16": "satis_immigration",
    "Q12a17": "satis_safe",
    "Q12a18": "satis_expense",
    "Q12a19": "satis_sleep",
    "Q12a20": "satis_transport",
    "Q12a21": "satis_map",
    "Q12a22": "satis_guide_public",
    "Q12a23": "satis_mobile",
    "Q12a24": "satis_other",
    "Q12a25": "satis_guide_digital",
    "Q12a26": "satis_guide_private",
    "Q13": "revisit_think",
    "Q14": "recommend_think",
    "D_MON": "month",
    "D_BUN": "quarter",
    "D_NAT": "nationality",
    "D_SEX": "sex",
    "D_AGE": "age",
    "D_MOK": "purpose",
    "D_NUM": "duration",
    "D_GUB": "group_type",
    "weight": "weight",
    "여행사1인대체": "money_agency",
    "가이드1인대체": "money_guide",
    "숙박비1인대체": "money_stay",
    "음식점1인대체": "money_food",
    "식음료1인대체": "money_cafe",
    "국제한국1인대체": "money_airport_int_korea",
    "국제국외1인대체": "money_airport_int_foreign",
    "국제수상1인대체": "money_ship_foreign",
    "한국한국1인대체": "money_airplane_high",
    "한국국외1인대체": "money_airplane_low",
    "한국수상1인대체": "money_ship",
    "한국철도1인대체": "money_train",
    "한국도로1인대체": "money_road",
    "대여서1인대체": "money_rent",
    "유류비1인대체": "money_oil",
    "문화서1인대체": "money_culture",
    "오락및1인대체": "money_entertainment",
    "쇼핑비1인대체": "money_shop",
    "데이터1인대체": "money_lte",
    "치료및1인대체": "money_heal",
    "미용서1인대체": "money_beauty",
    "기타비1인대체": "money_etc",
    "총액1인TOT2": "money_total",
    "M박HAP": "stay_night",
    "M일HAP": "stay_total",
    "Q9_2a01": "seoul",
    "Q9_2a02": "gyeonggi",
    "Q9_2a03": "incheon",
    "Q9_2a04": "gangwon",
    "Q9_2a05": "daejeon",
    "Q9_2a06": "chungbuk",
    "Q9_2a07": "chungnam",
    "Q9_2a08": "sejong",
    "Q9_2a09": "gyeongbuk",
    "Q9_2a10": "gyeongnam",
    "Q9_2a11": "daegu",
    "Q9_2a12": "ulsan",
    "Q9_2a13": "busan",
    "Q9_2a14": "gwangju",
    "Q9_2a15": "jeonbuk",
    "Q9_2a16": "jeonnam",
    "Q9_2a17": "jeju",
    "Q9_1_1": "favorite_place",
    "Q8a01": "part_food",
    "Q8a02": "part_shop",
    "Q8a03": "part_nature",
    "Q8a04": "part_history",
    "Q8a05": "part_tradition",
    "Q8a06": "part_gallery",
    "Q8a07": "part_kpop",
    "Q8a08": "part_performance",
    "Q8a09": "part_festival",
    "Q8a10": "part_fun",
    "Q8a11": "part_entertainment",
    "Q8a12": "part_beauty",
    "Q8a13": "part_heal",
    "Q8a14": "part_sport_view",
    "Q8a15": "part_sport_part",
    "Q8a16": "part_conference",
    "Q8a17": "part_business",
    "Q8a18": "part_study",
    "Q8a19": "part_etc",
    "MQ7_1": "group_size",
    "Q7A": "companion",
    "Q4_2a1": "lack_info1",
    "Q4_2a2": "lack_info2",
    "Q4_2a3": "lack_info3",
    "Q4_2a_dk": "lack_info_unknown",
    "Q4_1a1": "collect_site",
    "Q4a1": "info_collect",
    "Q3_2a1": "infra",
    "Q3_1a1": "activity",
    "TYP": "type",
    "Q1": "main_purpose",
    "Q1_1a1": "interest1",
    "Q1_1a2": "interest2",
    "Q1_1a3": "interest3",
    "year" : "year"
}

d24 = d24.rename(columns=new_name)
d24.head()


<class 'pandas.core.frame.DataFrame'>
RangeIndex: 16216 entries, 0 to 16215
Columns: 112 entries, pnid to year
dtypes: float64(84), int64(28)
memory usage: 13.9 MB


Unnamed: 0,id,revisit_num,satis_overall,satis_food,satis_shop,satis_nature,satis_history,satis_tradition,satis_gallery,satis_kpop,satis_performance,satis_festival,satis_fun,satis_entertainment,satis_beauty,satis_heal,satis_sport_view,satis_sport_part,satis_immigration,satis_safe,satis_expense,satis_sleep,satis_transport,satis_map,satis_guide_public,satis_mobile,satis_other,satis_guide_digital,satis_guide_private,revisit_think,recommend_think,month,quarter,nationality,sex,age,purpose,weight,money_agency,money_guide,money_stay,money_food,money_cafe,money_airplane_high,money_airplane_low,money_ship,money_train,money_road,money_rent,money_oil,money_culture,money_entertainment,money_shop,money_lte,money_heal,money_beauty,money_etc,money_total,stay_night,stay_total,seoul,gyeonggi,incheon,gangwon,daejeon,chungbuk,chungnam,sejong,gyeongbuk,gyeongnam,daegu,ulsan,busan,gwangju,jeonbuk,jeonnam,jeju,favorite_place,part_food,part_shop,part_nature,part_history,part_tradition,part_gallery,part_kpop,part_performance,part_festival,part_fun,part_entertainment,part_beauty,part_heal,part_sport_view,part_sport_part,part_conference,part_business,part_study,part_etc,companion,lack_info1,lack_info2,lack_info3,lack_info_unknown,collect_site,info_collect,infra,activity,type,main_purpose,interest1,interest2,interest3,year
0,57,4,5,,5.0,5.0,,,,,,,,,,,,,,5,5,5,5,5,5,5,5,5,5,5,5,1,1,13,2,5,1,198.02,,10.0,1000.0,500.0,100.0,0.0,0.0,0.0,50.0,100.0,0.0,0.0,0.0,50.0,500.0,0.0,0.0,0.0,0.0,2710.0,5,6,1.0,,,,,,,,,,,,,,,,,11001,,2.0,3.0,,,,,,,,,,,,,,,,,2,,,,11.0,1.0,1.0,3.0,1.0,1,1,7.0,,,2024
1,58,4,5,5.0,5.0,,,4.0,,,,,,,,,,,,4,4,4,4,4,4,4,4,4,4,5,5,1,1,3,2,4,1,784.28,,0.08,202.46,121.48,0.0,0.0,0.0,0.0,0.0,24.3,0.0,0.0,4.05,0.0,485.91,8.1,0.0,0.0,0.0,1364.68,4,5,1.0,,,,,,,,,,,,,,,,,11001,1.0,2.0,,,5.0,,,,,,,,,,,,,,,2,,,,11.0,5.0,1.0,6.0,11.0,1,1,7.0,10.0,2.0,2024
2,59,3,4,5.0,5.0,,,,,,,,,,5.0,,,,,5,3,5,5,5,5,3,5,5,5,4,4,1,1,3,2,3,1,607.02,,0.16,161.48,161.48,16.15,0.0,0.0,0.0,8.07,32.3,0.0,0.0,0.0,32.3,322.95,8.07,0.0,0.0,0.0,1065.9,5,6,1.0,,,,,,,,,,,,,,,,,41001,1.0,2.0,,,,,,,,,,12.0,,,,,,,,2,,,,11.0,,4.0,2.0,12.0,1,1,7.0,2.0,8.0,2024
3,60,1,5,5.0,,5.0,,5.0,,,,,,5.0,,,,,,5,5,5,5,5,5,5,5,5,5,5,5,1,1,1,1,2,1,1049.5,,1.4,279.18,209.38,0.0,0.0,0.0,0.0,69.79,27.92,0.0,0.0,0.0,0.0,139.59,0.0,0.0,0.0,0.0,922.68,5,6,1.0,,,,,,,,,,,,,,,,,11001,1.0,,3.0,,5.0,,,,,,11.0,,,,,,,,,1,,,,11.0,5.0,4.0,2.0,11.0,1,1,8.0,7.0,3.0,2024
4,61,4,4,,4.0,,,4.0,,,,,,,4.0,,,,,4,3,4,4,4,4,3,4,4,4,5,5,1,1,3,2,2,1,876.8,,0.32,161.47,32.29,16.15,0.0,0.0,0.0,32.29,32.29,0.0,0.0,0.0,0.0,968.81,16.15,0.0,0.0,0.0,1647.3,4,5,1.0,2.0,,,,,,,,,,,,,,,,11506,,2.0,,,5.0,,,,,,,12.0,,,,,,,,2,,,,11.0,,3.0,4.0,1.0,1,1,2.0,9.0,10.0,2024


In [6]:
d2324 = pd.concat([d23, d24], ignore_index=True)
d2324.head()

Unnamed: 0,id,revisit_num,satis_overall,satis_food,satis_shop,satis_nature,satis_history,satis_tradition,satis_gallery,satis_kpop,satis_performance,satis_festival,satis_fun,satis_entertainment,satis_beauty,satis_heal,satis_sport_view,satis_sport_part,satis_immigration,satis_safe,satis_expense,satis_sleep,satis_transport,satis_map,satis_guide_public,satis_mobile,satis_other,satis_guide_digital,satis_guide_private,revisit_think,recommend_think,month,quarter,nationality,sex,age,purpose,weight,money_agency,money_guide,money_stay,money_food,money_cafe,money_airplane_high,money_airplane_low,money_ship,money_train,money_road,money_rent,money_oil,money_culture,money_entertainment,money_shop,money_lte,money_heal,money_beauty,money_etc,money_total,stay_night,stay_total,seoul,gyeonggi,incheon,gangwon,daejeon,chungbuk,chungnam,sejong,gyeongbuk,gyeongnam,daegu,ulsan,busan,gwangju,jeonbuk,jeonnam,jeju,favorite_place,part_food,part_shop,part_nature,part_history,part_tradition,part_gallery,part_kpop,part_performance,part_festival,part_fun,part_entertainment,part_beauty,part_heal,part_sport_view,part_sport_part,part_conference,part_business,part_study,part_etc,companion,lack_info1,lack_info2,lack_info3,lack_info_unknown,collect_site,info_collect,infra,activity,type,main_purpose,interest1,interest2,interest3,year
0,6,4,5,5.0,5.0,,,,,,5.0,,,,,,,,5.0,5,5,5,5,5,5,5,5,5,,5,5,1,1,3,2,2,1,866.099893,0.0,0.0,123.53,308.82,46.32,0.0,0.0,0.0,54.04,77.2,0.0,0.0,23.16,0.0,386.02,20.07,54.04,0.0,0.0,1633.64,26,27,1.0,,,4.0,,,,,,,,,,,,,,11040,1.0,2.0,,,,,,8.0,,,,,,,,,,,,1,8.0,6.0,,,2.0,1.0,6.0,1.0,1,1,2.0,3.0,4.0,2023
1,7,4,5,,5.0,5.0,,,,,,,,5.0,,,,,5.0,5,5,5,5,5,5,5,5,5,,5,5,1,1,1,1,3,2,191.333757,0.0,0.0,0.0,772.04,0.0,0.0,0.0,0.0,0.0,0.0,0.0,77.2,0.0,0.0,772.04,0.0,0.0,0.0,0.0,2007.3,6,7,1.0,,,,,,,,,,,,,,,,,11521,,2.0,3.0,,,,,,,,11.0,,,,,,,,,1,,,,11.0,6.0,3.0,3.0,3.0,1,2,2.0,9.0,7.0,2023
2,8,2,5,5.0,,,,,,,,,,,,,,,5.0,4,4,5,5,5,5,5,5,5,,5,5,1,1,4,2,1,5,244.838755,0.0,0.0,100.0,50.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,1650.0,1,2,,,3.0,,,,,,,,,,,,,,,28003,1.0,,,,,,,,,,,,,,,,,,,1,5.0,,,,,4.0,,,1,5,,,,2023
3,10,1,5,,,,5.0,,,,,,,,,,,5.0,5.0,5,5,5,5,4,5,9,5,5,,4,4,1,1,5,1,5,3,555.272342,0.0,0.0,1921.5,640.5,0.0,0.0,0.0,0.0,0.0,256.2,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,0.0,3586.8,7,8,1.0,,,,,,,,,,,,,,,,,11071,,,,4.0,,,,,,,,,,,15.0,16.0,,,,1,,,,11.0,,4.0,,,1,3,,,,2023
4,11,3,4,5.0,5.0,,5.0,,,,,,,,,,,,5.0,5,5,5,5,5,5,5,5,5,,5,5,1,1,1,2,4,2,193.434506,0.0,0.0,0.0,433.2,0.0,0.0,0.0,0.0,0.0,14.44,0.0,0.0,0.0,0.0,1155.2,43.32,0.0,0.0,0.0,2151.56,70,71,1.0,,3.0,,,,,,,,,,,,,,,11012,1.0,2.0,,4.0,,,,,,,,,,,,,,,,1,,,,11.0,,4.0,3.0,2.0,1,2,8.0,3.0,7.0,2023


In [7]:
d2324.to_csv('data/d2324.csv')