# Combine Labelled Title and Content Data (Vertical)

This notebook combines the Title and Content files **vertically** (stacking rows). Before concatenating, the first data row of the Content file (the row immediately after the CSV header) is removed.

In [5]:
import pandas as pd
import os

In [6]:
# Define file paths
file1_path = r'(A) Data/Need To Vote/Final Labelled_News Title_400 Data.csv'
file2_path = r'(A) Data/Need To Vote/Final Labelled_News Content_400 Data.csv'
output_path = r'(A) Data/Need To Vote/Combined_Labelled_Data.csv'

# Load the datasets.
# Later cells decide whether to run by checking that `df_title` / `df_content`
# exist in the namespace, so a failed load must not leave either name bound.
try:
    df_title = pd.read_csv(file1_path)
    df_content = pd.read_csv(file2_path)
except FileNotFoundError as e:
    # Drop both frames: this removes data left over from an earlier run of the
    # kernel as well as a title frame that loaded just before the content file
    # turned out to be missing. Otherwise the downstream existence checks would
    # pass and stale or mismatched data would be combined and saved.
    for _name in ('df_title', 'df_content'):
        globals().pop(_name, None)
    print(f"Error: {e}")
    print("Please check if the file paths are correct.")
else:
    # Only reached when both files were read successfully.
    print(f"Loaded Title data with shape: {df_title.shape}")
    print(f"Loaded Content data with shape: {df_content.shape}")

Loaded Title data with shape: (418, 7)
Loaded Content data with shape: (415, 7)


In [7]:
# Discard the leading data row of the Content frame before stacking
if 'df_content' in locals():
    df_content_modified = (
        df_content
        .iloc[1:]                  # positional slice: every row after position 0
        .reset_index(drop=True)    # renumber from 0 and discard the old index
    )
    print(f"Shape of Content data after removing 1st row: {df_content_modified.shape}")

Shape of Content data after removing 1st row: (414, 7)


In [8]:
# Stack the Title rows on top of the trimmed Content rows, preview, then save
if {'df_title', 'df_content_modified'}.issubset(locals()):
    # pd.concat stacks along rows by default; ignore_index=True gives the
    # result a fresh sequential index instead of repeating the input indexes
    combined_df = pd.concat(
        [df_title, df_content_modified],
        ignore_index=True,
    )

    print(f"Shape of combined dataframe: {combined_df.shape}")
    display(combined_df.head())

    # Write the stacked frame to disk without the index column
    combined_df.to_csv(output_path, index=False)
    print(f"Successfully saved combined file to: {output_path}")

Shape of combined dataframe: (832, 7)


Unnamed: 0,News_Data,1st Annotator,2nd Annotator,3rd Annotator,Voting Result,Final Take,Labelling
0,"Olahraga Pilates Makin Populer, Ini Deret Manf...",Positive,Positive,Positive,Positive,Positive,1
1,"Janice Tjen Luar Biasa, Lolos di 2 Nomor Final...",Positive,Positive,Positive,Positive,Positive,1
2,Siapakah Pasukan RSF yang Diduga Bantai Ribuan...,Negative,Negative,Neutral,Negative,Negative,-1
3,Pertamina Peduli Salurkan Bantuan untuk Korban...,Positive,Positive,Neutral,Positive,Positive,1
4,"Cuaca Panas, Hujan hingga Banjir Rob Bayangi S...",Negative,Negative,Neutral,Negative,Negative,-1


Successfully saved combined file to: (A) Data/Need To Vote/Combined_Labelled_Data.csv
