In [None]:
# Inspect the runtime type of `ranker`; the recorded cell output reports lightgbm.basic.Booster.
type(ranker)

lightgbm.basic.Booster

In [1]:
import os
import pandas as pd

def split_csv(file_path, output_dir, rows_per_chunk=10000):
    """
    Split a CSV file into numbered chunk files of at most ``rows_per_chunk`` rows.

    The source is read lazily, one chunk at a time, so the whole file is never
    held in memory. Each chunk is written to ``output_dir`` as
    ``chunk_000.csv``, ``chunk_001.csv``, ... with its own header row and
    without the pandas index column. A "Saved: ..." line is printed for every
    chunk file written.

    Files already present in ``output_dir`` are not deleted, so chunk files
    left over from an earlier, larger split remain next to the new ones.

    Args:
        file_path (str): Path to the original CSV file.
        output_dir (str): Directory to store the chunk files; created
            (including parents) if it does not exist.
        rows_per_chunk (int): Maximum number of data rows per chunk file.
    """
    os.makedirs(output_dir, exist_ok=True)

    # Use the reader as a context manager so the source file handle is closed
    # even when writing one of the chunks fails part-way through the split.
    with pd.read_csv(file_path, chunksize=rows_per_chunk) as reader:
        for i, chunk in enumerate(reader):
            # The index is zero-padded to at least three digits; larger
            # indices simply use more digits.
            chunk_file = os.path.join(output_dir, f"chunk_{i:03}.csv")
            chunk.to_csv(chunk_file, index=False)
            print(f"Saved: {chunk_file}")

def _chunk_sort_key(file_name):
    """Return a sort key that orders ``chunk_<n>.csv`` names by the integer ``n``."""
    stem = file_name[len("chunk_"):-len(".csv")]
    if stem.isdecimal():
        return (0, int(stem), file_name)
    # Names without a purely numeric index go last, in plain name order.
    return (1, 0, file_name)


def combine_csv_chunks(input_dir, output_file):
    """
    Recombine CSV chunk files from a directory into a single CSV file.

    Every file in ``input_dir`` whose name starts with ``chunk_`` and ends
    with ``.csv`` is loaded, the frames are concatenated in chunk order with a
    fresh row index, and the result is written to ``output_file`` without the
    index column. A "Loaded: ..." line is printed per chunk and a final
    "Recombined CSV saved to: ..." line once the output is written.

    Chunks are ordered by their numeric index rather than by plain string
    comparison, so ``chunk_1000.csv`` correctly follows ``chunk_999.csv``.

    Args:
        input_dir (str): Directory containing CSV chunk files.
        output_file (str): Path to save the recombined CSV file.

    Raises:
        ValueError: If ``input_dir`` contains no matching chunk files.
    """
    chunk_files = sorted(
        (
            f
            for f in os.listdir(input_dir)
            if f.startswith("chunk_") and f.endswith(".csv")
        ),
        key=_chunk_sort_key,
    )

    # Fail early with a descriptive message instead of letting pd.concat
    # raise its generic error on an empty list.
    if not chunk_files:
        raise ValueError(f"No chunk_*.csv files found in: {input_dir}")

    df_list = []
    for chunk_file in chunk_files:
        chunk_path = os.path.join(input_dir, chunk_file)
        df_list.append(pd.read_csv(chunk_path))
        print(f"Loaded: {chunk_file}")

    full_df = pd.concat(df_list, ignore_index=True)
    full_df.to_csv(output_file, index=False)
    print(f"Recombined CSV saved to: {output_file}")

In [2]:
# Split complete_sentiment.csv into chunk files under sentiment_brokendown/, using the default rows_per_chunk.
split_csv('complete_sentiment.csv','sentiment_brokendown')

Saved: sentiment_brokendown/chunk_000.csv
Saved: sentiment_brokendown/chunk_001.csv
Saved: sentiment_brokendown/chunk_002.csv
Saved: sentiment_brokendown/chunk_003.csv
Saved: sentiment_brokendown/chunk_004.csv
Saved: sentiment_brokendown/chunk_005.csv
Saved: sentiment_brokendown/chunk_006.csv
Saved: sentiment_brokendown/chunk_007.csv
Saved: sentiment_brokendown/chunk_008.csv
Saved: sentiment_brokendown/chunk_009.csv
Saved: sentiment_brokendown/chunk_010.csv
Saved: sentiment_brokendown/chunk_011.csv
Saved: sentiment_brokendown/chunk_012.csv
Saved: sentiment_brokendown/chunk_013.csv
Saved: sentiment_brokendown/chunk_014.csv
