In [2]:
import pandas as pd

# Read the processed broadband data from its Colab file path
df = pd.read_csv(
    '/content/llm-human-readable__content_perfect3_processed_data_part-00000-edbbc52d-1449-48a9-af87-48d605e9922a-c000.csv'
)

# Broadband-type labels mapped to the names used in the summaries.
# Every label currently maps to itself; this is the place to add display names.
bb_type_mapping = {
    label: label
    for label in ('Fixed Broadband', 'Fixed Wireless Access')
}

# Function to generate the new summary based on the proposed template
def create_uniform_summary(row):
    """Build the one-sentence market-share summary for a single row.

    Args:
        row: Mapping-like record (a DataFrame row when called through
            ``df.apply(..., axis=1)``) providing ``hh_bb_carrier``,
            ``bb_type``, ``distinct_hhid_count``, ``total_hhids`` and
            ``carrier_share``.

    Returns:
        The formatted summary sentence, or a string beginning with
        ``"Error processing row: "`` when the row cannot be processed.
        The function never raises, so one bad row does not abort the
        whole ``apply``.
    """
    required_columns = (
        'hh_bb_carrier',
        'bb_type',
        'distinct_hhid_count',
        'total_hhids',
        'carrier_share',
    )
    try:
        # Missing values (NaN/None) would otherwise be interpolated as the
        # literal text "nan" (e.g. "nan providing ..." or "nan%") and slip
        # past the error scan, so reject them explicitly.
        for column in required_columns:
            if pd.isna(row[column]):
                raise ValueError(f"missing value in column '{column}'")

        # Extract values from the row using the correct column names
        carrier = row['hh_bb_carrier']  # e.g., Comcast
        # Fall back to the raw label when it has no entry in the mapping
        bb_type = bb_type_mapping.get(row['bb_type'], row['bb_type'])
        distinct_hh = int(row['distinct_hhid_count'])  # Number of distinct households
        total_hh = int(row['total_hhids'])  # Total households
        # Stored as a fraction; convert to a percentage (e.g., 0.282 -> 28.2)
        carrier_share = float(row['carrier_share']) * 100

        # Format the summary using the proposed template
        summary = (f"In the USA, during 2024, July, "
                   f"{carrier} providing {bb_type} services served {distinct_hh:,} households "
                   f"out of a total of {total_hh:,} in the country, resulting in a market share of {carrier_share:.1f}%.")

        return summary
    except Exception as e:
        # Deliberately broad: any failure is reported in-band so the caller
        # can find bad rows by searching for the "Error processing row" prefix.
        return f"Error processing row: {e}"

# Generate one summary per row (axis=1) and store it in the
# Human_Readable_Summary column
df['Human_Readable_Summary'] = df.apply(create_uniform_summary, axis=1)

# Write the augmented table to a new CSV, without the index column
df.to_csv('updated_file.csv', index=False)

# Show the generated summaries for a quick visual check
print(df[['Human_Readable_Summary']])

# Failed rows carry the error prefix returned by create_uniform_summary;
# collect them so they can be inspected
error_mask = df['Human_Readable_Summary'].str.contains("Error processing row")
errors = df.loc[error_mask]
if errors.empty:
    print("\nNo errors found in the summaries.")
else:
    print("\nRows with errors:")
    print(errors)

                                Human_Readable_Summary
0    In the USA, during 2024, July, Comcast providi...
1    In the USA, during 2024, July, Spectrum provid...
2    In the USA, during 2024, July, AT&T providing ...
3    In the USA, during 2024, July, Verizon providi...
4    In the USA, during 2024, July, Cox providing F...
..                                                 ...
110  In the USA, during 2024, July, Clearwave Fiber...
111  In the USA, during 2024, July, IdeaTek providi...
112  In the USA, during 2024, July, Union Wireless ...
113  In the USA, during 2024, July, Xtream providin...
114  In the USA, during 2024, July, Vast Broadband ...

[115 rows x 1 columns]

No errors found in the summaries.
