In [6]:
import requests
import csv

In [12]:
# Name of the source data file; it is appended to the download URL and also
# reused as the local file name (and as the stem of the converted CSV name).
orig_file = "chronicabsenteeism24.txt"

In [8]:
def download_large_file(url, output_file_path, timeout=(10, 60)):
    """
    Streams a file from the given URL to disk without loading it all into memory.

    The response bytes are written unchanged; no format conversion happens here.
    Data is first written to a temporary "<output_file_path>.part" file and only
    moved onto the final path once the whole download has succeeded, so a failed
    or interrupted download never leaves a truncated file at output_file_path.

    Request errors (connection problems, timeouts, HTTP error statuses) are
    reported with a printed message rather than raised. Errors from the local
    file system (e.g. an unwritable directory) still propagate to the caller.

    Args:
        url (str): The URL to download the file from.
        output_file_path (str): The path to save the downloaded file.
        timeout (float or tuple): Passed to requests.get. Either a single number
            of seconds or a (connect, read) pair. The read timeout limits the
            wait between received bytes, not the total download time.
    """
    import os  # Local import: the notebook's import cell does not bring in os

    partial_path = os.fspath(output_file_path) + ".part"
    try:
        # Stream the file from the URL to avoid loading it all at once in memory.
        # Without a timeout, requests would wait forever on an unresponsive server.
        with requests.get(url, stream=True, timeout=timeout) as response:
            response.raise_for_status()  # Check for request errors

            # Write to the temporary path in binary mode, 1 MB at a time
            with open(partial_path, 'wb') as file:
                for chunk in response.iter_content(chunk_size=1024 * 1024):
                    if chunk:  # Ensure there's data to write
                        file.write(chunk)

        # The download is complete: move it onto the final path in one step
        os.replace(partial_path, output_file_path)
        print(f"File downloaded successfully and saved as {output_file_path}")

    except requests.exceptions.RequestException as e:
        print(f"Error downloading the file: {e}")

    finally:
        # After a successful os.replace the temporary file no longer exists;
        # in every other case remove whatever partial download was left behind.
        try:
            os.remove(partial_path)
        except FileNotFoundError:
            pass

# Example usage: fetch the file named by orig_file and keep the same name locally.
url = f"https://www3.cde.ca.gov/demo-downloads/attendance/{orig_file}"  # Substitute another URL if needed
output_file_path = orig_file  # Local path for the downloaded (still tab-delimited) file
download_large_file(url, output_file_path)


File downloaded successfully and saved as chronicabsenteeism23.txt


In [13]:
def convert_tab_delimited_to_csv(input_file_path, output_file_path, input_encoding='ISO-8859-1'):
    """
    Converts a tab-delimited file to a comma-separated CSV file encoded as UTF-8.

    Rows are streamed from the input to the output, so the whole file is never
    held in memory. Any error is reported with a printed message rather than
    raised. If both paths refer to the same file the conversion is refused,
    because opening the output for writing would erase the input before it
    could be read.

    Args:
        input_file_path (str): The path to the input tab-delimited file.
        output_file_path (str): The path to save the converted CSV file.
        input_encoding (str): Text encoding of the input file. Defaults to
            'ISO-8859-1'.
    """
    import os  # Local import: the notebook's import cell does not bring in os

    try:
        # Opening the output in 'w' mode truncates it immediately, so converting
        # a file onto itself would destroy the data before any row is read.
        if os.path.exists(output_file_path) and os.path.samefile(input_file_path, output_file_path):
            raise ValueError("input and output paths refer to the same file")

        # newline='' on both files lets the csv module handle line endings itself
        with open(input_file_path, 'r', newline='', encoding=input_encoding) as tsv_file, \
                open(output_file_path, 'w', newline='', encoding='utf-8') as csv_file:
            # Reader splits on tabs; writer uses the csv module's default comma dialect
            tsv_reader = csv.reader(tsv_file, delimiter='\t')
            csv_writer = csv.writer(csv_file)

            # Copy every row across; the reader is consumed lazily
            csv_writer.writerows(tsv_reader)

        print(f"File converted successfully and saved as {output_file_path}")

    except Exception as e:
        print(f"Error converting file: {e}")

# Example usage: convert the downloaded file and write the result next to it.
input_file_path = orig_file  # The tab-delimited file fetched by the download step
output_file_path = f"{orig_file}.csv"  # Same name with '.csv' appended
convert_tab_delimited_to_csv(input_file_path, output_file_path)

File converted successfully and saved as chronicabsenteeism24.txt.csv
