In [3]:
import os
import time

import pandas as pd
from openai import APIError, NotFoundError, OpenAI

# Initialize the OpenAI client
client = OpenAI(api_key=os.getenv('OPENAI_API_KEY'))

# Only files uploaded within this many seconds are selected.
# 150000 s is roughly 41.7 hours (for reference, 24 hours would be 86400 s).
MAX_FILE_AGE_SECONDS = 150000

# Columns of the resulting table; declared up front so the DataFrame keeps its
# schema (and can still be sorted / saved) even when no file matches.
FILE_COLUMNS = ['Filename', 'File ID', 'Created At']

# Get the current time (Unix epoch seconds, same unit as file.created_at)
current_time = time.time()

# List all files
response = client.files.list()

# Prepare data for DataFrame.
# Iterating the page object itself (rather than response.data) lets the SDK
# fetch any further pages automatically, so files beyond the first page are
# not silently missed.
data_for_df = [
    {
        'Filename': file.filename,
        'File ID': file.id,
        'Created At': file.created_at,
    }
    for file in response
    if current_time - file.created_at < MAX_FILE_AGE_SECONDS
]

# Create DataFrame, newest files first
df = pd.DataFrame(data_for_df, columns=FILE_COLUMNS).sort_values(
    by='Created At', ascending=False
)

df

Unnamed: 0,Filename,File ID,Created At
0,actualfreedom.com.au---library---topics---peop...,file-kea3DFYKA4kSUGXNKCLS7soV,1715032377
1,actualfreedom.com.au---richard---listbcorrespo...,file-6QkrydgszsHPkjpHPQBE7Wcl,1715032377
2,www.actualfreedom.com.au---richard---listbcorr...,file-MD3F39PLeCo1k5En6mmFJ03Y,1715032376
3,actualfreedom.com.au---richard---abditorium---...,file-m2WgKhmw0PMhMbvHSZJCRy0k,1715032374
4,actualfreedom.com.au---richard---abditorium---...,file-bgekQYqXgKPFo0zbvMqiyNTv,1715032366
...,...,...,...
7178,library---topics---relativism.html,file-0SjQA6g7VOR7Kpzv4JLnl2WA,1714947282
7179,actualism---peter---selected-writings---pcetri...,file-Njr0AW1V2smlXMmKGYHzHJxp,1714947281
7180,actualism---peter---selected-correspondence---...,file-uihtDMNkWi65jZLyfs1bYyc3,1714947280
7181,richard---selectedcorrespondence---sc-morals.html,file-EFBdJbvLNKPXtsEp5eVUghwm,1714947280


In [4]:
# Write every selected file to disk, ordered oldest -> newest by 'Created At',
# without the DataFrame index column.
oldest_first = df.sort_values(by='Created At')
oldest_first.to_csv('file_ids.csv', index=False)
print("DataFrame saved to file_ids.csv")


DataFrame saved to file_ids.csv


In [5]:
# Proceed with deletion
# Load data from CSV file
df_from_csv = pd.read_csv('file_ids.csv')

# Delete files listed in the DataFrame.
# Each deletion is handled on its own so that one failing request does not
# abort the rest of the batch; failures are collected and summarised below.
failed_deletions = []
for index, row in df_from_csv.iterrows():
    try:
        client.files.delete(row['File ID'])
    except NotFoundError:
        # The file no longer exists (e.g. this cell was re-run after a partial
        # run), so there is nothing left to delete for this row.
        print(f"Skipped file {row['Filename']} with ID {row['File ID']} (not found)")
    except APIError as error:
        failed_deletions.append({
            'Filename': row['Filename'],
            'File ID': row['File ID'],
            'Error': str(error),
        })
        print(f"Failed to delete file {row['Filename']} with ID {row['File ID']}: {error}")
    else:
        print(f"Deleted file {row['Filename']} with ID {row['File ID']}")

# Surface anything that still needs attention instead of failing silently
if failed_deletions:
    print(f"{len(failed_deletions)} of {len(df_from_csv)} deletions failed")

Deleted file introduction---humanbeings.html with ID file-h2T0GQUpIoxVWHZgWxMjt6Lw
Deleted file richard---selectedcorrespondence---sc-morals.html with ID file-EFBdJbvLNKPXtsEp5eVUghwm
Deleted file actualism---peter---selected-correspondence---corr-materialism2.html with ID file-uihtDMNkWi65jZLyfs1bYyc3
Deleted file actualism---peter---selected-writings---pcetriggers.html with ID file-Njr0AW1V2smlXMmKGYHzHJxp
Deleted file introduction---index.html with ID file-C5oip9NQM1nwGLk4DeXjJiOA
Deleted file library---topics---relativism.html with ID file-0SjQA6g7VOR7Kpzv4JLnl2WA
Deleted file actualism---vineeto---selected-correspondence---corr-science.html with ID file-YoNp3f6K0hmBo8EsCn9qdPX6
Deleted file actualism---vineeto---selected-correspondence---corr-fear2.html with ID file-sojJ0t1NMPTtVAOrY9prfnvM
Deleted file actualism---vineeto---selected-correspondence---corr-authority2.html with ID file-yHAa35g0PunA6OTpu9lhN2Bk
Deleted file sundry---frequentquestions---FAQ34a.html with ID file-r4Gpl0