In [None]:
import os
import re

import pymupdf # PyMuPDF

# Matches one or more tags previously appended by rename_pdf_files at the end
# of a base name, e.g. "_Pg12_text" or a stacked "_Pg3_pic_Pg3_pic".
_TAG_SUFFIX_RE = re.compile(r"(?:_Pg\d+_(?:text|pic))+$")


def _build_tagged_name(file_name, page_count, has_text):
    """Return file_name carrying exactly one "_Pg<N>_<text|pic>.pdf" tag."""
    base_name = os.path.splitext(file_name)[0]
    # Drop any tag left by an earlier run so repeated runs do not stack tags.
    base_name = _TAG_SUFFIX_RE.sub("", base_name)
    kind = "text" if has_text else "pic"
    return f"{base_name}_Pg{page_count}_{kind}.pdf"


def rename_pdf_files(folder_path: str, text_threshold: int = 60) -> None:
    """
    Rename every PDF file in a folder based on its page count and the
    length of the text extracted from its first page.

    Logic:
    - Base name: OriginalName_Pg[PageCount]
    - Suffix: "_text" if the first page text length > text_threshold,
      otherwise "_pic"
    - A trailing "_Pg<N>_text" / "_Pg<N>_pic" tag already present on the
      name is replaced rather than duplicated, so running the function
      again on the same folder leaves correctly named files untouched.
    - A file is never renamed onto a different existing file.

    Args:
        folder_path: Directory whose entries ending in ".pdf" (any letter
            case) are processed. Sub-folders are not traversed.
        text_threshold: Number of characters of first-page text above which
            a file is tagged "_text". Defaults to 60.

    Returns:
        None. Progress and per-file errors are reported with print(); a
        failure on one file does not stop the remaining files.
    """
    if not os.path.isdir(folder_path):
        print(f"Error: Folder not found at {folder_path}")
        return

    print(f"Starting file renaming in: {folder_path}")

    # os.listdir returns a snapshot list, so renaming while looping is safe.
    for old_file_name in os.listdir(folder_path):
        # Only process PDF files
        if not old_file_name.lower().endswith(".pdf"):
            continue

        old_file_path = os.path.join(folder_path, old_file_name)

        try:
            # The context manager closes the document even when reading the
            # first page fails (e.g. a PDF with zero pages). The handle must
            # be released before the rename below, which would otherwise
            # fail on platforms that lock open files.
            with pymupdf.open(old_file_path) as doc:
                page_count = doc.page_count
                text = doc.load_page(0).get_text()

            new_file_name = _build_tagged_name(
                old_file_name, page_count, len(text) > text_threshold
            )

            if old_file_name == new_file_name:
                print(f"Skipped: '{old_file_name}' (Name is already correct)")
                continue

            new_file_path = os.path.join(folder_path, new_file_name)

            # os.rename silently replaces an existing target on POSIX, so
            # refuse to clobber another file. samefile() lets a case-only
            # rename through on case-insensitive file systems.
            if os.path.exists(new_file_path) and not os.path.samefile(
                old_file_path, new_file_path
            ):
                print(
                    f"Skipped: '{old_file_name}' "
                    f"(Target '{new_file_name}' already exists)"
                )
                continue

            os.rename(old_file_path, new_file_path)
            print(f"Renamed: '{old_file_name}' -> '{new_file_name}'")

        except Exception as e:
            # Deliberate best-effort boundary: report the file and move on.
            print(f"Could not process file {old_file_name}: {e}")

    print("\nFile renaming complete.")

In [None]:
# --- Folder to process ---
# IMPORTANT: point this at your own 'original' folder before running;
# either an absolute path or one relative to the working directory works.
pdf_folder = "Back_Dataset/original"

# Rename every PDF found in that folder
rename_pdf_files(folder_path=pdf_folder)