In [3]:
import os
import pandas as pd
import re
from datetime import datetime, timedelta
import logging
from datetime import timedelta

# Configure logging once for the whole script; DEBUG level keeps the
# per-file progress messages visible.
logging.basicConfig(
    format='%(asctime)s - %(levelname)s - %(message)s',
    level=logging.DEBUG,
)
# Names of chats already handled, so that each chat is analyzed only once
processed_chats = set()

# Function to process a single line of chat
def process_line(line):
    """Parse one exported chat line into date, time, sender and message.

    The expected shape is ``D/M/YY, H:MM am/pm - Sender: Message`` (day
    first, 12-hour clock, optional whitespace before the am/pm marker).

    Args:
        line: A single chat line (continuation lines already merged).

    Returns:
        A dict with keys ``date`` (datetime at midnight), ``time`` (24-hour
        ``HH:MM`` string), ``sender`` and ``message``, or ``None`` when the
        line does not have the expected shape.
    """
    pattern = r'(\d{1,2}/\d{1,2}/\d{2}), (\d{1,2}:\d{2}\s?[AaPp][Mm]) - (.*?): (.*)'
    match = re.match(pattern, line)
    if not match:
        return None

    logging.debug("match file")
    date_str, time_str, sender, message = match.groups()
    date = datetime.strptime(date_str, '%d/%m/%y')
    # The regex allows "10:30PM" (no space), but a space in a strptime format
    # requires at least one whitespace character. Strip all whitespace and
    # parse the compact form so both spellings are accepted.
    compact_time = ''.join(time_str.split())
    time = datetime.strptime(compact_time, '%I:%M%p').strftime('%H:%M')
    return {'date': date, 'time': time, 'sender': sender, 'message': message}

def process_line_for_delay(line):
    """Parse one exported chat line into a single timestamp plus sender/message.

    Same line shape as ``D/M/YY, H:MM am/pm - Sender: Message``; unlike the
    date/time split variant, date and time are combined into one datetime so
    that differences between messages can be computed.

    Args:
        line: A single chat line (continuation lines already merged).

    Returns:
        A dict with keys ``datetime``, ``sender`` and ``message``, or
        ``None`` when the line does not have the expected shape.
    """
    pattern = r'(\d{1,2}/\d{1,2}/\d{2}), (\d{1,2}:\d{2}\s?[AaPp][Mm]) - (.*?): (.*)'
    match = re.match(pattern, line)
    if not match:
        return None

    date_str, time_str, sender, message = match.groups()
    # The regex allows "10:30PM" (no space), but a space in a strptime format
    # requires at least one whitespace character. Strip whitespace from the
    # time part and parse the compact form so both spellings are accepted.
    compact_time = ''.join(time_str.split())
    datetime_obj = datetime.strptime(f"{date_str} {compact_time}", '%d/%m/%y %I:%M%p')
    return {'datetime': datetime_obj, 'sender': sender, 'message': message}

# Function to read the chat file specifically for delay calculation
def read_chat_file_for_delay(file_path):
    """Read a chat export into a DataFrame with one combined timestamp per message.

    Lines that do not start with a ``D/M/YY, H:MM am/pm - `` prefix are
    treated as continuations and appended (space separated) to the message
    before them; such lines appearing before the first message are dropped.

    Args:
        file_path: Path of the UTF-8 encoded chat export.

    Returns:
        A DataFrame built from the dicts returned by
        ``process_line_for_delay`` (unparseable messages are skipped). It is
        empty, with no columns, when nothing could be parsed.
    """
    date_pattern = re.compile(r'^\d{1,2}/\d{1,2}/\d{2}, \d{1,2}:\d{2}\s?[AaPp][Mm] - ')

    concatenated_lines = []
    current_message = ""
    with open(file_path, 'r', encoding='utf-8') as file:
        # Stream the file line by line; there is no need to hold it all in memory.
        for line in file:
            if date_pattern.match(line):
                if current_message:
                    concatenated_lines.append(current_message)
                current_message = line.rstrip()
            elif current_message:
                # Continuation of a multi-line message
                current_message += " " + line.strip()
    if current_message:
        concatenated_lines.append(current_message)

    # Parse every message exactly once (the parser was previously run twice per line).
    parsed = (process_line_for_delay(message) for message in concatenated_lines)
    return pd.DataFrame([record for record in parsed if record is not None])

# The process_line_for_delay function remains the same
       
    
def calculate_time_spent_student(chat_df, target_date, employee_name):
    """Estimate the time non-employee senders spent typing on ``target_date``.

    The estimate is purely length based: 5 seconds per 10 characters, summed
    over every message on that date whose sender is not ``employee_name``.

    Returns:
        The estimate formatted by ``strfdelta`` (``HH:MM:SS``).
    """
    on_target_date = chat_df['date'].dt.date == target_date
    not_from_employee = chat_df['sender'] != employee_name
    character_count = chat_df[on_target_date & not_from_employee]['message'].str.len().sum()
    estimated_seconds = (character_count / 10) * 5
    return strfdelta(timedelta(seconds=estimated_seconds))

def format_delay_time(seconds):
    """Render a number of seconds as ``"H hr M mins"`` or, under one hour, ``"M mins"``.

    Leftover seconds are discarded (minutes are floored).
    """
    hours, leftover = divmod(seconds, 3600)
    minutes = leftover // 60
    return f"{hours} hr {minutes} mins" if hours > 0 else f"{minutes} mins"

def calculate_employee_delay(chat_df, employee_name, target_date):
    """Report employee replies on ``target_date`` that took longer than 15 minutes.

    Only the first employee message after a run of non-employee messages is
    considered; the delay is measured from the most recent non-employee
    message on the same date.

    Args:
        chat_df: DataFrame with ``datetime``, ``sender`` and ``message`` columns.
        employee_name: Sender name that identifies the employee.
        target_date: ``datetime.date`` to analyse; rows on other dates are skipped.

    Returns:
        A tuple of three newline-joined strings: the numbered timestamps of
        the late replies, the formatted delay durations, and for every late
        reply up to five messages before and five from the reply onwards
        as context.
    """
    delays = []
    delay_times = []
    messages_for_reference = []

    last_student_message_time = None
    employee_responded_after_student = False
    total_rows = len(chat_df)

    # enumerate() supplies the row *position*. The iterrows() label only equals
    # the position for a default RangeIndex, and the iloc slice below is
    # positional, so using the label would pick the wrong context rows (or
    # none) on a filtered or re-indexed frame.
    for position, (_, row) in enumerate(chat_df.iterrows()):
        if row['datetime'].date() != target_date:
            continue

        if row['sender'] != employee_name:
            last_student_message_time = row['datetime']
            employee_responded_after_student = False
            continue

        # Employee message: only the first one after a student message counts.
        if last_student_message_time is None or employee_responded_after_student:
            continue

        time_diff = row['datetime'] - last_student_message_time
        if time_diff > timedelta(minutes=15):
            formatted_time = row['datetime'].strftime('%d %b %Y %I:%M%p')
            delays.append(f"{len(delays) + 1} - {formatted_time}")
            delay_times.append(format_delay_time(int(time_diff.total_seconds())))

            start_index = max(0, position - 5)
            end_index = min(position + 5, total_rows)
            context_messages = chat_df.iloc[start_index:end_index]
            formatted_context_messages = [
                f"{start_index + offset + 1} - "
                f"{message_row['datetime'].strftime('%d %b %Y %I:%M%p')} - "
                f"{message_row['sender']}: {message_row['message']}"
                for offset, (_, message_row) in enumerate(context_messages.iterrows())
            ]
            messages_for_reference.append("\n".join(formatted_context_messages))

        employee_responded_after_student = True

    # Combine the lists into multiline strings
    return "\n".join(delays), "\n".join(delay_times), "\n".join(messages_for_reference)

def is_broken_chat_student(chat_df, employee_name, target_date):
    """Tell whether the student left the chat hanging on the day before ``target_date``.

    Returns ``'Yes'`` only when both the employee and at least one other
    sender wrote on that day and the day's last message is from the
    employee; otherwise ``'No'``.
    """
    day_before = target_date - timedelta(days=1)
    conversation = chat_df[chat_df['date'].dt.date == day_before]

    # No conversation at all on that day
    if conversation.empty:
        return 'No'

    senders = conversation['sender']
    from_employee = senders == employee_name

    # Both parties must have written at least once
    if not from_employee.any() or from_employee.all():
        return 'No'

    # The employee had the last word, so the student never answered
    return 'Yes' if senders.iloc[-1] == employee_name else 'No'
    
def count_missed_replies_student(chat_df, employee_name, report_date):
    """Count days in the 7-day window ending on ``report_date`` with one-sided chat.

    A day is counted when at least one non-employee message exists on it and
    the employee sent nothing that day.
    """
    message_dates = chat_df['date'].dt.date
    is_employee = chat_df['sender'] == employee_name

    missed_days = 0
    for days_back in range(7):
        on_day = message_dates == report_date - timedelta(days=days_back)
        others_wrote = (on_day & ~is_employee).any()
        employee_wrote = (on_day & is_employee).any()
        if others_wrote and not employee_wrote:
            missed_days += 1
    return missed_days

def count_missed_replies_studentt(chat_df, employee_name, target_date):
    """Flag a missed reply by the student on the day before ``target_date``.

    Returns ``'Yes'`` when the employee wrote on that day and nobody else
    did; otherwise ``'No'``.
    """
    day_before = target_date - timedelta(days=1)
    senders = chat_df.loc[chat_df['date'].dt.date == day_before, 'sender']

    employee_wrote = (senders == employee_name).any()
    student_wrote = (senders != employee_name).any()

    # Employee messages with no answer from anyone else count as a missed reply
    return 'Yes' if employee_wrote and not student_wrote else 'No'

def count_missed_replies_last_7_days(chat_df, employee_name, start_date):
    """Count days on which leads wrote but the employee did not.

    The window is the 7 days ending on ``start_date`` (``start_date`` itself
    and the six days before it).
    """
    message_dates = chat_df['date'].dt.date
    from_employee = chat_df['sender'] == employee_name

    # Distinct calendar days on which each side sent something
    employee_days = set(message_dates[from_employee])
    lead_days = set(message_dates[~from_employee])

    window = [start_date - timedelta(days=offset) for offset in range(7)]
    return sum(1 for day in window if day in lead_days and day not in employee_days)

# Function to calculate the time spent in chat based on message lengths
def calculate_time_spent(chat_df, target_date, employee_name, team_folder):
    """Estimate how long the employee spent typing on ``target_date``.

    Each employee message contributes 0.2 seconds per character, except that
    in the "KAM" team folder a message longer than 700 characters contributes
    a flat 5 seconds.

    Returns:
        ``'00:00:00'`` when the employee sent nothing that day, otherwise
        the total formatted by ``strfdelta`` (``HH:MM:SS``).
    """
    sent_by_employee = (chat_df['date'].dt.date == target_date) & (chat_df['sender'] == employee_name)
    employee_texts = chat_df.loc[sent_by_employee, 'message']

    if employee_texts.empty:
        return '00:00:00'

    cap_long_messages = team_folder == "KAM"
    elapsed_seconds = 0
    for text in employee_texts:
        length = len(text)
        if cap_long_messages and length > 700:
            # Flat 5 seconds for a long message in the KAM team folder
            elapsed_seconds += 5
        else:
            # 0.2 seconds per character
            elapsed_seconds += length * 0.2

    return strfdelta(timedelta(seconds=elapsed_seconds))

def strfdelta(tdelta):
    """Format a non-negative timedelta as zero-padded ``HH:MM:SS``.

    Whole days are folded into the hour field (25 hours renders as
    ``25:00:00``); fractional seconds are truncated.
    """
    # timedelta.seconds alone excludes the days component, which made any
    # duration of 24 hours or more wrap around to a small value.
    total_seconds = tdelta.days * 86400 + tdelta.seconds
    hours, remainder = divmod(total_seconds, 3600)
    minutes, seconds = divmod(remainder, 60)
    return f"{hours:02}:{minutes:02}:{seconds:02}"

def calculate_lead_response(chat_df, employee_name, target_date):
    """
    Calculates the lead response for ``target_date`` from the number of texts
    sent by the employee versus everyone else (non-employees).

    - If only the employee sent messages, the response is 100.
    - If only non-employees sent messages, the response is 0.
    - If both sent messages, it is the employee's share of all texts as a
      percentage, constrained between 1 and 99.
    - If nobody sent a message on that date, the response is 0.

    Args:
        chat_df: DataFrame with a datetime ``date`` column and a ``sender`` column.
        employee_name: Sender name that identifies the employee.
        target_date: ``datetime.date`` to evaluate.

    Returns:
        A number between 0 and 100.
    """
    # Senders of the messages on the target date
    senders = chat_df.loc[chat_df['date'].dt.date == target_date, 'sender']
    num_texts_employee = int((senders == employee_name).sum())
    num_texts_non_employee = int((senders != employee_name).sum())

    # Nobody wrote on that date
    if num_texts_employee == 0 and num_texts_non_employee == 0:
        return 0

    # One-sided days sit at the ends of the scale. These two values used to
    # be swapped, contradicting both the documented contract and the ratio
    # below (which tends towards 100 as the employee's share grows).
    if num_texts_non_employee == 0:
        return 100
    if num_texts_employee == 0:
        return 0

    total_texts = num_texts_employee + num_texts_non_employee
    lead_response = (num_texts_employee / total_texts) * 100
    return max(min(lead_response, 99), 1)



def calculate_broken_chat_within_working_hrs(chat_df, employee_name, report_date, team_folder):
    """Flag a chat the employee left unanswered during working hours.

    Returns ``'Yes'`` when, on ``report_date``, both the employee and a lead
    wrote, the day's last message is from the lead, and that message falls
    inside the working-hours window; otherwise ``'No'``.

    Working hours are 07:30-16:30 for the 'EWYL' team folder and
    00:00-23:59 for every other folder.
    NOTE(review): 'KAM' gets no dedicated window here, unlike the
    missed-reply check elsewhere in this file - confirm that is intended.

    Args:
        chat_df: DataFrame with ``datetime`` and ``sender`` columns.
        employee_name: Sender name that identifies the employee.
        report_date: ``datetime`` for the day to check (``.date()`` is called on it).
        team_folder: Team folder name used to pick the working hours.
    """
    if team_folder == 'EWYL':
        opening, closing = (7, 30), (16, 30)
    else:
        opening, closing = (0, 0), (23, 59)

    day = (report_date.year, report_date.month, report_date.day)
    work_start_time = datetime(*day, *opening, 0)
    work_end_time = datetime(*day, *closing, 0)

    # Messages sent on the report date
    todays_messages = chat_df[chat_df['datetime'].dt.date == report_date.date()]
    if todays_messages.empty:
        return 'No'

    # Both the employee and a lead must have written at least once
    from_lead = todays_messages['sender'] != employee_name
    if from_lead.all() or not from_lead.any():
        return 'No'

    # The employee had the last word, so nothing was left unanswered
    if todays_messages.iloc[-1]['sender'] == employee_name:
        return 'No'

    last_lead_message_time = todays_messages.loc[from_lead, 'datetime'].iloc[-1]
    if work_start_time <= last_lead_message_time <= work_end_time:
        return 'Yes'
    return 'No'

def calculate_broken_chat(chat_df, employee_name, report_date):
    """Tell whether the employee left the chat hanging on ``report_date``.

    Args:
        chat_df: DataFrame with a datetime ``date`` column and a ``sender`` column.
        employee_name: Sender name that identifies the employee.
        report_date: ``datetime.date`` to check.

    Returns:
        ``True`` when both the employee and a lead wrote on that date and
        the last message of the day is from the lead; ``False`` in every
        other case (previously those paths fell through and returned
        ``None``).
    """
    # Senders of the messages on the report date
    senders = chat_df.loc[chat_df['date'].dt.date == report_date, 'sender']
    if senders.empty:
        return False

    # Both the employee and a lead must have written at least once
    from_employee = senders == employee_name
    if not from_employee.any() or from_employee.all():
        return False

    # Broken when the lead had the last word
    return bool(senders.iloc[-1] != employee_name)

    

def missed_replies_employee(chat_df, employee_name, target_date):
    """Flag a day on which the student wrote but the employee never did.

    Returns ``'Yes'`` when ``target_date`` has at least one non-employee
    message and no employee message; otherwise ``'No'``.
    """
    senders = chat_df.loc[chat_df['date'].dt.date == target_date, 'sender']

    student_wrote = (senders != employee_name).any()
    employee_wrote = (senders == employee_name).any()

    if student_wrote and not employee_wrote:
        return 'Yes'
    return 'No'

def missed_replies_employee_after_working_hrs(chat_df, employee_name, target_date, team_folder):
    """Flag a day with unanswered student messages sent during working hours.

    Returns ``'Yes'`` when, on ``target_date``, the employee sent nothing
    and at least one non-employee message falls inside the team's
    working-hours window; otherwise ``'No'``.

    Working hours by team folder:
        - 'EWYL': 07:30 to 16:30
        - 'KAM': 11:30 to 21:30
        - anything else: 00:00 to 23:59

    Args:
        chat_df: DataFrame with ``datetime`` and ``sender`` columns.
        employee_name: Sender name that identifies the employee.
        target_date: ``datetime`` for the day to check.
        team_folder: Team folder name used to pick the working hours.

    Raises:
        ValueError: If ``target_date`` is not a ``datetime`` instance.
    """
    # Validate before touching any attribute of target_date, so that a wrong
    # argument type always produces the ValueError below instead of an
    # AttributeError from the window construction.
    if not isinstance(target_date, datetime):
        raise ValueError("target_date must be a datetime object")

    working_hours = {
        'EWYL': ((7, 30), (16, 30)),
        'KAM': ((11, 30), (21, 30)),
    }
    opening, closing = working_hours.get(team_folder, ((0, 0), (23, 59)))
    day = (target_date.year, target_date.month, target_date.day)
    work_start_time = datetime(*day, *opening, 0)
    work_end_time = datetime(*day, *closing, 0)

    # Messages sent on the target date
    daily_messages = chat_df[chat_df['datetime'].dt.date == target_date.date()]
    from_employee = daily_messages['sender'] == employee_name
    student_times = daily_messages.loc[~from_employee, 'datetime']

    # Nothing to miss, or the employee did write that day
    if student_times.empty or from_employee.any():
        return 'No'

    # Logged at DEBUG level in place of printing the whole DataFrame to stdout.
    logging.debug(
        "No employee reply on %s; checking %d student message(s) against working hours",
        target_date.date(),
        len(student_times),
    )
    answered_late = any(
        work_start_time <= message_time <= work_end_time
        for message_time in student_times
    )
    return 'Yes' if answered_late else 'No'

# Function to read the chat file and return a dataframe
def read_chat_file(file_path):
    """Read a chat export into a DataFrame with separate date and time fields.

    Lines that do not start with a ``D/M/YY, H:MM am/pm - `` prefix are
    treated as continuations and appended (space separated) to the message
    before them; such lines appearing before the first message are dropped.

    Args:
        file_path: Path of the UTF-8 encoded chat export.

    Returns:
        A DataFrame built from the dicts returned by ``process_line``
        (unparseable messages are skipped). It is empty, with no columns,
        when nothing could be parsed.
    """
    date_pattern = re.compile(r'^\d{1,2}/\d{1,2}/\d{2}, \d{1,2}:\d{2}\s?[AaPp][Mm] - ')

    concatenated_lines = []
    current_message = ""
    with open(file_path, 'r', encoding='utf-8') as file:
        # Stream the file line by line; there is no need to hold it all in memory.
        for line in file:
            if date_pattern.match(line):
                if current_message:
                    concatenated_lines.append(current_message)
                current_message = line.rstrip()
            elif current_message:
                # Continuation of a multi-line message
                current_message += " " + line.strip()
    if current_message:
        concatenated_lines.append(current_message)

    # Parse every message exactly once (the parser was previously run twice per line).
    parsed = (process_line(message) for message in concatenated_lines)
    return pd.DataFrame([record for record in parsed if record is not None])

# process_line function remains the same


# Function to extract the chat file name based on a specific pattern
def extract_chat_name(chat_file_name):
    """Pull the contact name out of a ``WhatsApp Chat with <name>.txt`` file name.

    Underscores around the name and a ``(N)`` duplicate-download suffix are
    not part of the returned name.

    Returns:
        The extracted name, or ``None`` when the file name does not follow
        the pattern.
    """
    found = re.search(r'WhatsApp Chat with _?(.*?)(?:\(\d+\))?_?\.txt', chat_file_name)
    if found is None:
        return None

    raw_name = found.group(1)
    # Drop any trailing underscores / "(N)" left at the end of the capture
    return re.sub(r'_*(?:\(\d+\))?$', '', raw_name)

# Function to calculate the total count of missed replies by the student for the last N days
def calculate_total_count_missed_replies_student(chat_df, employee_name, num_days):
    """Sum ``count_missed_replies_student`` over the last ``num_days`` anchor dates.

    For each of the ``num_days`` days ending at the report date, the 7-day
    count anchored on that day is computed and all counts are added up.

    NOTE(review): ``report_date`` is not a parameter; it is read from the
    module-level variable of that name, so this function only works after
    that variable has been set.
    NOTE(review): because every anchor date contributes a full 7-day count,
    the windows overlap and a single day can be counted several times -
    confirm this is the intended metric.
    """
    return sum(
        count_missed_replies_student(
            chat_df, employee_name, report_date - timedelta(days=days_back)
        )
        for days_back in range(num_days)
    )

# Function to extract the start date from a chat file
def get_chat_start_date(chat_df):
    """Return the date of the earliest message, or ``None`` for an empty frame."""
    if chat_df.empty:
        return None
    earliest = chat_df['date'].min()
    return earliest.date()

# Function to process a single chat file
def process_chat_file(file_path, report_date, main_directory, team_folder, employee_folder):
    """Build one report row for a single exported chat file.

    "Day 0" is the day before ``report_date``; "Day 1" and "Day 2" are the
    two days before that. The employee is identified by ``employee_folder``
    (the folder name is used as the sender name).

    Args:
        file_path: Path of the chat export.
        report_date: ``datetime.date`` the report is generated for.
        main_directory: Directory being processed; its base name is stored
            in the row's 'Date' column.
        team_folder: Team folder name (selects team-specific rules).
        employee_folder: Employee folder name, also used as the employee's
            sender name.

    Returns:
        A dict with the report columns, or ``None`` when the file name does
        not look like a chat export, the chat name was already processed,
        or no message could be parsed from the file.
    """
    chat_name = extract_chat_name(os.path.basename(file_path))
    if chat_name is None or chat_name in processed_chats:
        return None
    # Marked as processed before parsing, so an unreadable duplicate is not retried.
    processed_chats.add(chat_name)

    chat_df = read_chat_file(file_path)
    if chat_df.empty:
        return None
    chat_start_date = get_chat_start_date(chat_df)

    # Separate frame with combined timestamps, used for delay and working-hours checks
    chat_df_for_delay = read_chat_file_for_delay(file_path)
    if chat_df_for_delay.empty:
        return None

    day_0_date = report_date - timedelta(days=1)
    day_1_date = report_date - timedelta(days=2)
    day_2_date = report_date - timedelta(days=3)

    delays, delay_times, messages_for_reference = calculate_employee_delay(
        chat_df_for_delay, employee_folder, day_0_date
    )

    # Employee time per day, keyed 'Day 0'..'Day 2'; Day 0 doubles as the total.
    time_spent = {
        f'Day {offset}': calculate_time_spent(
            chat_df, report_date - timedelta(days=offset + 1), employee_folder, team_folder
        )
        for offset in range(3)
    }
    day_0_time_spent = time_spent['Day 0']

    lead_response_day_0 = calculate_lead_response(chat_df, employee_folder, day_0_date)
    broken_chat = calculate_broken_chat(chat_df, employee_folder, day_0_date)
    missed_replies_day_0 = missed_replies_employee(chat_df, employee_folder, day_0_date)

    # The working-hours checks need a datetime. It is derived from report_date
    # (midnight of Day 0) rather than from datetime.now(), so these columns
    # describe the same day as every other Day 0 column even when the report
    # date is not today.
    day_0_start = datetime.combine(day_0_date, datetime.min.time())
    actual_missed_reply = missed_replies_employee_after_working_hrs(
        chat_df_for_delay, employee_folder, day_0_start, team_folder
    )
    actual_broken_chat = calculate_broken_chat_within_working_hrs(
        chat_df_for_delay, employee_folder, day_0_start, team_folder
    )
    total_count_missed_reply_student = calculate_total_count_missed_replies_student(
        chat_df, employee_folder, 14
    )

    # Does not depend on the loop below, so it is computed once. The window
    # is anchored 7 days before the report date, as before.
    missed_replies_count = count_missed_replies_last_7_days(
        chat_df, employee_folder, report_date - timedelta(days=7)
    )

    # Past 7 days (report date included): broken chats and the busiest day
    broken_chat_count = 0
    max_time_spent = ('', '00:00:00')  # (date, time)
    for days_back in range(7):
        check_date = report_date - timedelta(days=days_back)

        if calculate_broken_chat(chat_df, employee_folder, check_date):
            broken_chat_count += 1

        time_spent_on_day = calculate_time_spent(chat_df, check_date, employee_folder, team_folder)
        # Zero-padded HH:MM:SS strings compare in duration order
        if time_spent_on_day > max_time_spent[1]:
            max_time_spent = (check_date.strftime('%m-%d-%Y'), time_spent_on_day)

    # Student time for Day 0..2; Day 0 doubles as the total.
    time_spent_student_day_0 = calculate_time_spent_student(chat_df, day_0_date, employee_folder)
    time_spent_student_day_1 = calculate_time_spent_student(chat_df, day_1_date, employee_folder)
    time_spent_student_day_2 = calculate_time_spent_student(chat_df, day_2_date, employee_folder)
    total_time_spent_student = time_spent_student_day_0

    broken_chat_student = is_broken_chat_student(chat_df, employee_folder, report_date)
    missed_reply_student = count_missed_replies_studentt(chat_df, employee_folder, report_date)

    # Age of the chat on Day 0: 'Day 0'/'Day 1'/'Day 2', anything else is 'OLD'
    days_since_start = (day_0_date - chat_start_date).days
    day_indicator = f'Day {days_since_start}' if days_since_start in (0, 1, 2) else 'OLD'

    return {
        'Date': os.path.basename(main_directory),
        'Team Folder': team_folder,
        'Employee Folder': employee_folder,
        'Chat File Name': chat_name,
        'Day Indicator': day_indicator,
        'Total_Time_Spent_Employee': day_0_time_spent,
        'LR': lead_response_day_0,
        'Broken Chat(Employee)': 'Yes' if broken_chat else 'No',
        'Missed Replies (Employee)': missed_replies_day_0,
        'Count_Broken_Chat_Employee (Employee)': broken_chat_count,
        'Count_Missed_Replies_Missed_Replies (Employee)': missed_replies_count,
        'Date of Max time': max_time_spent[0],
        **time_spent,
        'Total Time Spent (Student)': total_time_spent_student,
        'Broken Chat (Student)': broken_chat_student,
        'Missed Replies (Student)': missed_reply_student,
        'Day_0_Time_Spent_Student': time_spent_student_day_0,
        'Day_1_Time_Spent_Student': time_spent_student_day_1,
        'Day_2_Time_Spent_Student': time_spent_student_day_2,
        'Total_Count_Missed_Reply_Chat_Student': total_count_missed_reply_student,
        'Employee Delays': delays,
        'Delay Durations': delay_times,
        'Messages for Reference': messages_for_reference,
        'Actual Missed Reply from Employee': actual_missed_reply,
        'Actual Broken Chat from Employee': actual_broken_chat,
    }

# Main directory path construction and report date setting
local_date_format = '%Y-%m-%d'  # Adjust this to your local date format
main_directory = 'F:\\Github-mauriceyeng\\Chat-Analyzer-V2\\Chat Folder from Drive\\2024-01-06-20240106T044019Z-001'  # Replace with your base directory path

# Get today's date
today_date = datetime.now().date()

# weekday() numbers Monday as 0 and Sunday as 6, so range(1, 6) is Tuesday to Saturday.
if today_date.weekday() not in range(1, 6):  # Sunday or Monday
    # You can adjust the number of days to subtract based on your specific requirements
    report_date = today_date - timedelta(days=1)
    logging.debug(f"Report Date: {report_date}")
else:  # Tuesday to Saturday
    report_date = today_date

report_date_str_local = report_date.strftime(local_date_format)
main_directory_path = os.path.join(main_directory, report_date_str_local)

# Function to navigate through the directory structure and process all chat files
def process_team_folders(main_directory, report_date):
    """Walk ``main_directory/<team>/<employee>/<chat file>`` and collect report rows.

    Every entry of every employee folder is handed to ``process_chat_file``;
    entries for which it returns nothing are skipped. Non-directory entries
    at the team and employee levels are ignored.

    Returns:
        A DataFrame with one row per processed chat (empty when none).
    """
    def subdirectories(parent):
        # Yield (name, path) for each directory directly inside `parent`.
        for entry in os.listdir(parent):
            full_path = os.path.join(parent, entry)
            if os.path.isdir(full_path):
                yield entry, full_path

    collected_rows = []
    for team_folder, team_path in subdirectories(main_directory):
        for employee_folder, employee_path in subdirectories(team_path):
            for chat_file in os.listdir(employee_path):
                row = process_chat_file(
                    os.path.join(employee_path, chat_file),
                    report_date,
                    main_directory,
                    team_folder,
                    employee_folder,
                )
                if not row:
                    continue
                collected_rows.append(row)
                logging.debug(f"Row appended for chat file: {chat_file}")
    return pd.DataFrame(collected_rows)

# Destination of the CSV report (define your desired path and file name)
csv_file_path = 'F:\\Github-mauriceyeng\\Chat-Analyzer-V2\\Chat Folder from Drive\\2024-01-06-20240106T044019Z-001\\data.csv'

# Process all team folders and chats based on the report date, then save the
# result to the CSV file without the index column
all_chats_df = process_team_folders(main_directory_path, report_date)
all_chats_df.to_csv(csv_file_path, index=False)
#print(f"DataFrame saved as CSV at {csv_file_path}")
# Display the result
#print(all_chats_df)

2024-01-06 10:35:44,270 - DEBUG - Row appended for chat file: WhatsApp Chat with Abraham EWYL22E0848.txt
2024-01-06 10:35:44,398 - DEBUG - Row appended for chat file: WhatsApp Chat with Allen EWYL22E0762.txt
2024-01-06 10:35:44,544 - DEBUG - Row appended for chat file: WhatsApp Chat with Alson EWYL22E0675.txt
2024-01-06 10:35:44,663 - DEBUG - Row appended for chat file: WhatsApp Chat with Andipa EWYL22E0389.txt
2024-01-06 10:35:44,794 - DEBUG - Row appended for chat file: WhatsApp Chat with Anesu EWYL22E0418.txt
2024-01-06 10:35:44,919 - DEBUG - Row appended for chat file: WhatsApp Chat with Anotidaishe EWYL23E0378.txt
2024-01-06 10:35:45,044 - DEBUG - Row appended for chat file: WhatsApp Chat with Ayanda EWYL23E0703.txt
2024-01-06 10:35:45,204 - DEBUG - Row appended for chat file: WhatsApp Chat with Benjamin EWYL23E1044.txt
2024-01-06 10:35:45,322 - DEBUG - Row appended for chat file: WhatsApp Chat with Bernadette EWYL22E0557.txt
2024-01-06 10:35:45,447 - DEBUG - Row appended for chat

2024-01-06 10:35:54,033 - DEBUG - Row appended for chat file: WhatsApp Chat with Sijamali EWYL23E1017.txt
2024-01-06 10:35:54,144 - DEBUG - Row appended for chat file: WhatsApp Chat with Sikhululekile EWYL23E0108.txt
2024-01-06 10:35:54,271 - DEBUG - Row appended for chat file: WhatsApp Chat with Sithabisiwe EWYL22E1220.txt
2024-01-06 10:35:54,399 - DEBUG - Row appended for chat file: WhatsApp Chat with Tadiwa EWYL23E1065.txt
2024-01-06 10:35:54,531 - DEBUG - Row appended for chat file: WhatsApp Chat with Tadiwanashe EWYL22E0420.txt
2024-01-06 10:35:54,656 - DEBUG - Row appended for chat file: WhatsApp Chat with Tadiwanashe EWYL23E0879.txt
2024-01-06 10:35:54,774 - DEBUG - Row appended for chat file: WhatsApp Chat with Tafadzwa EWYL22E0128.txt
2024-01-06 10:35:54,906 - DEBUG - Row appended for chat file: WhatsApp Chat with Tafadzwa EWYL22E1230.txt
2024-01-06 10:35:55,031 - DEBUG - Row appended for chat file: WhatsApp Chat with Taisha EWYL23E0131.txt
2024-01-06 10:35:55,150 - DEBUG - Ro

2024-01-06 10:36:03,775 - DEBUG - Row appended for chat file: WhatsApp Chat with Michael EWYL22E0173.txt
2024-01-06 10:36:03,922 - DEBUG - Row appended for chat file: WhatsApp Chat with Milan EWYL23E0847.txt
2024-01-06 10:36:04,050 - DEBUG - Row appended for chat file: WhatsApp Chat with Mishael EWYL23E0479.txt
2024-01-06 10:36:04,184 - DEBUG - Row appended for chat file: WhatsApp Chat with Mthuli EWYL23E0227.txt
2024-01-06 10:36:04,291 - DEBUG - Row appended for chat file: WhatsApp Chat with Munyaradzi EWYL21E0861.txt
2024-01-06 10:36:04,421 - DEBUG - Row appended for chat file: WhatsApp Chat with Munyaradzi EWYL23E1052.txt
2024-01-06 10:36:04,560 - DEBUG - Row appended for chat file: WhatsApp Chat with Natasha EWYL22E1100.txt
2024-01-06 10:36:04,692 - DEBUG - Row appended for chat file: WhatsApp Chat with Neo EWYL23E0196.txt
2024-01-06 10:36:04,831 - DEBUG - Row appended for chat file: WhatsApp Chat with Nicole EWYL23E1068.txt
2024-01-06 10:36:04,963 - DEBUG - Row appended for chat f

2024-01-06 10:36:13,700 - DEBUG - Row appended for chat file: WhatsApp Chat with Derylin EWYL23E0863.txt
2024-01-06 10:36:13,818 - DEBUG - Row appended for chat file: WhatsApp Chat with Desire EWYL22E0689.txt
2024-01-06 10:36:13,950 - DEBUG - Row appended for chat file: WhatsApp Chat with Edwin EWYL22E0823.txt
2024-01-06 10:36:14,066 - DEBUG - Row appended for chat file: WhatsApp Chat with Ephinas EWYL23E0036.txt
2024-01-06 10:36:14,186 - DEBUG - Row appended for chat file: WhatsApp Chat with Evans EWYL22E1255.txt
2024-01-06 10:36:14,299 - DEBUG - Row appended for chat file: WhatsApp Chat with Francine EWYL22E1258.txt
2024-01-06 10:36:14,436 - DEBUG - Row appended for chat file: WhatsApp Chat with Fungai EWYL22E0706.txt
2024-01-06 10:36:14,557 - DEBUG - Row appended for chat file: WhatsApp Chat with Gerald EWYL22E1202.txt
2024-01-06 10:36:14,680 - DEBUG - Row appended for chat file: WhatsApp Chat with Glory EWYL23E0796.txt
2024-01-06 10:36:14,818 - DEBUG - Row appended for chat file: W

2024-01-06 10:36:24,407 - DEBUG - Row appended for chat file: WhatsApp Chat with Sharon EWYL23E0497.txt
2024-01-06 10:36:24,525 - DEBUG - Row appended for chat file: WhatsApp Chat with Shawn EWYL22E0868.txt
2024-01-06 10:36:24,653 - DEBUG - Row appended for chat file: WhatsApp Chat with Shekinah EWYL22E0169.txt
2024-01-06 10:36:24,785 - DEBUG - Row appended for chat file: WhatsApp Chat with Sibongile EWYL22E0635.txt
2024-01-06 10:36:24,917 - DEBUG - Row appended for chat file: WhatsApp Chat with Sibonginkosi EWYL23E0528.txt
2024-01-06 10:36:25,046 - DEBUG - Row appended for chat file: WhatsApp Chat with Silence EWYL22E1150.txt
2024-01-06 10:36:25,173 - DEBUG - Row appended for chat file: WhatsApp Chat with Simphiwe EWYL22E0976.txt
2024-01-06 10:36:25,290 - DEBUG - Row appended for chat file: WhatsApp Chat with Stina EWYL23E0256.txt
2024-01-06 10:36:25,414 - DEBUG - Row appended for chat file: WhatsApp Chat with Tadiwa EWYL22E0603.txt
2024-01-06 10:36:25,534 - DEBUG - Row appended for c

2024-01-06 10:36:34,585 - DEBUG - Row appended for chat file: WhatsApp Chat with Faith EWYL23E0159.txt
2024-01-06 10:36:34,710 - DEBUG - Row appended for chat file: WhatsApp Chat with Fanuel EWYL22E0893.txt
2024-01-06 10:36:34,874 - DEBUG - Row appended for chat file: WhatsApp Chat with Freda EWYL23E0996.txt
2024-01-06 10:36:34,999 - DEBUG - Row appended for chat file: WhatsApp Chat with Gervais EWYL22E1186.txt
2024-01-06 10:36:35,109 - DEBUG - Row appended for chat file: WhatsApp Chat with Grace EWYL23E0201.txt
2024-01-06 10:36:35,234 - DEBUG - Row appended for chat file: WhatsApp Chat with Gracious EWYL22E0492.txt
2024-01-06 10:36:35,372 - DEBUG - Row appended for chat file: WhatsApp Chat with Hazel EWYL22E1166.txt
2024-01-06 10:36:35,480 - DEBUG - Row appended for chat file: WhatsApp Chat with Heggah EWYL22E1270.txt
2024-01-06 10:36:35,661 - DEBUG - Row appended for chat file: WhatsApp Chat with Henriata EWYL22E1139.txt
2024-01-06 10:36:35,812 - DEBUG - Row appended for chat file: W

2024-01-06 10:36:45,159 - DEBUG - Row appended for chat file: WhatsApp Chat with Silas EWYL23E0930.txt
2024-01-06 10:36:45,274 - DEBUG - Row appended for chat file: WhatsApp Chat with Sindisiwe EWYL22E0892.txt
2024-01-06 10:36:45,412 - DEBUG - Row appended for chat file: WhatsApp Chat with Siphosenkosi EWYL22E0350.txt
2024-01-06 10:36:45,529 - DEBUG - Row appended for chat file: WhatsApp Chat with Stephen EWYL23E0322.txt
2024-01-06 10:36:45,644 - DEBUG - Row appended for chat file: WhatsApp Chat with Tadiwanashe EWYL23E0037.txt
2024-01-06 10:36:45,773 - DEBUG - Row appended for chat file: WhatsApp Chat with Tadiwanashe EWYL23E0795.txt
2024-01-06 10:36:45,905 - DEBUG - Row appended for chat file: WhatsApp Chat with Tafadzwa EWYL22E0272.txt
2024-01-06 10:36:46,045 - DEBUG - Row appended for chat file: WhatsApp Chat with Tafadzwa EWYL23E0250.txt
2024-01-06 10:36:46,191 - DEBUG - Row appended for chat file: WhatsApp Chat with TAFARA EWYL22E1329.txt
2024-01-06 10:36:46,327 - DEBUG - Row app

2024-01-06 10:36:54,927 - DEBUG - Row appended for chat file: WhatsApp Chat with Rejoice EWYL22E1085.txt
2024-01-06 10:36:55,059 - DEBUG - Row appended for chat file: WhatsApp Chat with Rhoda EWYL22E0988.txt
2024-01-06 10:36:55,177 - DEBUG - Row appended for chat file: WhatsApp Chat with Rutendo EWYL22E0220.txt
2024-01-06 10:36:55,302 - DEBUG - Row appended for chat file: WhatsApp Chat with Rutendo EWYL22E0703.txt
2024-01-06 10:36:55,428 - DEBUG - Row appended for chat file: WhatsApp Chat with Rutendo EWYL23E0521.txt
2024-01-06 10:36:55,546 - DEBUG - Row appended for chat file: WhatsApp Chat with Ruth EWYL22E1019.txt
2024-01-06 10:36:55,654 - DEBUG - Row appended for chat file: WhatsApp Chat with Senamiso EWYL22E0983.txt
2024-01-06 10:36:55,782 - DEBUG - Row appended for chat file: WhatsApp Chat with Shalom EWYL23E0506.txt
2024-01-06 10:36:55,893 - DEBUG - Row appended for chat file: WhatsApp Chat with Shaun EWYL22E0968.txt
2024-01-06 10:36:56,012 - DEBUG - Row appended for chat file: 

2024-01-06 10:37:05,603 - DEBUG - Row appended for chat file: WhatsApp Chat with Tiara 2K23JUN0698.txt
2024-01-06 10:37:05,731 - DEBUG - Row appended for chat file: WhatsApp Chat with Tinayeishe 2K23DEC0785.txt
2024-01-06 10:37:05,860 - DEBUG - Row appended for chat file: WhatsApp Chat with Tinotenda 2K23DEC2353R.txt
2024-01-06 10:37:05,997 - DEBUG - Row appended for chat file: WhatsApp Chat with Tinotendaishe 2K23DEC2325.txt
2024-01-06 10:37:06,150 - DEBUG - Row appended for chat file: WhatsApp Chat with Valentine 2K23SEP2895.txt
2024-01-06 10:37:06,285 - DEBUG - Row appended for chat file: WhatsApp Chat with Whatfor 2K23NOV0371.txt
2024-01-06 10:37:06,405 - DEBUG - Row appended for chat file: WhatsApp Chat with Alois 2K23DEC1526R.txt
2024-01-06 10:37:06,529 - DEBUG - Row appended for chat file: WhatsApp Chat with Amanda 2K23DEC2294R.txt
2024-01-06 10:37:06,663 - DEBUG - Row appended for chat file: WhatsApp Chat with Ange_lique 2K23DEC1972R.txt
2024-01-06 10:37:06,810 - DEBUG - Row ap

2024-01-06 10:37:16,424 - DEBUG - Row appended for chat file: WhatsApp Chat with Abercy 2K23APR1707.txt
2024-01-06 10:37:16,540 - DEBUG - Row appended for chat file: WhatsApp Chat with Anesu 2K23OCT2795.txt
2024-01-06 10:37:16,656 - DEBUG - Row appended for chat file: WhatsApp Chat with Anna 2K23APR0339.txt
2024-01-06 10:37:16,809 - DEBUG - Row appended for chat file: WhatsApp Chat with Ashley 2K23NOV2234.txt
2024-01-06 10:37:16,925 - DEBUG - Row appended for chat file: WhatsApp Chat with Blessing 2K23APR0698.txt
2024-01-06 10:37:17,041 - DEBUG - Row appended for chat file: WhatsApp Chat with Blessing 2K23APR1799.txt
2024-01-06 10:37:17,157 - DEBUG - Row appended for chat file: WhatsApp Chat with Chiedza 2K23NOV2116.txt
2024-01-06 10:37:17,273 - DEBUG - Row appended for chat file: WhatsApp Chat with Gracious 2K23OCT2745.txt
2024-01-06 10:37:17,411 - DEBUG - Row appended for chat file: WhatsApp Chat with Harriet 2K23AUG0392R.txt
2024-01-06 10:37:17,542 - DEBUG - Row appended for chat fi

2024-01-06 10:37:27,391 - DEBUG - Row appended for chat file: WhatsApp Chat with Elexise_Edoofa(26_12)AA-IE.txt
2024-01-06 10:37:27,610 - DEBUG - Row appended for chat file: WhatsApp Chat with Kimberly T Pamuchigere_Edoofa(20_12)KA.txt
2024-01-06 10:37:27,815 - DEBUG - Row appended for chat file: WhatsApp Chat with Kunonga Malon Shaun_Edoofa(21_12)KA - IE.txt
2024-01-06 10:37:28,037 - DEBUG - Row appended for chat file: WhatsApp Chat with Life_Edoofa(27_12)PG-IE.txt
2024-01-06 10:37:28,228 - DEBUG - Row appended for chat file: WhatsApp Chat with Makanaka Mutandwa_Edoofa(17_11)KA.txt
2024-01-06 10:37:28,437 - DEBUG - Row appended for chat file: WhatsApp Chat with Mitchelle_Edoofa(27_12)PG.txt
2024-01-06 10:37:28,660 - DEBUG - Row appended for chat file: WhatsApp Chat with Murewa Lisah T_Edoofa(14_12)KA - IE.txt
2024-01-06 10:37:28,862 - DEBUG - Row appended for chat file: WhatsApp Chat with Nephew_Edoofa(14_11)AA.txt
2024-01-06 10:37:29,063 - DEBUG - Row appended for chat file: WhatsApp

2024-01-06 10:37:40,129 - DEBUG - Row appended for chat file: WhatsApp Chat with Joshua Chisanga_EDOOFAZAMBNTS(21_12)GS(1).txt
2024-01-06 10:37:40,317 - DEBUG - Row appended for chat file: WhatsApp Chat with Joyce chiwala_EDOOFAZAMBNGS(03_01)GS(1).txt
2024-01-06 10:37:40,437 - DEBUG - Row appended for chat file: WhatsApp Chat with Judith Luchembe_EDOOFAZAMBNGS(03_01)GS(1).txt
2024-01-06 10:37:40,640 - DEBUG - Row appended for chat file: WhatsApp Chat with Junior Nesvinga_EDOOFA(03_01)GS-IE(1).txt
2024-01-06 10:37:40,852 - DEBUG - Row appended for chat file: WhatsApp Chat with Kativhu Keith_EDOOFA(14_12)GS(1).txt
2024-01-06 10:37:41,013 - DEBUG - Row appended for chat file: WhatsApp Chat with Kudzaishe Matambo_EDOOFA(27_11)GS(1).txt
2024-01-06 10:37:41,153 - DEBUG - Row appended for chat file: WhatsApp Chat with Kuhamba Tanatswa_EDOOFA(2_1)GS(1).txt
2024-01-06 10:37:41,276 - DEBUG - Row appended for chat file: WhatsApp Chat with Lamond Chingema_EDOOFA(05_01)GS(1).txt
2024-01-06 10:37:41

2024-01-06 10:37:52,548 - DEBUG - Row appended for chat file: WhatsApp Chat with Rosemary_Edoofa(22_11)HP.txt
2024-01-06 10:37:52,833 - DEBUG - Row appended for chat file: WhatsApp Chat with Rutendo_Edoofa(26_12)HP.txt
2024-01-06 10:37:53,100 - DEBUG - Row appended for chat file: WhatsApp Chat with Ruvimbo_Edoofa(19_12)HP.txt
2024-01-06 10:37:53,312 - DEBUG - Row appended for chat file: WhatsApp Chat with Sungano_Edoofa(28_12)HP.txt
2024-01-06 10:37:53,455 - DEBUG - Row appended for chat file: WhatsApp Chat with Tafadzwa_Edoofa(05_01)HP.txt
2024-01-06 10:37:53,706 - DEBUG - Row appended for chat file: WhatsApp Chat with Talent_Edoofa(26_12)HP.txt
2024-01-06 10:37:53,827 - DEBUG - Row appended for chat file: WhatsApp Chat with Tatenda_Edoofa(05_01)HP.txt
2024-01-06 10:37:54,036 - DEBUG - Row appended for chat file: WhatsApp Chat with Tinotenda_Edoofa(03_01)HP.txt
2024-01-06 10:37:54,257 - DEBUG - Row appended for chat file: WhatsApp Chat with Tinotenda_Edoofa(28_12)HP 2025.txt
2024-01-0

2024-01-06 10:38:04,332 - DEBUG - Row appended for chat file: WhatsApp Chat with Prisca_Edoofa(22_12)PG(1).txt
2024-01-06 10:38:04,598 - DEBUG - Row appended for chat file: WhatsApp Chat with Rabson_Edoofa(20_12)PG-IE(1).txt
2024-01-06 10:38:04,718 - DEBUG - Row appended for chat file: WhatsApp Chat with Rutendo_Edoofa(03_01)PG(1).txt
2024-01-06 10:38:04,909 - DEBUG - Row appended for chat file: WhatsApp Chat with Samantha_Edoofa(27_12)PG-IE(1).txt
2024-01-06 10:38:05,037 - DEBUG - Row appended for chat file: WhatsApp Chat with Sidumisile_Edoofa(02_01)PG(1).txt
2024-01-06 10:38:05,296 - DEBUG - Row appended for chat file: WhatsApp Chat with Tadiwanashe_Edoofa(03_01)PG-IE(1).txt
2024-01-06 10:38:05,484 - DEBUG - Row appended for chat file: WhatsApp Chat with Tafadzwa_Edoofa(18_12)PG-IE(1).txt
2024-01-06 10:38:05,673 - DEBUG - Row appended for chat file: WhatsApp Chat with Tanyaradzwa_Edoofa(22_12)PG(1).txt
2024-01-06 10:38:05,795 - DEBUG - Row appended for chat file: WhatsApp Chat with 

2024-01-06 10:38:19,330 - DEBUG - Row appended for chat file: WhatsApp Chat with Kokera Derrick Edoofa (28_12) SZ.txt
2024-01-06 10:38:19,473 - DEBUG - Row appended for chat file: WhatsApp Chat with Linda Malaba Edoofa (26_12) SZ.txt
2024-01-06 10:38:19,616 - DEBUG - Row appended for chat file: WhatsApp Chat with Mambara Faith Edoofa (05_01) SZ.txt
2024-01-06 10:38:19,763 - DEBUG - Row appended for chat file: WhatsApp Chat with Matongo Brighton Edoofa (26_12) SZ.txt
2024-01-06 10:38:19,905 - DEBUG - Row appended for chat file: WhatsApp Chat with Mirriam Ngalula Edoofa (04_01) SZ.txt
2024-01-06 10:38:20,137 - DEBUG - Row appended for chat file: WhatsApp Chat with Mishel Tadiwa Diwura Edoofa (16_11) SZ.txt
2024-01-06 10:38:20,335 - DEBUG - Row appended for chat file: WhatsApp Chat with Moyo Emma Edoofa (20_12) SZ.txt
2024-01-06 10:38:20,478 - DEBUG - Row appended for chat file: WhatsApp Chat with Munashe Oniswence Tomy Edoofa (02_01) SZ.txt
2024-01-06 10:38:20,610 - DEBUG - Row appended 

2024-01-06 10:38:33,063 - DEBUG - Row appended for chat file: WhatsApp Chat with Takudzwa Magwenzi_EDOOFA(03_01)SM24.txt
2024-01-06 10:38:33,251 - DEBUG - Row appended for chat file: WhatsApp Chat with Tanaka Mushonga_EDOOFA(07_12)SM23.txt
2024-01-06 10:38:33,388 - DEBUG - Row appended for chat file: WhatsApp Chat with Tanatswa Tsopotsa_EA(28_12)TR.txt
2024-01-06 10:38:33,599 - DEBUG - Row appended for chat file: WhatsApp Chat with THEARA MUDIMU_EA(21_11)TR.txt
2024-01-06 10:38:33,740 - DEBUG - Row appended for chat file: WhatsApp Chat with Wesley Kangoma_EDOOFAIE(29_12)SM23.txt


In [None]:
# Location of the CSV report (data.csv inside the export's base directory).
csv_file_path = 'F:\\Github-mauriceyeng\\Chat-Analyzer-V2\\Chat Folder from Drive\\2024-01-06-20240106T044019Z-001\\data.csv'  # Define your desired path and file name
