In [4]:
# importing libraries
import os
import requests  # with this we can make http request to fetch web pages.
from bs4 import BeautifulSoup # we uses BeautifulSoup for the Parsing html content.
import pandas as pd

# by taking url as a input and by using requests we gets the html content of the page 
def extract_article_text(url):
    try:
        response = requests.get(url)
        soup = BeautifulSoup(response.text, 'html.parser') #Parses the HTML using BeautifulSoup.

        # Extract title and article text (<p> tags)
        title = soup.find('title').text.strip()
        article_text = '\n'.join([p.text for p in soup.find_all('p')])

        return title, article_text
    except Exception as e:
        print(f"Error extracting data from {url}: {e}")
        return None, None

def main():
    # Read the input Excel file using pandas library
    input_file_path = 'Input.xlsx'
    df = pd.read_excel(input_file_path)

    # Create a directory to save text files
    output_directory = 'output_texts'
    os.makedirs(output_directory, exist_ok=True)

    # Loop through the URLs in the input file
    for index, row in df.iterrows():
        url_id = row['URL_ID']
        url = row['URL']

        # Extract article text
        title, article_text = extract_article_text(url)

        if title and article_text:
            # Save the extracted text to a file
            output_file_path = os.path.join(output_directory, f'{url_id}.txt') # here we takes the usrl_id as the name of output text file
            with open(output_file_path, 'w', encoding='utf-8') as file:
                file.write(f'Title: {title}\n\n{article_text}')

            print(f"Data extracted from {url} and saved to {output_file_path}")

if __name__ == "__main__":
    main()


Data extracted from https://insights.blackcoffer.com/rising-it-cities-and-its-impact-on-the-economy-environment-infrastructure-and-city-life-by-the-year-2040-2/ and saved to output_texts\blackassign0001.txt
Data extracted from https://insights.blackcoffer.com/rising-it-cities-and-their-impact-on-the-economy-environment-infrastructure-and-city-life-in-future/ and saved to output_texts\blackassign0002.txt
Data extracted from https://insights.blackcoffer.com/internet-demands-evolution-communication-impact-and-2035s-alternative-pathways/ and saved to output_texts\blackassign0003.txt
Data extracted from https://insights.blackcoffer.com/rise-of-cybercrime-and-its-effect-in-upcoming-future/ and saved to output_texts\blackassign0004.txt
Data extracted from https://insights.blackcoffer.com/ott-platform-and-its-impact-on-the-entertainment-industry-in-future/ and saved to output_texts\blackassign0005.txt
Data extracted from https://insights.blackcoffer.com/the-rise-of-the-ott-platform-and-its-imp

Data extracted from https://insights.blackcoffer.com/difference-between-artificial-intelligence-machine-learning-statistics-and-data-mining/ and saved to output_texts\blackassign0052.txt
Data extracted from https://insights.blackcoffer.com/how-python-became-the-first-choice-for-data-science/ and saved to output_texts\blackassign0053.txt
Data extracted from https://insights.blackcoffer.com/how-google-fit-measure-heart-and-respiratory-rates-using-a-phone/ and saved to output_texts\blackassign0054.txt
Data extracted from https://insights.blackcoffer.com/what-is-the-future-of-mobile-apps/ and saved to output_texts\blackassign0055.txt
Data extracted from https://insights.blackcoffer.com/impact-of-ai-in-health-and-medicine/ and saved to output_texts\blackassign0056.txt
Data extracted from https://insights.blackcoffer.com/telemedicine-what-patients-like-and-dislike-about-it/ and saved to output_texts\blackassign0057.txt
Data extracted from https://insights.blackcoffer.com/how-we-forecast-futu

In [12]:
import os
import requests
from bs4 import BeautifulSoup
import pandas as pd
from nltk.tokenize import word_tokenize, sent_tokenize
from nltk.corpus import stopwords
from nltk.probability import FreqDist
import nltk
# imported nltk librarie to perform text anlysis



# Created Function to extract title and text from a given URL
def extract_article_text(url):
    try:
        response = requests.get(url)
        #Parses the HTML using BeautifulSoup.
        soup = BeautifulSoup(response.text, 'html.parser')

        # Extract title and article text
        title = soup.find('title').text.strip()
        article_text = '\n'.join([p.text for p in soup.find_all('p')])

        return title, article_text
    except Exception as e:
        # Handle any errors that may occur during the extraction
        print(f"Error extracting data from {url}: {e}")
        return None, None
    
# this function is created fro the text analysis on the article text.
def perform_text_analysis(article_text):
    # Tokenize words and sentences
    words = word_tokenize(article_text)
    sentences = sent_tokenize(article_text)

    # Remove common english stopwords
    stop_words = set(stopwords.words('english'))
    filtered_words = [word.lower() for word in words if word.isalnum() and word.lower() not in stop_words]

    # Compute word frequency distribution
    word_freq_dist = FreqDist(filtered_words)

    # Compute variables text analysis metrics
    total_words = len(words)
    total_sentences = len(sentences)
    unique_words = len(set(filtered_words))
    most_common_word, most_common_word_freq = word_freq_dist.most_common(1)[0] if word_freq_dist else ('', 0)

    return total_words, total_sentences, unique_words, most_common_word, most_common_word_freq

# Main function to read input, perform analysis, and save results
def main():
    # Read the input Excel file containing URLs
    input_file_path = 'Input.xlsx'
    df_input = pd.read_excel(input_file_path)

    # Create an empty DataFrame to store analysis results
    columns = ['URL_ID', 'Total_Words', 'Total_Sentences', 'Unique_Words', 'Most_Common_Word', 'Most_Common_Word_Frequency']
    df_output = pd.DataFrame(columns=columns)

    # Loop through the URLs in the input file
    for index, row in df_input.iterrows():
        url_id = row['URL_ID']
        url = row['URL']

        # Extract article text
        title, article_text = extract_article_text(url)

        if title and article_text:
            # Perform text analysis on extracted articles text
            total_words, total_sentences, unique_words, most_common_word, most_common_word_freq = perform_text_analysis(article_text)

            # Append the analysis results to the output DataFrame
            df_output = df_output.append({
                'URL_ID': url_id,
                'Total_Words': total_words,
                'Total_Sentences': total_sentences,
                'Unique_Words': unique_words,
                'Most_Common_Word': most_common_word,
                'Most_Common_Word_Frequency': most_common_word_freq
            }, ignore_index=True)
            
            
            # Print a message indicating the completion of analysis for the current URL
            print(f"Textual analysis for {url} completed.")
    # Save the output DataFrame to the output structure Excel file
    output_structure_file = 'Output Data Structure.xlsx'
    df_output.to_excel(output_structure_file, index=False)
    print(f"Analysis results saved to {output_structure_file}")

if __name__ == "__main__":
    main()

  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rising-it-cities-and-its-impact-on-the-economy-environment-infrastructure-and-city-life-by-the-year-2040-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rising-it-cities-and-their-impact-on-the-economy-environment-infrastructure-and-city-life-in-future/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/internet-demands-evolution-communication-impact-and-2035s-alternative-pathways/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-cybercrime-and-its-effect-in-upcoming-future/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/ott-platform-and-its-impact-on-the-entertainment-industry-in-future/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/the-rise-of-the-ott-platform-and-its-impact-on-the-entertainment-industry-by-2040/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-cyber-crime-and-its-effects/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-internet-demand-and-its-impact-on-communications-and-alternatives-by-the-year-2035-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-cybercrime-and-its-effect-by-the-year-2040-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-cybercrime-and-its-effect-by-the-year-2040/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-internet-demand-and-its-impact-on-communications-and-alternatives-by-the-year-2035/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-telemedicine-and-its-impact-on-livelihood-by-2040-3-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-e-health-and-its-impact-on-humans-by-the-year-2030/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-e-health-and-its-imapct-on-humans-by-the-year-2030-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-telemedicine-and-its-impact-on-livelihood-by-2040-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-telemedicine-and-its-impact-on-livelihood-by-2040-2-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-chatbots-and-its-impact-on-customer-support-by-the-year-2040/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-e-health-and-its-imapct-on-humans-by-the-year-2030/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-does-marketing-influence-businesses-and-consumers/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-advertisement-increase-your-market-value/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/negative-effects-of-marketing-on-society/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-advertisement-marketing-affects-business/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rising-it-cities-will-impact-the-economy-environment-infrastructure-and-city-life-by-the-year-2035/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-ott-platform-and-its-impact-on-entertainment-industry-by-the-year-2030/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-electric-vehicles-and-its-impact-on-livelihood-by-2040/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/rise-of-electric-vehicle-and-its-impact-on-livelihood-by-the-year-2040/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/oil-prices-by-the-year-2040-and-how-it-will-impact-the-world-economy/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/an-outlook-of-healthcare-by-the-year-2040-and-how-it-will-impact-human-lives/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/ai-in-healthcare-to-improve-patient-outcomes/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/what-if-the-creation-is-taking-over-the-creator/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/what-jobs-will-robots-take-from-humans-in-the-future/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/will-machine-replace-the-human-in-the-future-of-work/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/will-ai-replace-us-or-work-with-us/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/man-and-machines-together-machines-are-more-diligent-than-humans-blackcoffe/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/in-future-or-in-upcoming-years-humans-and-machines-are-going-to-work-together-in-every-field-of-work/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-neural-networks-can-be-applied-in-various-areas-in-the-future/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-machine-learning-will-affect-your-business/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/deep-learning-impact-on-areas-of-e-learning/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-to-protect-future-data-and-its-privacy-blackcoffer/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-machines-ai-automations-and-robo-human-are-effective-in-finance-and-banking/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/ai-human-robotics-machine-future-planet-blackcoffer-thinking-jobs-workplace/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-ai-will-change-the-world-blackcoffer/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/future-of-work-how-ai-has-entered-the-workplace/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/ai-tool-alexa-google-assistant-finance-banking-tool-future/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/ai-healthcare-revolution-ml-technology-algorithm-google-analytics-industrialrevolution/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/all-you-need-to-know-about-online-marketing/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/evolution-of-advertising-industry/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-data-analytics-can-help-your-business-respond-to-the-impact-of-covid-19/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/covid-19-environmental-impact-for-the-future/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/environmental-impact-of-the-covid-19-pandemic-lesson-for-the-future/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-data-analytics-and-ai-are-used-to-halt-the-covid-19-pandemic/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/difference-between-artificial-intelligence-machine-learning-statistics-and-data-mining/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-python-became-the-first-choice-for-data-science/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-google-fit-measure-heart-and-respiratory-rates-using-a-phone/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/what-is-the-future-of-mobile-apps/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/impact-of-ai-in-health-and-medicine/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/telemedicine-what-patients-like-and-dislike-about-it/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-we-forecast-future-technologies/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/can-robots-tackle-late-life-loneliness/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/embedding-care-robots-into-society-socio-technical-considerations/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/management-challenges-for-future-digitalization-of-healthcare-services/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/are-we-any-closer-to-preventing-a-nuclear-holocaust/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/will-technology-eliminate-the-need-for-animal-testing-in-drug-development/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/will-we-ever-understand-the-nature-of-consciousness/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/will-we-ever-colonize-outer-space/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/what-is-the-chance-homo-sapiens-will-survive-for-the-next-500-years/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/why-does-your-business-need-a-chatbot/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-you-lead-a-project-or-a-team-without-any-technical-expertise/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/can-you-be-great-leader-without-technical-expertise/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-does-artificial-intelligence-affect-the-environment/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-to-overcome-your-fear-of-making-mistakes-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/is-perfection-the-greatest-enemy-of-productivity/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/global-financial-crisis-2008-causes-effects-and-its-solution/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/gender-diversity-and-equality-in-the-tech-industry/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-to-overcome-your-fear-of-making-mistakes/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-small-business-can-survive-the-coronavirus-crisis/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/impacts-of-covid-19-on-vegetable-vendors-and-food-stalls/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/impacts-of-covid-19-on-vegetable-vendors/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/impact-of-covid-19-pandemic-on-tourism-aviation-industries/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/impact-of-covid-19-pandemic-on-sports-events-around-the-world/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/changing-landscape-and-emerging-trends-in-the-indian-it-ites-industry/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/online-gaming-adolescent-online-gaming-effects-demotivated-depression-musculoskeletal-and-psychosomatic-symptoms/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/human-rights-outlook/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-voice-search-makes-your-business-a-successful-business/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-the-covid-19-crisis-is-redefining-jobs-and-services/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-to-increase-social-media-engagement-for-marketers/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/impacts-of-covid-19-on-streets-sides-food-stalls/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/coronavirus-impact-on-energy-markets-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/coronavirus-impact-on-the-hospitality-industry-5/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/lessons-from-the-past-some-key-learnings-relevant-to-the-coronavirus-crisis-4/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/estimating-the-impact-of-covid-19-on-the-world-of-work-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/estimating-the-impact-of-covid-19-on-the-world-of-work-3/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/travel-and-tourism-outlook/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/gaming-disorder-and-effects-of-gaming-on-health/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/what-is-the-repercussion-of-the-environment-due-to-the-covid-19-pandemic-situation/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/what-is-the-repercussion-of-the-environment-due-to-the-covid-19-pandemic-situation-2/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/impact-of-covid-19-pandemic-on-office-space-and-co-working-industries/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/contribution-of-handicrafts-visual-arts-literature-in-the-indian-economy/ completed.


  df_output = df_output.append({


Textual analysis for https://insights.blackcoffer.com/how-covid-19-is-impacting-payment-preferences/ completed.
Textual analysis for https://insights.blackcoffer.com/how-will-covid-19-affect-the-world-of-work-2/ completed.
Analysis results saved to Output Data Structure.xlsx


  df_output = df_output.append({


In [24]:
import re
import nltk
from nltk.tokenize import word_tokenize, sent_tokenize
from nltk.corpus import stopwords


def clean_text(text, stop_words):
    # Remove stop words and non-alphabetic characters
    cleaned_text = ' '.join([word.lower() for word in word_tokenize(text) if word.isalpha() and word.lower() not in stop_words])
    return cleaned_text

def calculate_sentiment_scores(text, positive_words, negative_words):
    positive_score = sum(1 for word in word_tokenize(text) if word.lower() in positive_words)
    negative_score = -1 * sum(1 for word in word_tokenize(text) if word.lower() in negative_words)
    
    polarity_score = (positive_score - negative_score) / (positive_score + negative_score + 0.000001)
    subjectivity_score = (positive_score + negative_score) / (len(word_tokenize(text)) + 0.000001)
    
    return positive_score, negative_score, polarity_score, subjectivity_score

def calculate_readability(text):
    sentences = sent_tokenize(text)
    words = word_tokenize(text)
    
    average_sentence_length = len(words) / len(sentences)
    percentage_complex_words = sum(1 for word in words if len(word) > 2) / len(words)
    
    fog_index = 0.4 * (average_sentence_length + percentage_complex_words)
    average_words_per_sentence = len(words) / len(sentences)
    complex_word_count = sum(1 for word in words if len(word) > 2)
    word_count = len(words)
    
    syllable_count_per_word = calculate_syllable_count(words)
    
    personal_pronouns_count = count_personal_pronouns(text)
    
    average_word_length = sum(len(word) for word in words) / len(words)
    
    return (
        average_sentence_length, percentage_complex_words, fog_index,
        average_words_per_sentence, complex_word_count, word_count,
        syllable_count_per_word, personal_pronouns_count, average_word_length
    )

def calculate_syllable_count(words):
    syllable_count = 0
    for word in words:
        syllable_count += sum(1 for char in word if char.lower() in 'aeiou')
        
        # Handle exceptions
        if word.endswith(('es', 'ed')):
            syllable_count -= 1
    
    return syllable_count

def count_personal_pronouns(text):
    personal_pronouns = re.findall(r'\b(?:I|we|my|ours|us)\b', text, flags=re.IGNORECASE)
    return len(personal_pronouns)

def main():
    # Load stop words, positive words, and negative words
    stop_words = set(stopwords.words('english'))
    
    with open('StopWords/positive-words.txt', 'r') as file:
        positive_words = set(file.read().splitlines())

    with open('StopWords/negative-words.txt', 'r') as file:
        negative_words = set(file.read().splitlines())
    
    # Replace 'YourTextHere' with the actual text you want to analyze
    your_text = 'Output Data Structure.xlsx'
    
    # Cleaning
    cleaned_text = clean_text(your_text, stop_words)
    
    # Sentiment Analysis
    positive_score, negative_score, polarity_score, subjectivity_score = calculate_sentiment_scores(cleaned_text, positive_words, negative_words)
    
    # Readability Analysis
    readability_results = calculate_readability(cleaned_text)
    
    # Output Results
    print(f"Positive Score: {positive_score}")
    print(f"Negative Score: {negative_score}")
    print(f"Polarity Score: {polarity_score}")
    print(f"Subjectivity Score: {subjectivity_score}")
    
    print("\nReadability Analysis:")
    print(f"Average Sentence Length: {readability_results[0]}")
    print(f"Percentage of Complex Words: {readability_results[1]}")
    print(f"Fog Index: {readability_results[2]}")
    print(f"Average Words Per Sentence: {readability_results[3]}")
    print(f"Complex Word Count: {readability_results[4]}")
    print(f"Word Count: {readability_results[5]}")
    print(f"Syllable Per Word: {readability_results[6]}")
    print(f"Personal Pronouns Count: {readability_results[7]}")
    print(f"Average Word Length: {readability_results[8]}")

if __name__ == "__main__":
    main()


Positive Score: 0
Negative Score: 0
Polarity Score: 0.0
Subjectivity Score: 0.0

Readability Analysis:
Average Sentence Length: 2.0
Percentage of Complex Words: 1.0
Fog Index: 1.2000000000000002
Average Words Per Sentence: 2.0
Complex Word Count: 2
Word Count: 2
Syllable Per Word: 5
Personal Pronouns Count: 0
Average Word Length: 5.0
