In [1]:
# Downloading libraries for web-scraping
!pip install requests
!pip install beautifulsoup4==4.9.3
!pip install bs4
!pip install html5lib
!pip install num2words
!pip install vaderSentiment

# Importing libraries for web-scraping and tokenization purposes
import requests
import nltk
import pandas as pd
import re
from textblob import TextBlob
from num2words import num2words
from bs4 import BeautifulSoup as bs
from vaderSentiment.vaderSentiment import SentimentIntensityAnalyzer

# The list of common words such as "a", "an", etc.
nltk.download('stopwords')
# Download a collection of popular resources from the NLTK library
nltk.download('popular', quiet=True)
# Sentence tokenization (Splitting a text into individual senteces)
nltk.download('punkt')
# English vocabulary database
nltk.download('wordnet')
# Used for training language models or evaluating nlp algothms
nltk.download('brown')
# Used for performing sentiment analysis on text
nltk.download('vader_lexicon')

from nltk.tokenize import sent_tokenize
from nltk.stem import WordNetLemmatizer
from nltk.sentiment.vader import SentimentIntensityAnalyzer
from nltk.corpus import stopwords
from nltk.stem import SnowballStemmer
from nltk.tokenize import word_tokenize

lemmatizer = WordNetLemmatizer()
analyzer = SentimentIntensityAnalyzer()
stemmer = SnowballStemmer("english")
stop_words = stopwords.words("english")

Collecting beautifulsoup4==4.9.3
  Downloading beautifulsoup4-4.9.3-py3-none-any.whl (115 kB)
[2K     [90m━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━━[0m [32m115.8/115.8 kB[0m [31m2.0 MB/s[0m eta [36m0:00:00[0m
Installing collected packages: beautifulsoup4
  Attempting uninstall: beautifulsoup4
    Found existing installation: beautifulsoup4 4.12.3
    Uninstalling beautifulsoup4-4.12.3:
      Successfully uninstalled beautifulsoup4-4.12.3
[31mERROR: pip's dependency resolver does not currently take into account all the packages that are installed. This behaviour is the source of the following dependency conflicts.
yfinance 0.2.37 requires beautifulsoup4>=4.11.1, but you have beautifulsoup4 4.9.3 which is incompatible.[0m[31m
[0mSuccessfully installed beautifulsoup4-4.9.3
Collecting bs4
  Downloading bs4-0.0.2-py2.py3-none-any.whl (1.2 kB)
Installing collected packages: bs4
Successfully installed bs4-0.0.2
Collecting num2words
  Downloading num2words-0.5.13-py3-none-any.whl (1

[nltk_data] Downloading package stopwords to /root/nltk_data...
[nltk_data]   Unzipping corpora/stopwords.zip.
[nltk_data] Downloading package punkt to /root/nltk_data...
[nltk_data]   Package punkt is already up-to-date!
[nltk_data] Downloading package wordnet to /root/nltk_data...
[nltk_data]   Package wordnet is already up-to-date!
[nltk_data] Downloading package brown to /root/nltk_data...
[nltk_data]   Unzipping corpora/brown.zip.
[nltk_data] Downloading package vader_lexicon to /root/nltk_data...


In [2]:
sentences = []

def scrape_clean (url, div_class):
  # Load the website
  website = requests.get(url).text
  soup = bs(website,'html.parser')

  # Find the div section that is the parent of all paragraphs
  div = soup.find_all('div', attrs={'class':div_class})

  # Get the text from paragraphs
  extracted_text = []
  for div in div:
      paragraphs = div.find_all('p')
      for paragraph in paragraphs:
          extracted_text.append(paragraph.get_text(strip=True))  # Remove leading/trailing whitespace

  # Splitting the text into sentences, remove the stopwords and punctuations, and save the cleaned version in a list
  sentences = []
  for text in extracted_text:
    sentence = sent_tokenize(text)
    for item in sentence:
      # Convert to lowercase
      text_lowercase = item.lower()
      # Remove punctuation
      text_without_punctuation = re.sub(r"[^\w\s]", "", text_lowercase)
      # Remove stopwords and stem words
      tokens = word_tokenize(text_without_punctuation)
      new_tokens = []
      for word in tokens:
        if word.isnumeric():
          word = num2words(word)
          new_tokens.append(lemmatizer.lemmatize(word))
          continue
        elif word not in stop_words:
          new_tokens.append(lemmatizer.lemmatize(word))
          continue
      # Join tokens back into a string
      cleaned_text = " ".join(new_tokens)
      sentences.append(cleaned_text)

  return sentences

In [3]:
def clean(list):    # For websites that don't allow us to do the web scrape
  cleaned = []
  for i in list:
    sentence = sent_tokenize(i)
    for item in sentence:
      # Convert to lowercase
      text_lowercase = item.lower()
      # Remove punctuation
      text_without_punctuation = re.sub(r"[^\w\s]", "", text_lowercase)
      # Remove stopwords and stem words
      tokens = word_tokenize(text_without_punctuation)
      new_tokens = []
      for word in tokens:
        if word.isnumeric():
          word = num2words(word)
          new_tokens.append(lemmatizer.lemmatize(word))
          continue
        elif word not in stop_words:
          new_tokens.append(lemmatizer.lemmatize(word))
          continue
      # Join tokens back into a string
      cleaned_text = " ".join(new_tokens)
      cleaned.append(cleaned_text)
  return cleaned

In [4]:
website1 = 'https://www.oneclickitsolution.com/blog/role-of-artificial-intelligence-in-the-travel-industry/#:~:text=AI%E2%80%99s%20Impact%20on%20Travel%20Industry%201%20ChatBots%3A%20Almost,of%20Artificial%20Intelligence.%20...%204%20Virtual%20Reality%3A%20'
class1 = 'entry-content entry clearfix'
text1 = scrape_clean(website1, class1)
sentences.extend(text1)
print(text1)

['artificial intelligenceenables computer machine mimic human mind perception learning decisionmaking problemsolving capability', 'ai wideranging branch computer science concerned building smart work machine capable performing task typically need human intelligence', 'ai made first appearance year one thousand, nine hundred and sixty-six john mccarthy dartmouth summer research project', 'ai requires four basic element work data program hardware interconnectivity different system', 'ai interdisciplinary science work multiple approach', 'relies big data processing capability multiple algorithm advancement machine learning deep learning creating paradigm shift virtually everytravel technology industrysector', 'ai probably part daily life several way', 'see targeted ad social medium might generated byartificial intelligence', 'ask digital assistant questionartificial intelligenceallows technology search web find helpful useful answer', 'shopping product recommendation favorite music app so

In [5]:
website2 = 'https://framey.io/blog/ai-and-the-future-of-travel-and-tourism/'
class2 = 'content-inner'
text2 = scrape_clean(website2, class2)
sentences.extend(text2)
print(text2)

['ai future travel', 'travel tourism industry poised undergo massive transformation coming year', 'rise artificial intelligence ai possibility traveler tour operator endless', 'ai technology used streamline booking process provide personalized recommendation create even immersive experience guest', 'blog post explore ai shape future travel tourism impact industry whole', 'get inspired start planning next adventure withframeytoday', 'table content', 'ai change travel industry', 'ai rapidly changing face travel tourism industry', 'recent year ai technology implemented almost area industry booking flight accommodation providing personalized recommendation destination', 'addition aidriven system enabled efficient operation hotel airline tourism company resulting better service traveler increased revenue business', 'according report statista ai estimated bring one hundred and forty-three billion revenue global travel tourism industry two thousand and twenty-two', 'growth expected continue a

In [6]:
website3 = 'https://www.forbes.com/sites/rogersands/2023/11/01/how-will-artificial-intelligence-impact-the-travel-industry/'
class3 = 'article-body fs-article fs-responsive-text current-article'
text3 = scrape_clean(website3, class3)
sentences.extend(text3)
print(text3)

['traveler ready put faith ai', 'artificial intelligence commonly known ai longawaited savior human race bane today fastpaced alwayslookingforashortcut society', 'although often without knowledge consent consumer affected ai realize', 'healthcare financial interaction transportation agriculture ai playing major role', 'travel industry immune farreaching tentacle', 'ai impact real travel experience', 'according thenational research groupnrg global data insight firm journalist using ai write online travel guide influencers showing follower plan vacation chatgpt two everyone small travel agency industry giant actively exploring use technology provide smoother safer interactive digital experience customer', 'theory aipowered travel tool could enormously helpful consumer helping take hassle vacation planning offering kind personalized advice previously available could afford service human travel agent', 'traveler really ready put faith ai come complex task like booking flight accommodation 

In [7]:
website4 = 'https://www.accenture.com/us-en/insights/travel/travel-ai-maturity'
class4 = 'root container responsivegrid'
text4 = scrape_clean(website4, class4)
sentences.extend(text4)
print(text4)

['current country united state', 'research report', '5minute read', 'survey travel executivespart extensive crossindustry analysis one thousand, six hundred csuite executive data science leader world largest organizationsreveals travel organization barely scratching surface inai', 'thirteen travel company ai maturity today unlock full potential', 'call ai achiever', 'ai achiever different know success ai science art', 'science algorithm meet art organizational adaptation', 'early success build confidence ai valuedriver broadly estimate across industry ai transformation happen much faster digital transformationon average sixteen month faster', 'mean travel specifically', 'creates clear sense urgency action', 'leader havent forgotten happened travel digital laggard', 'still business today continue play catch', 'growing consensus ai increasingly essential competitive advantage travel', 'ai maturityis mastering set key capability right combination across two category', 'industry ai achieve

In [8]:
website5 = 'https://explore.seeker.io/blog/ai-and-the-travel-industry'
class5 = 'sqs-html-content'
text5 = scrape_clean(website5, class5)
sentences.extend(text5)
print(text5)

['rapidly advancing field artificial intelligence ai revolutionizing various industry thetourism industryis exception', 'whether improvingtravel planning enhancing customer service optimizingmarketing strategy addressing ethical concern ai reshaping way experience engage tourism sector', 'two thousand and twenty-three year ai', 'although artificial intelligence ai around decade launch ofchatgpton november thirty two thousand and twenty-two followed host generative ai tool including google responsebard accelerated adoption artificial intelligence across industry', 'word anyone talking day', 'let take closer look ai potential application impact thetourism industry', 'artificial intelligence often abbreviated ai rapidly advancing field refers development computer system capable performing task would normally require human intelligence', 'ai system designed analyze vast amount data recognize pattern make decision prediction based information', 'ai system designed mimic human cognitive abil

In [9]:
website6 = 'https://www.mckinsey.com/industries/travel-logistics-and-infrastructure/our-insights/what-ai-means-for-travel-now-and-in-the-future'
class6 = 'mdc-o-content-body mck-u-dropcap'
text6 = scrape_clean(website6, class6)
sentences.extend(text6)
print(text6)

['ârevenge travelâitâs lot people daysâhitting runway big number make travel time lost pandemic', 'episode ofthe mckinsey podcast mckinsey partner alex cosmas vik krishnan join global editorial director lucia rahilly discus new report ontravel age ai technologyâs promise pitfall may mean travel industry overall', 'transcript edited clarity length', 'mckinsey podcastis cohosted roberta fusaro lucia rahilly', 'lucia rahillymuch research report drew interview executive seventeen company across five type travel business', 'one executive luca zambello ceo jurnyâan aifueled hospitality platform', 'say ai new normal', 'luca zambelloweâre beginning hockey stick', 'economically start potentially biggest technology disruption humanity ever seen', 'lucia rahillyso everyone talking disruptive juggernaut ai particularly gen ai generative ai', 'superhigh level acknowledging weâre still early day expect mean travel industry particular', 'vik krishnanthe travel industry unquestionably going significan

In [10]:
website7 = 'https://mize.tech/blog/6-examples-of-how-ai-is-used-in-the-travel-industry/'
class7 = 'wprt-container'
text7 = scrape_clean(website7, class7)
sentences.extend(text7)
print(text7)

['ai made advance many industry since invented', 'everchanging travel industry also taking advantage ai revolutionize way operates', 'result nowadays travel company highly leverage aipowered tool solution various process travel planning landing destination', 'article learn ai transformed lucrative travel industry using example application', 'also discus advance ai travel company aware order stay competitive industry', 'artificial intelligenceor ai branch computer science wheremachines computer simulate human intelligence1', 'ai machine programmed think like human perform task human', 'furthermore leverage problemsolving decisionmaking capability human being two', 'ai single technology rapidly evolving collection technology like deep learning machine learning expert system', 'example ai system selfdriving car spaceexploring robot learn experience', 'today ongoing research applicability advanced ai technology likegenerative adversarial networksandedge aiin various industry', 'role ai tou

In [11]:
website8 = 'https://www.revfine.com/artificial-intelligence-travel-industry/'
class8 = 'post-content'
text8 = scrape_clean(website8, class8)
sentences.extend(text8)
print(text8)

['artificial intelligence travel industry refers using ai technology enhance various aspect travel personalized recommendation efficient operation', 'important improves customer experience streamlines booking process optimizes pricing strategy assist predictive analysis making travel efficient tailored individual preference', 'ai role increasingly vital shaping future travel sector', 'table content', 'introduction', 'artificial intelligence constantly improving making reliable attractive business solution', 'particular business thetravel industryare taking advantage ai perform various administrative customer service task', 'learn us benefit artificial intelligence explain changing travel company operate', 'concept artificial intelligence ai often discussed slightly difficult define', 'essentially refers computer machine performing task would normally require human intelligence carry', 'could example learning lesson making decision recognizing interpreting speech', 'artificial intellige

In [12]:
website9 = 'https://startups.epam.com/blog/artificial-intelligence-in-tourism-and-travel-industry'
class9 = 'ArticlePage_mainContent___vpeu'
text9 = scrape_clean(website9, class9)
sentences.extend(text9)
print(text9)

['innovation revolutionized industry artificial intelligence tourism', 'moment virtually every company involved tourism us least one aipowered technology market forecast reaching twelve billion two thousand and twenty-six', 'innovation like natural language processing nlpbig data deep learning also improve quality travel experience', 'article discus relevance artificial intelligence tourism travel industry', 'also focus future prospect ai tourism factor modern user especially gen z millennials', 'ai revolution traveling chore', 'skyscanner could recommend cheap flight target destination airbnb could suggest top accommodation based previous trip fellow tourist could share tip tripadvisor', 'back spend time planning itinerary searching flight sorting several filter find therighthotel', 'ai changed multiple way following innovation', 'planning trip ai assistant help everything booking hotel adding date calendar', 'think ai travel assistant travel agent without actual human end', 'help dat

In [13]:
website10 = 'https://softwarehut.com/blog/business/artificial-intelligence-travel-industry'
class10 = 'blog-article-module--blogArticleContent--1a626'
text10 = scrape_clean(website10, class10)
sentences.extend(text10)
print(text10)

['gone day customer would spend hour looking flight hotel next trip', 'nowadays must ask siri check one many online portalssuch skyscanner', 'client nolonger need call customer service wait long checkin queue either', 'facebook messenger bot livechat airlineâs website', 'solution make travelling seamless experience possible artificial intelligence ai', 'currentlyâmany exist moreâin development', 'bear enormous implication change way travel industry operates saving customer time money mundane task', 'question adapt change use ai competitive advantage business', 'itâs travel industry benefit technology manyexamples use ai everyday life', 'chatbots data analysis facial image speech recognition â example ai implementation', 'whatâs artificial intelligence another buzzword tech world', 'ai implementation already become part business landscape', 'tone industry report changed year sceptical promising', 'ai technology improves business feel confident taking advantage', 'travel industry differe

In [14]:
website11 = 'https://easternpeak.com/blog/ai-use-cases-in-travel-and-hospitality/'
class11 = 'post__text'
text11 = scrape_clean(website11, class11)
sentences.extend(text11)
print(text11)

['expert persistently upgrading artificial intelligence solution making reliable effective instrument numerous sphere', 'tourism sector implementing best ai ml versatile segment', 'modern technology help business owner perform various administrative task offer excellent customer service one hand ensure effortless convenient practice traveler', 'increased deployment ml ai travel industry account enhancing personalization giving valuable advice ensuring speedy response period even employee absent', 'many hotel resort worldwide depend heavily artificial intelligence solution delivering service gaining strong reputation travel ai market projected exceed12 bn two thousand and twenty-six', 'present article cover successful us ml ai travel sector revealing efficient way boost operation within tourismrelated business', 'innovative computer system brought enormous change tourism sphere year ago still causing considerable paradigm shift', 'let closer look ai technology applied different sphere t

In [15]:
website12 = 'https://botshot.ai/resources/blog/how-ai-is-transforming-the-travel-industry'
class12 = 'MuiBox-root css-14l6jdq'
text12 = scrape_clean(website12, class12)
sentences.extend(text12)
print(text12)

['artificial intelligence ai travel industry topic conversation contemporary time', 'here', 'travel tourism industry growing rapidly city restore normalcy pandemic', 'increasing number traveler hospitality industry relying technology serve guest ever', 'result different technology used simplify streamline operation raise guest satisfaction', 'advantage artificial intelligence ai travel industry enormous farreaching', 'transforming way people travel', 'fact according anindustryarc report travel ai market expected exceed twelve bn two thousand and twenty-six', 'blog take way ai penetrated ai impacting travel tourism industry', 'ai changing travel industry sure', 'ai', 'artificial intelligence ai refers computer machine performing task would generally need human intelligence carry', 'simpler word intelligence perceives synthesizes infers information different human living being', 'ai existence long time', 'however necessary advancement recently become reliable enough carry complex task mi

In [16]:
website13 = 'https://inoxoft.com/blog/exploring-ai-use-cases-in-the-travel-industry/'
class13 = 'postContent__content'
text13 = scrape_clean(website13, class13)
sentences.extend(text13)
print(text13)

['light global pandemic transformative impact customer preference work dynamic travel industry undergoing digital renaissance', 'embracing social distancing measure propelled massive digitalization personal professional sphere', 'industry emerges challenge lockdown face task understanding catering new breed customer', 'business travel sector striving create ideal service experience often entail integrating innovative solution regular operation', 'question arises tool company leverage regain competitive edge recover setback endured pandemic', 'answer lie realm artificial intelligence', 'essence ai capability revolutionize every aspect industry', 'aidriven travel planner adept providing flexible scheduling option delivering realtime update notification ensuring maximum satisfaction traveler', 'furthermore aipowered feedback analysis tool invaluable optimizing error detection bug fixing update deployment process within travel domain', 'ai integration travel tourism empowers business custo

In [17]:
website14 = 'https://www.luxurytravelmagazine.com/news-articles/the-revolutionary-role-of-ai-in-the-travel-industry'
class14 = 'entry-content notopmargin'
text14 = scrape_clean(website14, class14)
sentences.extend(text14)
print(text14)

['travel industry dynamic everchanging field continues evolve remarkable way thanks advent cuttingedge technology', 'among technology artificial intelligence ai stand revolutionary force transforming travel industry profound unprecedented way', 'enhancing customer experience improving operational efficiency enabling highly personalized service impact ai nothing short extraordinary', 'ai influence extends beyond traditional travel agency empowering innovative company leveragedsp platformsfor targeted advertising dynamic travel package creation', 'platform fueled aipowered algorithm analyze vast amount data identify reach ideal customer laser precision tailoring travel offering specific need preference', 'intricate dance technology human ingenuity ai transforming travel industry shaping journey individual traveler meaningful unforgettable way', 'post well delve deeper intricacy revolution ofai travel exploring nuanced implication uncovering unexpected challenge arise amidst burst aipower

In [18]:
# Texts that can't be scraped from website
# https://www.weforum.org/agenda/2023/12/how-is-ai-reshaping-the-travel-tourism/
# https://business.booking.com/en-us/business-travel-resources/articles/business-travel-and-aI/?aid=1181029&label=msn-jVw1O*kpnhMQALsGbdeDlQ-80539282677219:tidat-2332339040468841:loc-188:neo:mtb:lp40862:dec:qsai%20in%20travel%20industry&utm_campaign=English_United_Kingdom%20EN%20GB&utm_medium=cpc&utm_source=bing&utm_term=jVw1O*kpnhMQALsGbdeDlQ&msclkid=0b42088af0451fb689e86e983355aca5
# https://amadeus.com/en/insights/themes/artificial-intelligence-travel-industry
# https://www.nytimes.com/2023/03/16/travel/chatgpt-artificial-intelligence-travel-vacation.html

not_scraped = ['In the dynamic landscape of travel, artificial intelligence (AI) stands as a beacon of transformation, reshaping our journey from the moment we decide to explore the world. In building an AI ecosystem for travellers, we have doubled conversion rates, shaped user loyalty and fostered global communities. Beyond streamlined planning, AI innovation redefines the very essence of travel, promising a future marked by efficiency, personalization and global enrichment.',
               'For businesses, AI is used to analyse historical booking patterns, market demand and external factors (e.g. weather and events) to optimize pricing in real time. Dynamic pricing strategies help companies adjust prices to maximize revenue and occupancy rates in hotels. AI is also employed for predictive maintenance in the transportation sector, helping to anticipate and address potential issues with vehicles and aircraft before they cause disruptions.',
               'For consumers, the future of smart travel planning is exemplified by efficiently deciphering complex requests and swiftly directing users to detailed itinerary planning, personalized recommendations and bookings. This is a process we’re continually improving with our travel assistant, eliminating the manual effort of input and filtering searches and making travel planning as effortless as chatting with a friend. TripGenie provides personalized, editable itineraries in less than a minute that would take hours or days to plan manually. It can also handle complex requests, such as multi-destination planning.',
               'During the COVID-19 pandemic, we saw augmented reality (AR) and virtual reality (VR) technologies enhance the travel experience by providing virtual tours, interactive maps and immersive experiences to help travellers explore destinations without actually visiting. A common use of AR is also in translation apps, allowing users to point their smartphones at foreign signs or text. The app then overlays translations onto real-world images, breaking down language barriers for travellers and allowing them to better experience their new environment.',
               'These shared experiences have the potential to deepen the relationship between travellers and travel partners. In our platforms, we have been experimenting with using AI to tap into the stories of travellers, forming algorithmic, AI-powered lists. These lists offer curated information based on user preferences and real-time data, encouraging a vibrant travel ecosystem and strong traveller communities.',
               'AI-powered chatbots and virtual assistants are used for customer service, providing instant responses to queries and assisting with booking processes. These systems can handle routine tasks, such as reservation changes and FAQs, and provide travel recommendations based on user preferences.',
               'Our AI chatbots handle numerous enquiries via text and voice, achieving impressive self-service resolution rates for airline tickets and hotels. This streamlined approach not only saves time and energy for customers, it also accelerates case-solving efficiency, allowing customer service teams to focus on more complex cases.',
               'As we look ahead, the future of AI in travel is poised to focus on efficient and highly personalized solutions tailored to individual travellers needs. This vision signifies the next phase of the travel industry and underscores the profound impact of AI in making travel more convenient, personalized and memorable for everyone.',
               'This AI push aligns with a thriving travel market with domestic and regional tourism experiencing substantial growth. During Chinas Golden Week, the first long holiday since the reopening of borders in 2023, outbound travel volume surged by over 800% compared to the previous year, while domestic tourism grew by nearly 200% this year. Chinas inbound tourism harbours immense potential and if elevated to 1.5% of GDP, it could yield a growth of over RMB 1.3 trillion.',
               'In this new era of travel, we are optimistic. As we continue to evolve in the realm of AI, the possibilities are not just exciting; they are limitless. AI is not merely changing the way we travel; it is revolutionising the very essence of our travel experiences, making them efficient, intuitive and deeply enriching.',
               'The trustworthiness of AI and its features is a complex and evolving concern. While AI technologies have demonstrated remarkable capabilities across many fields, general trustworthiness hinges on the ethical frameworks and structures in place. Issues such as biased algorithms, lack of transparency, and potential misuse of AI raise valid concerns. When it comes to corporate travel, privacy and safety are also essential.',
               'Ultra-personalized travel recommendations – Trust is highest (89%) in AI systems that provide ultra-personalized travel recommendations. Tailored suggestions enhance the overall travel experience, earning the confidence of business travelers.',
               'Real-time language translation services – The reliability of real-time language translation services is a cornerstone of trust (88%). Breaking down language barriers contributes to smoother interactions and increased trust in AI.',
               'Automated expense tracking and reporting – Trust in applications for automated expense tracking and reporting (88%) underscore their importance in the eyes of business travelers.',
               'Enhanced cyber protection – Despite the slightly lower perception of this AI feature, there is a growing level of confidence in enhanced cyber protection tools (78%). Businesses may need to continue to address concerns to build trust in cybersecurity solutions and explore the benefits of these features.',
               'A fascinating correlation emerges when exploring the relationship between interest and trust in AI. The younger generations (18–45 years old) exhibit a higher overall interest in tech features compared to their older counterparts (46 years old and above). Notably, younger professionals show a heightened interest in health and wellness monitoring apps compared to their older counterparts, reiterating the findings of Deliotte’s insights into travel trends. As business travel evolves, embracing AI isn’t just a choice, but a necessity. Understanding the interests, trust levels and preferences of business travelers is pivotal for businesses to offer tailored solutions such as chatbots, and machine learning models for suggesting options for flights, accommodation and car rentals.',
               'We are focused on ways to use artificial intelligence (AI) in the travel industry to better serve our customers, so they can better serve their customers, the end travelers. We see AI as a key enabler in making the overall travel experience smoother while helping travel players improve their businesses. AI is currently being integrated into many of our solutions. For example, for our airline customers, we have a dedicated team of Amadeus AI and machine learning (ML) experts working to support areas such as revenue management optimization, merchandising, and other business areas. We also have AI capabilities in distribution, airports, and hospitality, covering virtually all segments of the travel industry.',
               'To complement the different AI teams that focus on our travel solutions (e.g., airlines), we also have a dedicated research team composed of experimental research scientists and engineers. The mission of this team is to better understand travelers to enable smarter, seamless, and more sustainable travel experiences with AI. Our researchers deliver academic publications and push the boundaries of AI knowledge in travel. Their innovations are put into production with different Amadeus products and services using the latest machine learning models. We also have open self-service AI APIs for developers in the travel industry.',
               'We are continuously researching the behaviors of travelers to understand their motivations to travel. By doing so, we can better propose offers that might enrich their experience or alternatives that could improve their journey and satisfaction.',
               'By analyzing behaviors, segmenting, and clustering travelers, we can predict their actions leveraging AI technologies. For example, we are looking at choice modeling to predict what travelers will most likely choose when presented with different alternatives.',
               'We are working to create smooth and frictionless experiences for travelers by improving the efficiency of various travel related processes. An example of this is using AI to help optimize passenger processing at airports or accurately forecasting the amount of luggage in an aircraft.',
               'The travel industry may never be the same. Already, travelers can “converse” with the system, sharing information like a destination, time of year and interests, and getting back a personalized itinerary festooned with vivid descriptions. A reporter’s recent request for a two-day itinerary to Whistler, British Columbia, yielded ideas like snowshoeing with a guide who will point out the local flora and fauna, and taking a dog-sled ride “with a team of beautiful huskies” for a winter trip. Given additional parameters, ChatGPT will update its suggestions, so adding a preference for Thai food to the Whistler conversation prompted the system to give new restaurant suggestions. But ChatGPT does have limitations. First, its information base currently does not go beyond 2021, and it does not have access to important travel-related data that can change from moment to moment, like airline schedules and weather forecasts. New versions are being developed, including a major upgrade released this week, and are expected to keep improving. Also, the software doesn’t always know the difference between reliable and unreliable information on the internet, so it can offer answers that are untrue. ChatGPT’s maker, OpenAI, also warns that the software may occasionally produce “biased content.” Anyone can use the software, which is free and accessible via the OpenAI website. Tourist bureaus can ask ChatGPT to write marketing copy describing must-see sites, and travel advisers can use it to compose emails to their clients and create social media posts. Airline, hotel and rental car companies could use it to help their virtual agents answer a wider variety of questions. One travel adviser said she used ChatGPT to write a “firm but friendly breakup letter” to a client with whom she no longer wanted to work. The adviser had to rewrite the prompt — the term for a ChatGPT question or command — a few times to get what she wanted, but in the end it worked. “My client said she understood and wasn’t mad at me,” said the adviser, who asked to remain anonymous because she did not want her former client to know that ChatGPT had written the letter.',
               ]
cleaned = clean(not_scraped)
sentences.extend(cleaned)
print(cleaned)

['dynamic landscape travel artificial intelligence ai stand beacon transformation reshaping journey moment decide explore world', 'building ai ecosystem traveller doubled conversion rate shaped user loyalty fostered global community', 'beyond streamlined planning ai innovation redefines essence travel promising future marked efficiency personalization global enrichment', 'business ai used analyse historical booking pattern market demand external factor eg', 'weather event optimize pricing real time', 'dynamic pricing strategy help company adjust price maximize revenue occupancy rate hotel', 'ai also employed predictive maintenance transportation sector helping anticipate address potential issue vehicle aircraft cause disruption', 'consumer future smart travel planning exemplified efficiently deciphering complex request swiftly directing user detailed itinerary planning personalized recommendation booking', 'process continually improving travel assistant eliminating manual effort input 

In [19]:
for i in sentences:
  print(f'{i}\n')

artificial intelligenceenables computer machine mimic human mind perception learning decisionmaking problemsolving capability

ai wideranging branch computer science concerned building smart work machine capable performing task typically need human intelligence

ai made first appearance year one thousand, nine hundred and sixty-six john mccarthy dartmouth summer research project

ai requires four basic element work data program hardware interconnectivity different system

ai interdisciplinary science work multiple approach

relies big data processing capability multiple algorithm advancement machine learning deep learning creating paradigm shift virtually everytravel technology industrysector

ai probably part daily life several way

see targeted ad social medium might generated byartificial intelligence

ask digital assistant questionartificial intelligenceallows technology search web find helpful useful answer

shopping product recommendation favorite music app social medium friend s

In [20]:
# Use Vader library to get the polarity of the sentence
def getPolarity(text):
    polarity = SentimentIntensityAnalyzer().polarity_scores(text)
    if polarity['compound'] > 0:
      sentiment = 'postive'
    elif polarity['compound'] < 0:
      sentiment = 'negative'
    else:
      sentiment = 'neutral'
    return sentiment,polarity

In [21]:
data = []  # List to store dictionaries
for sentence in sentences:
  sentiment, polarity = getPolarity(sentence)
  new_item = {'sentence' : sentence, 'sentiment' : sentiment, 'category' : 'Travel'}
  data.append(new_item)

df = pd.DataFrame(data)

In [23]:
df.to_csv('Travel data (no numbers) - Vader ver.csv', index=False)