In [None]:
#1. Standardize emails to avoid capitalization difference
email = "cristache.Adrian@Example.COM"
normalized_email = email.lower()
print(normalized_email)


cristache.adrian@example.com


In [3]:
#2. Comparing values in a list without regard to case

country = "Romania"
if country.lower() == "romania":
    print("Match found")


Match found


In [None]:
#3. Cleaning data from a CSV column before loading into DB

names = ["ALICE", "Bob", "CHARLIE"]
clean_names = [name.lower() for name in names]
print(clean_names)


['alice', 'bob', 'charlie']


In [5]:
#4. Processing mixed-text logs for uniform search

log_entry = "ERROR: Disk Space Low"
if "error" in log_entry.lower():
    print("Error detected in log")


Error detected in log


In [None]:
#5. Creating case-insensitive unique keys

raw_key = "Customer_ID_123"
db_key = raw_key.lower()
print(db_key)


customer_id_123


In [None]:
#6. Generating uppercase country codes for standardized reporting

country_names = ["Romania", "france", "germany"]
country_codes = [name[:3].upper() for name in country_names]
print(country_codes)

['ROM', 'FRA', 'GER']


In [None]:
#7. Normalizing product SKUs before matching with an external API

skus_from_db = ["abc-123", "def-456", "ghi-789"]
normalized_skus = [sku.upper() for sku in skus_from_db]
print(normalized_skus)


['ABC-123', 'DEF-456', 'GHI-789']


In [None]:
#8. Creating uppercase SQL column aliases for consistency

columns = ["customer_id", "order_date", "total_amount"]
sql_select = ", ".join([f"{col} AS {col.upper()}" for col in columns])
print(sql_select)


customer_id AS CUSTOMER_ID, order_date AS ORDER_DATE, total_amount AS TOTAL_AMOUNT


In [None]:
#9.Tagging log entries with uppercase severity levels
log_entries = [
    {"level": "error", "message": "Disk full"},
    {"level": "warning", "message": "Memory usage high"},
]
tagged_logs = [f"[{entry['level'].upper()}] {entry['message']}" for entry in log_entries]
print(tagged_logs)




In [None]:
#10. Creating uppercase identifiers for deduplication in ETL pipelines

raw_ids = ["ab123", "Ab123", "AB124", "ab125"]
unique_ids = list(set([id.upper() for id in raw_ids]))
print(unique_ids)


['AB125', 'AB123', 'AB124']


In [1]:
#10. Formatting customer names imported from inconsistent data sources

raw_names = ["jOHn", "MARY", "alEX"]
formatted_names = [name.capitalize() for name in raw_names]
print(formatted_names)


['John', 'Mary', 'Alex']


In [None]:
#11. Standardizing product category labels for reporting

categories = ["electronics", "FURNITURE", "home appliances"]
standardized_categories = [cat.capitalize() for cat in categories]
print(standardized_categories)


['Electronics', 'Furniture', 'Home appliances']


In [None]:
#12. Cleaning and formatting city names from a CSV before geocoding

city_data = ["BUCHAREST", "cluj-napoca", "IaSi"]
clean_cities = [city.capitalize() for city in city_data]
print(clean_cities)


['Bucharest', 'Cluj-napoca', 'Iasi']


In [None]:
#13. Creating properly capitalized labels in an ETL output file

labels = ["total revenue", "average profit", "net loss"]
output_labels = [label.capitalize() for label in labels]
print(output_labels)


['Total revenue', 'Average profit', 'Net loss']


In [None]:
#14. Formatting API responses for display in dashboards

api_responses = ["success", "FAILED", "pending"]
formatted_status = [status.capitalize() for status in api_responses]
print(formatted_status)


['Success', 'Failed', 'Pending']


In [None]:
#15. Formatting book titles before inserting into a database

book_titles = ["the great gatsby", "to kill a mockingbird", "war and peace"]
formatted_titles = [title.title() for title in book_titles]
print(formatted_titles)


['The Great Gatsby', 'To Kill A Mockingbird', 'War And Peace']


In [None]:
#16. Standardizing multi-word city names for location matching

cities = ["new york", "los angeles", "san francisco"]
standardized_cities = [city.title() for city in cities]
print(standardized_cities)


['New York', 'Los Angeles', 'San Francisco']


In [None]:
#17.Preparing product names for clean display in a dashboard

products = ["apple iphone 14 pro", "samsung galaxy s23 ultra", "sony wh-1000xm5 headphones"]
clean_products = [product.title() for product in products]
print(clean_products)


['Apple Iphone 14 Pro', 'Samsung Galaxy S23 Ultra', 'Sony Wh-1000Xm5 Headphones']


In [None]:
#18. Formatting dataset column names for human-readable reports

columns = ["total sales amount", "average order value", "number of customers"]
readable_columns = [col.title() for col in columns]
print(readable_columns)

['Total Sales Amount', 'Average Order Value', 'Number Of Customers']


In [None]:
#19. Cleaning movie titles scraped from a website before storage

raw_movies = ["lord of the rings: the return of the king", "harry potter and the goblet of fire"]
formatted_movies = [movie.title() for movie in raw_movies]
print(formatted_movies)


['Lord Of The Rings: The Return Of The King', 'Harry Potter And The Goblet Of Fire']


In [12]:
#20. Comparing user input against a reference list in a multilingual dataset

allowed_countries = ["românia", "france", "germany"]
user_input = "ROMÂNIA"
if user_input.casefold() in [country.casefold() for country in allowed_countries]:
    print("Country match found")



Country match found


In [13]:
#21. Deduplicating names with mixed case and diacritics before loading into a database

names = ["André", "andré", "ANDRÉ", "Andre"]
unique_names = list(set([name.casefold() for name in names]))
print(unique_names)
    

['andré', 'andre']


In [None]:
#22. Matching product names from two systems with different casing rules

system_a = ["iPhone 14 Pro", "Samsung Galaxy S23"]
system_b = ["IPHONE 14 PRO", "samsung galaxy s23"]
matches = [p1 for p1 in system_a for p2 in system_b if p1.casefold() == p2.casefold()]
print(matches)


['iPhone 14 Pro', 'Samsung Galaxy S23']


In [17]:
#23.  Searching for keywords in text regardless of case or accents

text = "Sistémul a detectat o Eróare Critică"
if "eroare".casefold() in text.casefold():
    print("Error keyword found")



In [None]:
#24. Cleaning and comparing email domains ignoring case sensitivity
emails = ["John.Doe@Example.com", "alice@EXAMPLE.COM", "bob@example.com"]
unique_domains = list(set([email.split("@")[1].casefold() for email in emails]))
print(unique_domains)


['example.com']


In [None]:
#25.Cleaning and standardizing date formats before loading into a database

dates = ["2025-08-12", "2025/08/12", "2025.08.12"]
clean_dates = [d.replace("/", "-").replace(".", "-") for d in dates]
print(clean_dates)


['2025-08-12', '2025-08-12', '2025-08-12']


In [None]:
#26.Masking sensitive information in log files

csv_data = "Name;Age;Country\nAlice;30;USA\nBob;25;UK"
fixed_csv = csv_data.replace(";", ",")
print(fixed_csv)


Name,Age,Country
Alice,30,USA
Bob,25,UK


In [None]:
#27. Removing unwanted HTML tags from scraped data

html_data = "<div>Hello</div><p>World</p>"
clean_text = html_data.replace("<div>", "").replace("</div>", "").replace("<p>", "").replace("</p>", "")
print(clean_text)

HelloWorld


In [None]:
#28. Updating obsolete product codes in a dataset

products = ["PROD-001-OLD", "PROD-002-OLD", "PROD-003-OLD"]
updated_products = [p.replace("-OLD", "-NEW") for p in products]
print(updated_products)


['PROD-001-NEW', 'PROD-002-NEW', 'PROD-003-NEW']
