In [None]:
# This Python 3 environment comes with many helpful analytics libraries installed
# It is defined by the kaggle/python Docker image: https://github.com/kaggle/docker-python
# For example, here are several helpful packages to load

import numpy as np # linear algebra
import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)

# Input data files are available in the read-only "../input/" directory
# For example, running this (by clicking run or pressing Shift+Enter) will list all files under the input directory

import os
# Enumerate every file beneath the Kaggle input mount, printing one full path per line.
for folder, _, names in os.walk('/kaggle/input'):
    full_paths = (os.path.join(folder, name) for name in names)
    for path in full_paths:
        print(path)

# You can write up to 20GB to the current directory (/kaggle/working/) that gets preserved as output when you create a version using "Save & Run All" 
# You can also write temporary files to /kaggle/temp/, but they won't be saved outside of the current session


Analyzing 2025 AI tool usage trends across text, image, video, and code to uncover adoption patterns and usage frequency

Purpose of the Project

The purpose of this project is to analyze and visualize trends in the adoption and usage of AI tools across different categories such as text, image, video, and code. With the rapid rise of generative AI, organizations and individuals are increasingly relying on these tools, but adoption varies by category, region, and usage frequency.

By cleaning and analyzing the dataset in Kaggle and building an interactive dashboard in Tableau, this project aims to:

- Highlight the most popular AI tools in 2025.

- Compare adoption patterns across different AI categories (text vs. image vs. video vs. code).

- Understand usage frequency trends (occasional vs. daily usage).

- Provide insights into demographics or regions driving adoption.

This project demonstrates the ability to work with both quantitative and categorical survey-style data, apply data wrangling techniques in Python, and present findings in a clear, interactive Tableau dashboard.

In [3]:
import pandas as pd

# -----------------------------
# 1️⃣ Load Dataset
# -----------------------------
df = pd.read_csv("/kaggle/input/ai-tools-usage-dataset-2025/ai_tools_usage_dataset.csv")

# Fail fast when a column the Tableau exports rely on is absent. Without this
# check the notebook would write some of the CSVs and then stop part-way with
# a KeyError raised from inside a groupby call.
required_columns = ["Tool Name", "Category", "Free/Paid", "Launch Date", "Monthly Traffic"]
missing_columns = [col for col in required_columns if col not in df.columns]
if missing_columns:
    raise KeyError(f"Dataset is missing required column(s): {missing_columns}")

# -----------------------------
# 2️⃣ Clean Data
# -----------------------------
# Fill missing numeric values with the column median.
# "Popularity Score" is not used by any export in this cell, so it stays optional.
for col in ["Monthly Traffic", "Popularity Score"]:
    if col in df.columns:
        df[col] = df[col].fillna(df[col].median())

# Parse 'Launch Date' as datetime. errors="coerce" converts unparseable text to
# NaT instead of raising; NaT keys are easy to lose later (groupby excludes NA
# keys by default), so report how many values failed to parse.
launch_raw = df["Launch Date"]
df["Launch Date"] = pd.to_datetime(launch_raw, errors="coerce")
unparsed_dates = int((df["Launch Date"].isna() & launch_raw.notna()).sum())
if unparsed_dates:
    print(f"⚠️ {unparsed_dates} 'Launch Date' value(s) could not be parsed and were set to NaT.")

# -----------------------------
# 3️⃣ Create CSVs for Tableau
# -----------------------------

# Tool Popularity: the 10 tools with the highest total Monthly Traffic
traffic_per_tool = df.groupby("Tool Name")["Monthly Traffic"].sum().reset_index()
ranked_tools = traffic_per_tool.sort_values(by="Monthly Traffic", ascending=False)
tool_popularity = ranked_tools.head(10)
tool_popularity.to_csv("/kaggle/working/tool_popularity.csv", index=False)

# Usage Trends (Monthly Traffic by Launch Date and Category)
# 'Launch Date' is parsed with errors="coerce", so unparseable dates are NaT.
# groupby excludes NA keys by default, which would silently remove those tools'
# traffic from this export; dropna=False keeps them as an explicit null group
# so the totals here reconcile with the other exports.
usage_trends = (
    df.groupby(["Launch Date", "Category"], dropna=False)["Monthly Traffic"]
      .sum()
      .reset_index()
)
usage_trends.to_csv("/kaggle/working/usage_trends.csv", index=False)

# Category Heatmap: mean Monthly Traffic for each (Category, Free/Paid) pair
heatmap_keys = ["Category", "Free/Paid"]
mean_traffic = df.groupby(heatmap_keys)["Monthly Traffic"].mean()
category_heatmap = mean_traffic.reset_index()
category_heatmap.to_csv("/kaggle/working/category_heatmap.csv", index=False)

# Write the full cleaned frame next to the aggregate exports
df.to_csv("/kaggle/working/cleaned_ai_tools_usage_2025.csv", index=False)

# Confirmation banner naming each file written to the working directory
for line in (
    "✅ All CSVs saved in /kaggle/working/:",
    "- tool_popularity.csv",
    "- usage_trends.csv",
    "- category_heatmap.csv",
    "- cleaned_ai_tools_usage_2025.csv",
):
    print(line)


✅ All CSVs saved in /kaggle/working/:
- tool_popularity.csv
- usage_trends.csv
- category_heatmap.csv
- cleaned_ai_tools_usage_2025.csv
