In [None]:
# This Python 3 environment comes with many helpful analytics libraries installed
# It is defined by the kaggle/python Docker image: https://github.com/kaggle/docker-python
# For example, here are several helpful packages to load

import numpy as np # linear algebra
import pandas as pd # data processing, CSV file I/O (e.g. pd.read_csv)

# Input data files are available in the read-only "../input/" directory
# For example, running this (by clicking run or pressing Shift+Enter) will list all files under the input directory

import os
# Walk the Kaggle input tree top-down and print the full path of every file,
# one path per line. Directories that contain no files print nothing.
for root, _subdirs, names in os.walk('/kaggle/input'):
    full_paths = (os.path.join(root, name) for name in names)
    for full_path in full_paths:
        print(full_path)

# You can write up to 20GB to the current directory (/kaggle/working/) that gets preserved as output when you create a version using "Save & Run All" 
# You can also write temporary files to /kaggle/temp/, but they won't be saved outside of the current session

<div style="background-color:#121212;color:#e0e0e0;font-family:Arial,Helvetica,sans-serif;padding:20px;line-height:1.6;">
  <h1 style="color:#ff9800;margin-bottom:10px;">📚 Hybrid Learning in AI — SMS Spam Example</h1>

  <p style="margin-bottom:15px;">
    <strong style="color:#4fc3f7;">Hybrid Learning</strong> combines two or more approaches to build a stronger AI system.
    It blends the strengths of different methods, making them work together — much like combining a calculator’s speed 🖩 with a human’s judgment 🧠.
  </p>

  <h2 style="color:#ffcc80;margin-top:20px;">🔹 Why Use Hybrid Learning?</h2>
  <ul style="margin-left:20px;margin-bottom:15px;">
    <li>Better accuracy through synergy of techniques.</li>
    <li>Greater robustness against noisy or unexpected data.</li>
    <li>Flexibility — choose the right tool for the right part of the task.</li>
  </ul>

  <h2 style="color:#ffcc80;margin-top:20px;">🔹 Real-World Examples</h2>
  <ul style="margin-left:20px;margin-bottom:15px;">
    <li>Bank fraud detection using Neural Networks + Rule-based checks.</li>
    <li>Search engines combining Transformer NLP + TF-IDF ranking.</li>
    <li>Medical imaging with CNN predictions + doctor-verified rules.</li>
    <li>AI games blending supervised strategies + reinforcement learning.</li>
    <li>Network security using anomaly detection + classification.</li>
  </ul>

  <h2 style="color:#ffcc80;margin-top:20px;">📂 Our Tutorial Dataset — SMS Spam Collection</h2>
  <p style="margin-bottom:15px;">
    This dataset (<strong style="color:#81d4fa;">~500 KB</strong>) contains spam and ham (not spam) SMS messages.<br>
    <strong>Why it’s perfect:</strong> It is tiny, easy to clean, and fast to train, and the task is relatable.
  </p>

  <h2 style="color:#ffcc80;margin-top:20px;">🛠 Hybrid Plan: TF-IDF Model + Keyword Rules</h2>
  <ol style="margin-left:20px;margin-bottom:15px;">
    <li><strong style="color:#4fc3f7;">ML Component</strong>
      <ul>
        <li>Convert SMS text to numerical vectors with TF-IDF.</li>
        <li>Train a Logistic Regression or Naive Bayes classifier.</li>
      </ul>
    </li>
    <li><strong style="color:#4fc3f7;">Rule-based Component</strong>
      <ul>
        <li>Define a dictionary of common spam words (<em>"free", "win", "click", "offer"</em>).</li>
        <li>If a message contains enough trigger words → predict spam directly.</li>
      </ul>
    </li>
    <li><strong style="color:#4fc3f7;">Hybrid Decision</strong>
      <ul>
        <li>If rules detect high spam risk → final label spam.</li>
        <li>Else → trust ML model output.</li>
      </ul>
    </li>
  </ol>

  <h2 style="color:#ffcc80;margin-top:20px;">📊 Tutorial Workflow</h2>
  <ol style="margin-left:20px;margin-bottom:15px;">
    <li>Dataset exploration — visualize spam vs. ham counts.</li>
    <li>Baseline ML Model — simple TF-IDF + Logistic Regression.</li>
    <li>Design keyword rules — experiment with thresholds.</li>
    <li>Combine outputs — weighted decision or rule priority.</li>
    <li>Evaluate — compare hybrid vs. pure ML performance.</li>
    <li>Conclusion — discuss where hybrid wins.</li>
  </ol>

  <h2 style="color:#ffcc80;margin-top:20px;">💡 Why This Tutorial Works Well</h2>
  <ul style="margin-left:20px;margin-bottom:15px;">
    <li>Lightweight — ideal for live demos and quick iteration.</li>
    <li>Clear step-by-step introduction to hybrid concepts.</li>
    <li>Real-world relevance — SMS spam filtering is everywhere.</li>
  </ul>

  <p style="margin-top:20px;font-style:italic;color:#b0bec5;">
    Tip: Treat Hybrid Learning like mixing coffee and milk ☕ + 🥛 — each can be good alone, but together, they create something smoother.
  </p>
</div>
