diff --git a/.github/actions/demo-notebook/action.yml b/.github/actions/demo-notebook/action.yml
index 1018155ed8..d2833736c4 100644
--- a/.github/actions/demo-notebook/action.yml
+++ b/.github/actions/demo-notebook/action.yml
@@ -37,15 +37,15 @@ runs:
           exit 1
         fi
 
-    - name: Execute ONLY the ValidMind for model development series with heap development
+    - name: Execute ONLY the ValidMind for development series with heap development
       shell: bash
       if: ${{ steps.find_dev_env.outcome == 'success' }}
       run: |
           cd site
           cp ../${{ inputs.dev_env }} ../.env
           source ../.env
-          quarto render --profile exe-demo notebooks/EXECUTED/model_development &> render_errors.log || {
-            echo "Execute for ValidMind for model development series failed";
+          quarto render --profile exe-demo notebooks/EXECUTED/development &> render_errors.log || {
+            echo "Execute for ValidMind for development series failed";
             cat render_errors.log;
             exit 1;
           }
@@ -59,15 +59,15 @@ runs:
           exit 1
         fi
 
-    - name: Execute ONLY the ValidMind for model validation series with heap development
+    - name: Execute ONLY the ValidMind for validation series with heap development
       shell: bash
       if: ${{ steps.find_valid_env.outcome == 'success' }}
       run: |
           cd site
           cp ../${{ inputs.valid_env }} ../.env
           source ../.env
-          quarto render --profile exe-demo notebooks/EXECUTED/model_validation &> render_errors.log || {
-            echo "Execute for ValidMind for model validation series failed";
+          quarto render --profile exe-demo notebooks/EXECUTED/validation &> render_errors.log || {
+            echo "Execute for ValidMind for validation series failed";
             cat render_errors.log;
             exit 1;
           }
\ No newline at end of file
diff --git a/.github/actions/prod-notebook/action.yml b/.github/actions/prod-notebook/action.yml
index e18a2e802c..c75c309d94 100644
--- a/.github/actions/prod-notebook/action.yml
+++ b/.github/actions/prod-notebook/action.yml
@@ -37,15 +37,15 @@ runs:
           exit 1
         fi
 
-    - name: Execute ONLY the ValidMind for model development series with heap production
+    - name: Execute ONLY the ValidMind for development series with heap production
       shell: bash
       if: ${{ steps.find_dev_env.outcome == 'success' }}
       run: |
           cd site
           cp ../${{ inputs.dev_env }} ../.env
           source ../.env
-          quarto render --profile exe-prod notebooks/EXECUTED/model_development &> render_errors.log || {
-            echo "Execute for ValidMind for model development series failed";
+          quarto render --profile exe-prod notebooks/EXECUTED/development &> render_errors.log || {
+            echo "Execute for ValidMind for development series failed";
             cat render_errors.log;
             exit 1;
           }
@@ -59,15 +59,15 @@ runs:
           exit 1
         fi
 
-    - name: Execute ONLY the ValidMind for model validation series with heap production
+    - name: Execute ONLY the ValidMind for validation series with heap production
       shell: bash
       if: ${{ steps.find_valid_env.outcome == 'success' }}
       run: |
           cd site
           cp ../${{ inputs.valid_env }} ../.env
           source ../.env
-          quarto render --profile exe-prod notebooks/EXECUTED/model_validation &> render_errors.log || {
-            echo "Execute for ValidMind for model validation series failed";
+          quarto render --profile exe-prod notebooks/EXECUTED/validation &> render_errors.log || {
+            echo "Execute for ValidMind for validation series failed";
             cat render_errors.log;
             exit 1;
           }
diff --git a/.github/actions/staging-notebook/action.yml b/.github/actions/staging-notebook/action.yml
index 0d8e967ddd..698dd86dcd 100644
--- a/.github/actions/staging-notebook/action.yml
+++ b/.github/actions/staging-notebook/action.yml
@@ -37,15 +37,15 @@ runs:
           exit 1
         fi
 
-    - name: Execute ONLY the ValidMind for model development series with heap staging
+    - name: Execute ONLY the ValidMind for development series with heap staging
       shell: bash
       if: ${{ steps.find_dev_env.outcome == 'success' }}
       run: |
           cd site
           cp ../${{ inputs.dev_env }} ../.env
           source ../.env
-          quarto render --profile exe-staging notebooks/EXECUTED/model_development &> render_errors.log || {
-            echo "Execute for ValidMind for model development series failed";
+          quarto render --profile exe-staging notebooks/EXECUTED/development &> render_errors.log || {
+            echo "Execute for ValidMind for development series failed";
             cat render_errors.log;
             exit 1;
           }
@@ -59,15 +59,15 @@ runs:
           exit 1
         fi
 
-    - name: Execute ONLY the ValidMind for model validation series with heap staging
+    - name: Execute ONLY the ValidMind for validation series with heap staging
       shell: bash
       if: ${{ steps.find_valid_env.outcome == 'success' }}
       run: |
           cd site
           cp ../${{ inputs.valid_env }} ../.env
           source ../.env
-          quarto render --profile exe-staging notebooks/EXECUTED/model_validation &> render_errors.log || {
-            echo "Execute for ValidMind for model validation series failed";
+          quarto render --profile exe-staging notebooks/EXECUTED/validation &> render_errors.log || {
+            echo "Execute for ValidMind for validation series failed";
             cat render_errors.log;
             exit 1;
           }
diff --git a/.github/workflows/deploy-docs-prod.yaml b/.github/workflows/deploy-docs-prod.yaml
index 24697c2f30..cce53a8fd1 100644
--- a/.github/workflows/deploy-docs-prod.yaml
+++ b/.github/workflows/deploy-docs-prod.yaml
@@ -75,10 +75,8 @@ jobs:
         with:
           version: ${{ vars.QUARTO_VERSION }}
 
-      - name: Install Poetry
-        run: |
-          curl -sSL https://install.python-poetry.org | python3 -
-          echo "$HOME/.local/bin" >> $GITHUB_PATH
+      - name: Set up uv
+        uses: astral-sh/setup-uv@v5
 
       - name: Generate Python library docs
         run: |
@@ -91,8 +89,7 @@ jobs:
 
       - name: Generate template schema docs
         run: |
-          pip install json-schema-for-humans
-          BACKEND_ROOT=site/_source/backend python scripts/generate_template_schema_docs.py
+          BACKEND_ROOT=site/_source/backend uv run --with json-schema-for-humans python scripts/generate_template_schema_docs.py
 
       - name: Populate installation
         run: cp -r site/_source/installation/site/installation site/installation
diff --git a/.github/workflows/deploy-docs-staging.yaml b/.github/workflows/deploy-docs-staging.yaml
index 4c8f8fb69b..158faaff7a 100644
--- a/.github/workflows/deploy-docs-staging.yaml
+++ b/.github/workflows/deploy-docs-staging.yaml
@@ -75,10 +75,8 @@ jobs:
         with:
           version: ${{ vars.QUARTO_VERSION }}
 
-      - name: Install Poetry
-        run: |
-          curl -sSL https://install.python-poetry.org | python3 -
-          echo "$HOME/.local/bin" >> $GITHUB_PATH
+      - name: Set up uv
+        uses: astral-sh/setup-uv@v5
 
       - name: Generate Python library docs
         run: |
@@ -91,8 +89,7 @@ jobs:
 
       - name: Generate template schema docs
         run: |
-          pip install json-schema-for-humans
-          BACKEND_ROOT=site/_source/backend python scripts/generate_template_schema_docs.py
+          BACKEND_ROOT=site/_source/backend uv run --with json-schema-for-humans python scripts/generate_template_schema_docs.py
 
       - name: Populate installation
         run: cp -r site/_source/installation/site/installation site/installation
diff --git a/.github/workflows/execute-pr-preview.yaml b/.github/workflows/execute-pr-preview.yaml
index 7fcd1d9675..a1b93b3fa8 100644
--- a/.github/workflows/execute-pr-preview.yaml
+++ b/.github/workflows/execute-pr-preview.yaml
@@ -76,7 +76,7 @@ jobs:
         echo VM_API_MODEL=${{ secrets.PLATFORM_VALID_MODEL }} >> valid.env
 
     # Only execute the demo notebooks for training if .env files are created
-    - name: Execute demo ValidMind for model development and validation series
+    - name: Execute demo ValidMind for development and validation series
       if: ${{ vars.ENABLE_DEMO_NOTEBOOK == 'true' && steps.create_dev_env.outcome == 'success' && steps.create_valid_env.outcome == 'success' }}
       uses: ./.github/actions/demo-notebook
       id: execute_demo_notebook
@@ -99,8 +99,8 @@ jobs:
       with:
         script: |
           const base = `https://docs-staging.validmind.ai/pr_previews/${{ github.head_ref }}`;
-          const devUrl = `${base}/notebooks/EXECUTED/model_development/1-set_up_validmind.html`;
-          const valUrl = `${base}/notebooks/EXECUTED/model_validation/1-set_up_validmind_for_validation.html`;
+          const devUrl = `${base}/notebooks/EXECUTED/development/1-set_up_validmind.html`;
+          const valUrl = `${base}/notebooks/EXECUTED/validation/1-set_up_validmind_for_validation.html`;
 
           // Delete old preview comments
           const { data: comments } = await github.rest.issues.listComments({
@@ -120,8 +120,8 @@ jobs:
 
           let comment = `## Execute training notebooks for PRs\n\n`;
           comment += `✓ INFO: Live previews are available —\n\n`;
-          comment += `- [Open model development series](${devUrl})\n`;
-          comment += `- [Open model validation series](${valUrl})\n`;
+          comment += `- [Open development series](${devUrl})\n`;
+          comment += `- [Open validation series](${valUrl})\n`;
 
           await github.rest.issues.createComment({
             owner: context.repo.owner,
diff --git a/.github/workflows/execute-prod.yaml b/.github/workflows/execute-prod.yaml
index 5fa62313da..93d3f9b049 100644
--- a/.github/workflows/execute-prod.yaml
+++ b/.github/workflows/execute-prod.yaml
@@ -59,7 +59,7 @@ jobs:
           echo VM_API_MODEL=${{ secrets.PLATFORM_VALID_MODEL }} >> valid.env
 
       # Only execute the production notebooks for training if .env files are created
-      - name: Execute production ValidMind for model development and validation series
+      - name: Execute production ValidMind for development and validation series
         if: ${{ steps.create_dev_env.outcome == 'success' && steps.create_valid_env.outcome == 'success' }}
         uses: ./.github/actions/prod-notebook
         id: execute-prod-notebook
diff --git a/.github/workflows/execute-staging.yaml b/.github/workflows/execute-staging.yaml
index b0b88b1d81..d692e5d149 100644
--- a/.github/workflows/execute-staging.yaml
+++ b/.github/workflows/execute-staging.yaml
@@ -59,7 +59,7 @@ jobs:
           echo VM_API_MODEL=${{ secrets.PLATFORM_VALID_MODEL }} >> valid.env
 
       # Only execute the staging notebooks for training if .env files are created
-      - name: Execute staging ValidMind for model development and validation series
+      - name: Execute staging ValidMind for development and validation series
         if: ${{ steps.create_dev_env.outcome == 'success' && steps.create_valid_env.outcome == 'success' }}
         uses: ./.github/actions/staging-notebook
         id: execute-staging-notebook
diff --git a/.github/workflows/lighthouse-check.yaml b/.github/workflows/lighthouse-check.yaml
index d96685de1c..de78a2ce5d 100644
--- a/.github/workflows/lighthouse-check.yaml
+++ b/.github/workflows/lighthouse-check.yaml
@@ -1,598 +1,421 @@
 name: Lighthouse check
 
 on:
-  pull_request:
-    types: [opened, synchronize, ready_for_review]
+  workflow_dispatch:
+    inputs:
+      mode:
+        description: "Audit mode"
+        required: true
+        default: "changed"
+        type: choice
+        options:
+          - "changed"
+          - "depth"
+      depth:
+        description: "Sitemap depth when mode is depth (0–2)"
+        required: true
+        default: "0"
+        type: choice
+        options:
+          - "0"
+          - "1"
+          - "2"
+      pr_number:
+        description: "Pull request number to audit"
+        required: true
+        type: string
 
 permissions:
+  contents: read
   issues: write
   pull-requests: write
-
-env:
-  # To change the default depth level:
-  # 0 — Top-level navigation only (e.g. /index.html, /guide/guides.html, /developer/validmind-library.html, etc.)
-  # 1 — All first-level subdirectories (e.g. /guide/*.html)
-  # 2 — All second-level subdirectories (e.g. /guide/attestation/*.html)
-  # Note: While the crawler technically supports deeper levels, expect the workflow to take >2-12 hours to complete
-  DEFAULT_DEPTH: '0'
+  actions: read
 
 jobs:
   lighthouse:
     runs-on: ubuntu-latest
-    if: github.event.pull_request.draft == false
+    if: github.event_name == 'workflow_dispatch'
     steps:
-    - name: Wait for validation workflow to complete
-      uses: actions/github-script@v6
-      with:
-        script: |
-          const maxWaitTime = 45 * 60 * 1000; // 45 minutes in milliseconds
-          const pollInterval = 60 * 1000; // 60 seconds in milliseconds
-          const startTime = Date.now();
-          
-          console.log(`Waiting for "Validate docs site" workflow to complete for PR #${context.issue.number}`);
-          console.log(`Head SHA: ${context.payload.pull_request.head.sha}`);
-          
-          while (Date.now() - startTime < maxWaitTime) {
-            try {
-              // Get workflow runs for the validate-docs-site workflow
-              const { data: runs } = await github.rest.actions.listWorkflowRunsForRepo({
-                owner: context.repo.owner,
-                repo: context.repo.repo,
-                workflow_id: 'validate-docs-site.yaml',
-                head_sha: context.payload.pull_request.head.sha,
-                per_page: 5
+      - name: Resolve PR context
+        id: pr
+        uses: actions/github-script@v6
+        with:
+          script: |
+            const owner = context.repo.owner;
+            const repo = context.repo.repo;
+
+            async function getPr(prNumber) {
+              const { data: pr } = await github.rest.pulls.get({
+                owner,
+                repo,
+                pull_number: prNumber,
               });
-              
-              console.log(`Found ${runs.workflow_runs.length} workflow runs for this commit`);
-              
-              if (runs.workflow_runs.length > 0) {
-                // Get the most recent run
-                const latestRun = runs.workflow_runs[0];
-                console.log(`Latest run: ${latestRun.id}, status: ${latestRun.status}, conclusion: ${latestRun.conclusion}`);
-                
-                if (latestRun.status === 'completed') {
-                  if (latestRun.conclusion === 'success') {
-                    console.log('✅ Validation workflow completed successfully');
-                    break;
-                  } else {
-                    throw new Error(`❌ Validation workflow failed with conclusion: ${latestRun.conclusion}`);
-                  }
-                } else if (latestRun.status === 'in_progress' || latestRun.status === 'queued') {
-                  console.log(`⏳ Validation workflow is ${latestRun.status}, continuing to wait...`);
-                } else {
-                  console.log(`⚠️  Unexpected status: ${latestRun.status}`);
-                }
-              } else {
-                console.log('⏳ No workflow runs found yet, validation may not have started...');
+              if (pr.draft) {
+                core.setFailed('Skipping Lighthouse for draft PR');
+                return null;
               }
-              
-              console.log(`Elapsed time: ${Math.round((Date.now() - startTime) / 1000 / 60)} minutes`);
-              await new Promise(resolve => setTimeout(resolve, pollInterval));
-              
-            } catch (error) {
-              console.error('Error checking workflow status:', error);
-              throw error;
+              const labels = (pr.labels || []).map(l => l.name);
+              const fullAudit = labels.includes('lighthouse:full');
+              return {
+                number: pr.number,
+                head_ref: pr.head.ref,
+                head_sha: pr.head.sha,
+                base_ref: pr.base.ref,
+                full_audit: fullAudit,
+              };
             }
+
+            const prNumber = parseInt(context.payload.inputs.pr_number, 10); // read from the event payload; never template inputs into script source
+            const info = await getPr(prNumber);
+            if (!info) return;
+
+            let mode = context.payload.inputs.mode; // 'changed' or 'depth'
+            let depth = context.payload.inputs.depth; // '0', '1' or '2' (string)
+            if (info.full_audit && mode === 'changed') {
+              mode = 'depth';
+              depth = '2';
+            }
+
+            core.setOutput('number', String(info.number));
+            core.setOutput('head_ref', info.head_ref);
+            core.setOutput('head_sha', info.head_sha);
+            core.setOutput('base_ref', info.base_ref);
+            core.setOutput('mode', mode);
+            core.setOutput('depth', depth);
+            core.setOutput('full_audit', String(info.full_audit));
+
+      - name: Check out repository
+        uses: actions/checkout@v4
+        with:
+          ref: ${{ steps.pr.outputs.head_sha }}
+          fetch-depth: 0
+
+      - name: Set environment
+        env:  # PR-controlled values go through env, never inline in the script (shell injection)
+          HEAD_REF: ${{ steps.pr.outputs.head_ref }}
+          HEAD_SHA: ${{ steps.pr.outputs.head_sha }}
+        run: |
+          printf '%s\n' "PREVIEW_URL=https://docs-staging.validmind.ai/pr_previews/$HEAD_REF" "COMMIT_SHA=$HEAD_SHA" >> "$GITHUB_ENV"
+          echo "COMMIT_SHA_SHORT=$(printf '%s' "$HEAD_SHA" | cut -c1-7)" >> "$GITHUB_ENV"
+          printf '%s\n' "LIGHTHOUSE_MODE=${{ steps.pr.outputs.mode }}" "LIGHTHOUSE_DEPTH=${{ steps.pr.outputs.depth }}" "PR_NUMBER=${{ steps.pr.outputs.number }}" >> "$GITHUB_ENV"
+
+      - name: Check for PR preview URL
+        id: check_preview
+        run: |
+          check_url() {
+            local url=$1
+            local status
+            status=$(curl -s -o /dev/null -w "%{http_code}" -I -A "Mozilla/5.0" "$url")
+            echo "Checking $url — status: $status"
+            [ "$status" -eq 200 ]
           }
-          
-          // Check if we timed out
-          if (Date.now() - startTime >= maxWaitTime) {
-            throw new Error('⏰ Timed out waiting for validation workflow to complete');
-          }
-          
-    - name: Check out repository
-      uses: actions/checkout@v4
-
-    - name: Get commit SHA
-      id: get_sha
-      run: |
-        echo "COMMIT_SHA=$(git rev-parse HEAD)" >> $GITHUB_ENV
-        echo "COMMIT_SHA_SHORT=$(git rev-parse --short HEAD)" >> $GITHUB_ENV
-
-    - name: Set PR preview URL
-      id: set_url
-      run: |
-        echo "PREVIEW_URL=https://docs-staging.validmind.ai/pr_previews/${{ github.head_ref }}" >> $GITHUB_ENV
-        echo "DEPTH=${{ env.DEFAULT_DEPTH }}" >> $GITHUB_ENV
-
-    - name: Check for PR preview URL and sitemap
-      id: check_preview
-      run: |
-        # Function to check if URL returns HTTP 200
-        check_url() {
-          local url=$1
-          local status
-          status=$(curl -s -o /dev/null -w "%{http_code}" -I -A "Mozilla/5.0" "$url")
-          echo "Checking $url — status: $status"
-          [ "$status" -eq 200 ]
-        }
-    
-        echo "Waiting for preview site to become available ..."
-        for i in {1..60}; do
-          if check_url "$PREVIEW_URL/index.html"; then
-            echo "Info: Preview site is now available"
-            break
+
+          echo "Waiting for preview site to become available ..."
+          for i in $(seq 1 30); do
+            if check_url "$PREVIEW_URL/index.html"; then
+              echo "Info: Preview site is now available"
+              break
+            fi
+            if [ "$i" -eq 30 ]; then
+              echo "Error: Preview URL did not become available after 30 minutes"
+              exit 1
+            fi
+            echo "Attempt $i/30: waiting 1 minute..."
+            sleep 60
+          done
+
+          if ! check_url "$PREVIEW_URL/sitemap.xml"; then
+            echo "Error: Sitemap missing at $PREVIEW_URL/sitemap.xml"
+            exit 1
           fi
-    
-          if [ $i -eq 60 ]; then
-            echo "Error: Preview URL did not become available after 60 minutes at $PREVIEW_URL/index.html"
+
+          echo "preview_exists=true" >> $GITHUB_OUTPUT
+
+      - name: Install Python dependencies
+        if: steps.check_preview.outputs.preview_exists == 'true'
+        run: |
+          python -m pip install --upgrade pip
+          pip install requests
+
+      - name: Generate URLs to check
+        if: steps.check_preview.outputs.preview_exists == 'true'
+        id: generate_urls
+        env:
+          INSTALLATION_USER: ${{ secrets.INSTALLATION_USER }}
+          INSTALLATION_PW: ${{ secrets.INSTALLATION_PW }}
+        run: |
+          cd site/scripts
+          python lighthouse_urls.py \
+            --mode "$LIGHTHOUSE_MODE" \
+            --base-ref "${{ steps.pr.outputs.base_ref }}" \
+            --depth "$LIGHTHOUSE_DEPTH" \
+            --preview-url "$PREVIEW_URL" \
+            --output ../../lhci-urls.txt \
+            --metadata ../../lighthouse-metadata.json \
+            --skip-file ../../lighthouse-skip.txt
+
+          if [ -f ../../lighthouse-skip.txt ]; then
+            echo "skip=true" >> $GITHUB_OUTPUT
+            echo "No site pages to audit in this PR."
+            exit 0
+          fi
+
+          if [ ! -s ../../lhci-urls.txt ]; then
+            echo "Error: No URLs were generated."
             exit 1
           fi
-    
-          echo "Attempt $i/60: Preview site not ready yet, waiting 1 minute..."
-          sleep 60
-        done
-    
-        if ! check_url "$PREVIEW_URL/sitemap.xml"; then
-          echo "Error: Sitemap does not exist at $PREVIEW_URL/sitemap.xml"
-          exit 1
-        fi
-    
-        echo "Debug: Checking installation page with URL-based auth..."
-        auth_url="https://${{ secrets.INSTALLATION_USER }}:${{ secrets.INSTALLATION_PW }}@docs-staging.validmind.ai/pr_previews/${{ github.head_ref }}/installation/index.html"
-        status=$(curl -s -o /dev/null -w "%{http_code}" -I -A "Mozilla/5.0" --anyauth "$auth_url")
-        echo "Checking $auth_url — status: $status"
-        if [ "$status" -ne 200 ]; then
-          echo "Error: Installation page is not accessible with authentication at $auth_url"
-          exit 1
-        fi
-    
-        echo "Info: Successfully accessed password-protected installation page"
-    
-        echo "preview_exists=true" >> $GITHUB_OUTPUT
-
-    - name: Install Lighthouse CI
-      if: steps.check_preview.outputs.preview_exists == 'true'
-      run: npm install -g @lhci/cli
-
-    - name: Install required Python packages
-      if: steps.check_preview.outputs.preview_exists == 'true'
-      run: |
-        python -m pip install --upgrade pip
-        pip install requests beautifulsoup4
-
-    - name: Generate URLs to check
-      if: steps.check_preview.outputs.preview_exists == 'true'
-      id: generate_urls
-      run: |
-        BASE_URL="$PREVIEW_URL"
-        
-        # Create a Python script to crawl the site
-        cat > crawl.py << 'EOF'
-        import requests
-        from bs4 import BeautifulSoup
-        import sys
-        from urllib.parse import urljoin, urlparse
-        import json
-        import xml.etree.ElementTree as ET
-        import base64
-        import os
-
-        # Define root pages to check
-        ROOT_PAGES = [
-            "index.html",
-            "get-started/get-started.html",
-            "guide/guides.html",
-            "developer/validmind-library.html",
-            "support/support.html",
-            "releases/all-releases.html",
-            "training/training.html"
-        ]
-
-        def get_auth_headers():
-            # Only use auth for installation pages
-            if 'installation/' in url:
-                # Create auth headers from environment variables
-                auth_string = base64.b64encode(f"{os.environ['INSTALLATION_USER']}:{os.environ['INSTALLATION_PW']}".encode()).decode()
-                return {"Authorization": f"Basic {auth_string}"}
-            return {}
-
-        def get_url_depth(url):
-            # Parse the URL to get just the path
-            path = urlparse(url).path
-            # Remove .html extension for depth calculation
-            path = path.replace('.html', '')
-            # Remove any leading/trailing slashes
-            path = path.strip('/')
-            
-            # Split into segments and count non-empty ones
-            segments = [x for x in path.split('/') if x]
-            
-            # For PR preview URLs, we need to skip the first 5 segments:
-            # /pr_previews/username/branch/name/
-            if 'pr_previews' in path:
-                # Skip the first 5 segments (pr_previews/username/branch/name/)
-                segments = segments[5:]
-            
-            # Debug the depth calculation
-            # print(f"URL depth calculation - Path: {path}, Segments: {segments}, Depth: {len(segments)}", file=sys.stderr)
-            
-            return len(segments)
-
-        def get_urls_from_sitemap(sitemap_url, max_depth):
-            try:
-                print(f"Fetching sitemap from {sitemap_url}", file=sys.stderr)
-                # Don't use auth for sitemap
-                response = requests.get(sitemap_url)
-                print(f"Sitemap response status: {response.status_code}", file=sys.stderr)
-                if response.status_code == 200:
-                    print(f"Sitemap content: {response.text[:500]}...", file=sys.stderr)
-                    root = ET.fromstring(response.content)
-                    # Get all URLs from sitemap
-                    all_urls = set()
-                    
-                    for url in root.findall('.//{http://www.sitemaps.org/schemas/sitemap/0.9}url'):
-                        loc = url.find('{http://www.sitemaps.org/schemas/sitemap/0.9}loc')
-                        if loc is not None:
-                            full_url = loc.text
-                            parsed_url = urlparse(full_url)
-                            
-                            # Extract the path part after the base URL
-                            path = parsed_url.path
-                            # Remove leading slash if present
-                            path = path.lstrip('/')
-                            
-                            # Only include .html files
-                            if path.endswith('.html'):
-                                # Check depth
-                                if get_url_depth(path) <= max_depth:
-                                    # Remove any segments that match the PR preview path
-                                    segments = path.split('/')
-                                    # Keep only the segments after the PR preview path
-                                    pr_preview_index = -1
-                                    for i, segment in enumerate(segments):
-                                        if segment == 'pr_previews':
-                                            pr_preview_index = i
-                                            break
-                                    if pr_preview_index >= 0:
-                                        segments = segments[pr_preview_index + 4:]  # Skip pr_previews/username/branch/name
-                                    path = '/'.join(segments)
-                                    all_urls.add(path)
-                                    print(f"Found URL in sitemap: {path}", file=sys.stderr)
-                    
-                    print(f"Found {len(all_urls)} URLs in sitemap:", file=sys.stderr)
-                    for url in sorted(all_urls):
-                        print(f"  {url}", file=sys.stderr)
-                    return sorted(list(all_urls))
-                else:
-                    print(f"Failed to fetch sitemap: {response.status_code}", file=sys.stderr)
-            except Exception as e:
-                print(f"Error processing sitemap {sitemap_url}: {str(e)}", file=sys.stderr)
-            return []
-
-        def get_links(url, max_depth, visited=None):
-            if visited is None:
-                visited = set()
-            
-            current_depth = get_url_depth(url)
-            print(f"Checking URL {url} at depth {current_depth}", file=sys.stderr)
-            
-            if current_depth > max_depth or url in visited:
-                print(f"Skipping {url} - depth {current_depth} > {max_depth} or already visited", file=sys.stderr)
-                return set()
-            
-            visited.add(url)
-            links = set()
-            
-            try:
-                print(f"Fetching {url}", file=sys.stderr)
-                headers = get_auth_headers()
-                response = requests.get(url, headers=headers)
-                print(f"Response status: {response.status_code}", file=sys.stderr)
-                if response.status_code == 200:
-                    soup = BeautifulSoup(response.text, 'html.parser')
-                    print(f"Found {len(soup.find_all('a', href=True))} links on page", file=sys.stderr)
-                    
-                    for a in soup.find_all('a', href=True):
-                        href = a['href']
-                        print(f"Processing link: {href}", file=sys.stderr)
-                        
-                        # Skip external links and anchors
-                        if href.startswith('#') or href.startswith('http'):
-                            print(f"Skipping external/anchor link: {href}", file=sys.stderr)
-                            continue
-                            
-                        # Convert relative URLs to absolute
-                        full_url = urljoin(url, href)
-                        print(f"Converted to full URL: {full_url}", file=sys.stderr)
-                        
-                        # Only include URLs from the same base domain
-                        if urlparse(full_url).netloc == urlparse(url).netloc:
-                            # Extract just the path part
-                            path = urlparse(full_url).path
-                            # Remove leading slash if present
-                            path = path.lstrip('/')
-                            
-                            # Only include .html files
-                            if path.endswith('.html'):
-                                print(f"Found HTML link: {path}", file=sys.stderr)
-                                links.add(path)
-                                # Only recursively get links if we haven't hit max depth
-                                if get_url_depth(path) < max_depth:
-                                    print(f"Recursively checking {path} at depth {get_url_depth(path)}", file=sys.stderr)
-                                    links.update(get_links(full_url, max_depth, visited))
-                                else:
-                                    print(f"Skipping recursive check for {path} - at max depth", file=sys.stderr)
-                        else:
-                            print(f"Skipping external domain link: {href}", file=sys.stderr)
-            except Exception as e:
-                print(f"Error processing {url}: {str(e)}", file=sys.stderr)
-            
-            return links
-
-        # Get command line arguments
-        base_url = sys.argv[1]
-        max_depth = int(sys.argv[2])
-        
-        print(f"Base URL: {base_url}", file=sys.stderr)
-        print(f"Max depth: {max_depth}", file=sys.stderr)
-
-        # Get all URLs
-        all_urls = set()
-        
-        if max_depth == 0:
-            # For depth 0, only check ROOT_PAGES
-            print("Depth is 0, only checking ROOT_PAGES", file=sys.stderr)
-            for root in ROOT_PAGES:
-                all_urls.add(root)
-                print(f"Added root page: {root}", file=sys.stderr)
-        else:
-            # For depth > 0, use sitemap
-            print(f"Depth is {max_depth}, using sitemap", file=sys.stderr)
-            sitemap_url = f"{base_url}/sitemap.xml"
-            sitemap_urls = get_urls_from_sitemap(sitemap_url, max_depth)
-            print(f"Found {len(sitemap_urls)} URLs in sitemap", file=sys.stderr)
-            all_urls.update(sitemap_urls)
-
-        # Print URLs to stdout, ensuring proper URL construction
-        print(f"Total URLs found: {len(all_urls)}", file=sys.stderr)
-        for url in sorted(all_urls):
-            # Remove any leading slashes from the URL to avoid double slashes
-            url = url.lstrip('/')
-            # Construct the full URL by joining base_url and url with a single slash
-            full_url = f"{base_url.rstrip('/')}/{url}"
-            print(full_url)
-            print(f"Added URL: {full_url}", file=sys.stderr)
-        EOF
-
-        # Run the crawler
-        python crawl.py "$BASE_URL" "$DEPTH" > lhci-urls.txt
-        
-        echo "Lighthouse will check the following URLs:"
-        cat lhci-urls.txt
-        echo -e "\nTotal number of URLs: $(wc -l < lhci-urls.txt)"
-        
-        # Verify we have URLs
-        if [ ! -s lhci-urls.txt ]; then
-          echo "Error: No URLs were generated. Check the debug output above."
-          exit 1
-        fi
-
-    - name: Create Lighthouse config
-      if: steps.check_preview.outputs.preview_exists == 'true'
-      run: |
-        cat > .lighthouserc.js << 'EOF'
-        const fs = require('fs');
-        const urls = fs.readFileSync('lhci-urls.txt', 'utf-8').split('\n').filter(Boolean);
-        
-        // Add auth to installation URLs using the same format as the URL check step
-        const urlsWithAuth = urls.map(url => {
-          if (url.includes('/installation/')) {
-            return `https://${process.env.INSTALLATION_USER}:${process.env.INSTALLATION_PW}@${new URL(url).host}${new URL(url).pathname}`;
-          }
-          return url;
-        });
-        
-        module.exports = {
-          ci: {
-            collect: {
-              url: urlsWithAuth,
-              numberOfRuns: 1,
-              settings: {
-                formFactor: 'desktop',
-                screenEmulation: {
-                  mobile: false,
-                  width: 1350,
-                  height: 940,
-                  deviceScaleFactor: 1,
-                  disabled: false,
+
+          echo "skip=false" >> $GITHUB_OUTPUT
+          echo "Lighthouse will check:"
+          cat ../../lhci-urls.txt
+
+          # Probe first URL from list (beyond index.html) when in changed mode
+          if [ "$LIGHTHOUSE_MODE" = "changed" ]; then
+            FIRST=$(head -n1 ../../lhci-urls.txt)
+            status=$(curl -s -o /dev/null -w "%{http_code}" -I -A "Mozilla/5.0" "$FIRST")
+            echo "Probe $FIRST — status: $status"
+            if [ "$status" -ne 200 ]; then
+              echo "Error: Changed page not reachable on preview"
+              exit 1
+            fi
+          fi
+
+      - name: Verify installation page auth
+        if: steps.check_preview.outputs.preview_exists == 'true' && steps.generate_urls.outputs.skip != 'true'
+        env:
+          INSTALLATION_USER: ${{ secrets.INSTALLATION_USER }}
+          INSTALLATION_PW: ${{ secrets.INSTALLATION_PW }}
+          HEAD_REF: ${{ steps.pr.outputs.head_ref }}
+        run: |
+          if ! grep -q '/installation/' lhci-urls.txt 2>/dev/null; then
+            echo "No installation pages in URL list — skipping auth check"
+            exit 0
+          fi
+          # Secrets and the branch name arrive via env (never inlined by ${{ }}) so they cannot inject shell syntax.
+          auth_url="https://${INSTALLATION_USER}:${INSTALLATION_PW}@docs-staging.validmind.ai/pr_previews/${HEAD_REF}/installation/index.html"
+          status=$(curl -s -o /dev/null -w "%{http_code}" -I -A "Mozilla/5.0" --anyauth "$auth_url")
+          echo "Checking installation page — status: $status"
+          [ "$status" -eq 200 ] || { echo "Error: Installation page not accessible with authentication"; exit 1; }
+
+      - name: Post skip comment
+        if: steps.generate_urls.outputs.skip == 'true'
+        uses: actions/github-script@v6
+        with:
+          script: |
+            const prNumber = parseInt(process.env.PR_NUMBER, 10);
+            const body = `## Lighthouse check results\n\n✓ INFO: No site pages to audit in this PR.\n\nCommit SHA: [${process.env.COMMIT_SHA_SHORT}](${context.serverUrl}/${context.repo.owner}/${context.repo.repo}/commit/${process.env.COMMIT_SHA})`;
+            await github.rest.issues.createComment({
+              owner: context.repo.owner,
+              repo: context.repo.repo,
+              issue_number: prNumber,
+              body,
+            });
+
+      - name: Install Lighthouse CI
+        if: steps.generate_urls.outputs.skip != 'true' && steps.check_preview.outputs.preview_exists == 'true'
+        run: npm install -g @lhci/cli
+
+      - name: Create Lighthouse config
+        if: steps.generate_urls.outputs.skip != 'true' && steps.check_preview.outputs.preview_exists == 'true'
+        run: |
+          cat > .lighthouserc.js << 'EOF'
+          const fs = require('fs');
+          const urls = fs.readFileSync('lhci-urls.txt', 'utf-8').split('\n').filter(Boolean);
+
+          const urlsWithAuth = urls.map(url => {
+            if (url.includes('/installation/')) {
+              return `https://${process.env.INSTALLATION_USER}:${process.env.INSTALLATION_PW}@${new URL(url).host}${new URL(url).pathname}`;
+            }
+            return url;
+          });
+
+          module.exports = {
+            ci: {
+              collect: {
+                url: urlsWithAuth,
+                numberOfRuns: 3,
+                settings: {
+                  formFactor: 'desktop',
+                  screenEmulation: {
+                    mobile: false,
+                    width: 1350,
+                    height: 940,
+                    deviceScaleFactor: 1,
+                    disabled: false,
+                  },
+                  throttling: {
+                    rttMs: 40,
+                    throughputKbps: 10240,
+                    cpuSlowdownMultiplier: 1,
+                    requestLatencyMs: 0,
+                    downloadThroughputKbps: 0,
+                    uploadThroughputKbps: 0,
+                  },
                 },
-                throttling: {
-                  rttMs: 40,
-                  throughputKbps: 10240,
-                  cpuSlowdownMultiplier: 1,
-                  requestLatencyMs: 0,
-                  downloadThroughputKbps: 0,
-                  uploadThroughputKbps: 0,
+              },
+              assert: {
+                assertions: {
+                  'categories:accessibility': ['error', { minScore: 0.9 }],
                 },
               },
-            },
-            assert: {
-              assertions: {
-                'categories:accessibility': ['error', { minScore: 0.9 }],
+              upload: {
+                target: 'temporary-public-storage',
               },
             },
-            upload: {
-              target: 'temporary-public-storage',
-            },
-          },
-        };
-        EOF
-
-    - name: Run Lighthouse audit
-      if: steps.check_preview.outputs.preview_exists == 'true'
-      uses: treosh/lighthouse-ci-action@v11
-      id: lighthouse
-      continue-on-error: true
-      env:
-        INSTALLATION_USER: ${{ secrets.INSTALLATION_USER }}
-        INSTALLATION_PW: ${{ secrets.INSTALLATION_PW }}
-      with:
-        configPath: .lighthouserc.js
-        uploadArtifacts: true
-        temporaryPublicStorage: true
-
-    - name: Check Lighthouse audit result
-      if: steps.check_preview.outputs.preview_exists == 'true'
-      run: |
-        # Check if the manifest exists and is valid JSON
-        if [ -z "${{ steps.lighthouse.outputs.manifest }}" ]; then
-          echo "Error: Lighthouse audit failed - no manifest output"
-          exit 1
-        fi
-        
-        # Try to parse the manifest as JSON
-        if ! echo '${{ steps.lighthouse.outputs.manifest }}' | jq . > /dev/null 2>&1; then
-          echo "Error: Lighthouse audit failed - invalid manifest format"
-          exit 1
-        fi
-        
-        # Check if any URLs were successfully audited
-        if ! echo '${{ steps.lighthouse.outputs.manifest }}' | jq 'length > 0' > /dev/null 2>&1; then
-          echo "Error: Lighthouse audit failed - no URLs were successfully audited"
-          exit 1
-        fi
-
-    - name: Post Lighthouse results comment
-      if: steps.check_preview.outputs.preview_exists == 'true'
-      uses: actions/github-script@v6
-      with:
-        script: |
-          const runId = context.runId;
-          const baseUrl = process.env.PREVIEW_URL;
-          const commitSha = process.env.COMMIT_SHA;
-          const commitShaShort = process.env.COMMIT_SHA_SHORT;
-
-          // Get artifacts for this run
-          const { data: artifacts } = await github.rest.actions.listWorkflowRunArtifacts({
-            owner: context.repo.owner,
-            repo: context.repo.repo,
-            run_id: runId,
-          });
+          };
+          EOF
+
+      - name: Run Lighthouse audit
+        if: steps.generate_urls.outputs.skip != 'true' && steps.check_preview.outputs.preview_exists == 'true'
+        uses: treosh/lighthouse-ci-action@v11
+        id: lighthouse
+        env:
+          INSTALLATION_USER: ${{ secrets.INSTALLATION_USER }}
+          INSTALLATION_PW: ${{ secrets.INSTALLATION_PW }}
+        with:
+          configPath: .lighthouserc.js
+          uploadArtifacts: true
+          temporaryPublicStorage: true
+
+      - name: Check Lighthouse audit result
+        if: steps.generate_urls.outputs.skip != 'true' && steps.check_preview.outputs.preview_exists == 'true'
+        run: |
+          if [ -z "${{ steps.lighthouse.outputs.manifest }}" ]; then
+            echo "Error: Lighthouse audit failed - no manifest output"
+            exit 1
+          fi
 
-          // Lighthouse artifact
-          const lighthouseArtifact = artifacts.artifacts.find(a => a.name === 'lighthouse-report');
-          const lighthouseArtifactUrl = lighthouseArtifact
-            ? `https://github.com/${context.repo.owner}/${context.repo.repo}/actions/runs/${runId}/artifacts/${lighthouseArtifact.id}`
-            : null;
-
-          // Lighthouse
-          const manifest = '${{ steps.lighthouse.outputs.manifest }}';
-          let manifestJson;
-          try {
-            manifestJson = JSON.parse(manifest);
-            if (!Array.isArray(manifestJson) || manifestJson.length === 0) {
-              throw new Error('Invalid manifest format or empty results');
+          if ! echo '${{ steps.lighthouse.outputs.manifest }}' | jq . > /dev/null 2>&1; then
+            echo "Error: Lighthouse audit failed - invalid manifest format"
+            exit 1
+          fi
+
+          if ! echo '${{ steps.lighthouse.outputs.manifest }}' | jq 'length > 0' > /dev/null 2>&1; then
+            echo "Error: Lighthouse audit failed - no URLs were successfully audited"
+            exit 1
+          fi
+
+          # Fail if any page scored below 0.9 on accessibility
+          below=$(echo '${{ steps.lighthouse.outputs.manifest }}' | jq '[.[] | select(.summary.accessibility < 0.9)] | length')
+          if [ "$below" -gt 0 ]; then
+            echo "Error: $below page(s) scored below 0.9 on accessibility"
+            echo '${{ steps.lighthouse.outputs.manifest }}' | jq -r '.[] | select(.summary.accessibility < 0.9) | "\(.url): \(.summary.accessibility)"'
+            exit 1
+          fi
+
+      - name: Post Lighthouse results comment  # must also run after a failed audit/check step, otherwise the WARN comment is never posted
+        if: ${{ !cancelled() && steps.generate_urls.outputs.skip != 'true' && steps.check_preview.outputs.preview_exists == 'true' }}
+        uses: actions/github-script@v6
+        env:
+          LIGHTHOUSE_MODE: ${{ env.LIGHTHOUSE_MODE }}
+          LIGHTHOUSE_DEPTH: ${{ env.LIGHTHOUSE_DEPTH }}
+        with:
+          script: |
+            const fs = require('fs');
+            const prNumber = parseInt(process.env.PR_NUMBER, 10);
+            const runId = context.runId;
+            const baseUrl = process.env.PREVIEW_URL;
+            const commitSha = process.env.COMMIT_SHA;
+            const commitShaShort = process.env.COMMIT_SHA_SHORT;
+            const mode = process.env.LIGHTHOUSE_MODE;
+            const depth = process.env.LIGHTHOUSE_DEPTH;
+
+            let metadata = {};
+            try {
+              metadata = JSON.parse(fs.readFileSync('lighthouse-metadata.json', 'utf8'));
+            } catch (e) {
+              console.log('No metadata file:', e.message);
             }
-          } catch (error) {
-            console.error('Error parsing Lighthouse manifest:', error);
-            await github.rest.issues.createComment({
+
+            const manifest = '${{ steps.lighthouse.outputs.manifest }}';
+            let manifestJson;
+            try {
+              manifestJson = JSON.parse(manifest);
+              if (!Array.isArray(manifestJson) || manifestJson.length === 0) {
+                throw new Error('Invalid manifest');
+              }
+            } catch (error) {
+              await github.rest.issues.createComment({
+                owner: context.repo.owner,
+                repo: context.repo.repo,
+                issue_number: prNumber,
+                body: `## Lighthouse check results\n\n⚠️ WARN: Failed to parse Lighthouse results. [Workflow run](https://github.com/${context.repo.owner}/${context.repo.repo}/actions/runs/${runId})`,
+              });
+              return;
+            }
+
+            const { data: comments } = await github.rest.issues.listComments({
               owner: context.repo.owner,
               repo: context.repo.repo,
-              issue_number: context.issue.number,
-              body: `## Lighthouse check results\n\n⚠️ WARN: Failed to parse Lighthouse results. Please check the [workflow run](https://github.com/${context.repo.owner}/${context.repo.repo}/actions/runs/${runId}) for details.`
+              issue_number: prNumber,
             });
-            return;
-          }
-          
-          // Delete old Lighthouse comments
-          const { data: comments } = await github.rest.issues.listComments({
-            owner: context.repo.owner,
-            repo: context.repo.repo,
-            issue_number: context.issue.number,
-          });
-          
-          // Delete any previous comments from this workflow
-          for (const comment of comments) {
-            if (comment.user.login === 'github-actions[bot]' && 
-                comment.body.includes('## Lighthouse check results')) {
-              try {
-                console.log(`Deleting Lighthouse comment ${comment.id}`);
+            for (const comment of comments) {
+              if (comment.user.login === 'github-actions[bot]' &&
+                  comment.body.includes('## Lighthouse check results')) {
                 await github.rest.issues.deleteComment({
                   owner: context.repo.owner,
                   repo: context.repo.repo,
                   comment_id: comment.id,
                 });
-                console.log(`Successfully deleted Lighthouse comment ${comment.id}`);
-              } catch (error) {
-                console.error(`Failed to delete Lighthouse comment ${comment.id}:`, error);
               }
             }
-          }
-          
-          // Calculate average accessibility score
-          const scores = manifestJson.map(run => run.summary.accessibility);
-          const avgScore = scores.reduce((a, b) => a + b, 0) / scores.length;
-          const lighthouseScore = avgScore.toFixed(2);
-          
-          const lighthouseReportUrl = `https://github.com/${context.repo.owner}/${context.repo.repo}/actions/runs/${runId}`;
-          let lighthouseComment = '';
-          if (parseFloat(lighthouseScore) >= 0.9) {
-            lighthouseComment = `✓ INFO: Average accessibility score is **${lighthouseScore}** (required: >0.9) — [View the workflow run](${lighthouseReportUrl})`; 
-          } else {
-            lighthouseComment = `⚠️ WARN: Average accessibility score is **${lighthouseScore}** (required: >0.9) — [Check the workflow run](${lighthouseReportUrl})`;
-          }
 
-          const stripAuth = url => {
-            try {
-              const u = new URL(url);
-              u.username = '';
-              u.password = '';
-              return u.toString();
-            } catch {
-              return url;
-            }
-          };
+            const scores = manifestJson.map(run => run.summary.accessibility);
+            const avgScore = (scores.reduce((a, b) => a + b, 0) / scores.length).toFixed(2);
+            const lighthouseReportUrl = `https://github.com/${context.repo.owner}/${context.repo.repo}/actions/runs/${runId}`;
+            const lighthouseComment = parseFloat(avgScore) >= 0.9
+              ? `✓ INFO: Average accessibility score is **${avgScore}** (required: ≥0.9) — [View the workflow run](${lighthouseReportUrl})`
+              : `⚠️ WARN: Average accessibility score is **${avgScore}** (required: ≥0.9) — [Check the workflow run](${lighthouseReportUrl})`;
 
-          // Helper to get the public report URL from htmlPath
-          const getReportUrl = (run) => {
-            if (run.report && Array.isArray(run.report)) {
-              // Find the public .report.html URL
-              const htmlReport = run.report.find(r => r.endsWith('.report.html') && r.startsWith('http'));
-              if (htmlReport) return htmlReport;
-              // Fallback: first report if available
-              if (run.report.length > 0) return run.report[0];
-            }
-            // Fallback: just show the workflow run if nothing else
-            return lighthouseReportUrl;
-          };
+            const stripAuth = url => {
+              try {
+                const u = new URL(url);
+                u.username = '';
+                u.password = '';
+                return u.toString();
+              } catch {
+                return url;
+              }
+            };
 
-          // Parse the links output from the Lighthouse step
-          const links = (() => {
-            try {
-              return JSON.parse(`${{ steps.lighthouse.outputs.links }}`);
-            } catch {
-              return {};
+            const links = (() => {
+              try {
+                return JSON.parse(`${{ steps.lighthouse.outputs.links }}`);
+              } catch {
+                return {};
+              }
+            })();
+
+            const scoresTable = manifestJson
+              .map(run => {
+                const formatScore = score => score === null ? 'N/A' : score.toFixed(2);
+                const displayPath = stripAuth(run.url).replace(baseUrl, '') || run.url;
+                const reportUrl = links[run.url] || lighthouseReportUrl;
+                return `| [${displayPath}](${reportUrl}) | ${formatScore(run.summary.accessibility)} | ${formatScore(run.summary.performance)} | ${formatScore(run.summary['best-practices'])} | ${formatScore(run.summary.seo)} |`;
+              })
+              .join('\n');
+
+            const modeLine = mode === 'changed'
+              ? `Audit mode: **changed pages** (${metadata.paths?.length || manifestJson.length} URL(s))`
+              : `Audit mode: **depth ${depth}** (sitemap)`;
+
+            let comment = `## Lighthouse check results\n\n`;
+            comment += `${lighthouseComment}\n\n`;
+            comment += `${modeLine}\n\n`;
+            comment += `<details>\n<summary>Show Lighthouse scores</summary>\n\n`;
+            comment += `Commit SHA: [${commitShaShort}](${context.serverUrl}/${context.repo.owner}/${context.repo.repo}/commit/${commitSha})\n\n`;
+            if (metadata.global_fallback) {
+              comment += `_Global site files changed — audited root navigation pages._\n\n`;
             }
-          })();
-
-          const scoresTable = manifestJson
-            .map(run => {
-              const formatScore = (score) => score === null ? 'N/A' : score.toFixed(2);
-              const displayPath = stripAuth(run.url).replace(baseUrl, '');
-              // Use the public report URL from the links output, fallback to workflow run if missing
-              const reportUrl = links[run.url] || lighthouseReportUrl;
-              return `| [${displayPath}](${reportUrl}) | ${formatScore(run.summary.accessibility)} | ${formatScore(run.summary.performance)} | ${formatScore(run.summary['best-practices'])} | ${formatScore(run.summary.seo)} |`;
-            })
-            .join('\n');
-
-          let comment = `## Lighthouse check results\n\n`;
-          comment += `${lighthouseComment}\n\n`;
-          comment += `<details>\n<summary>Show Lighthouse scores</summary>\n\n`;
-          comment += `Folder depth level checked: **${process.env.DEPTH}**\n\n`;
-          comment += `Commit SHA: [${commitShaShort}](${context.serverUrl}/${context.repo.owner}/${context.repo.repo}/commit/${commitSha})\n\n`;
-          comment += `Modify the workflow to check a different depth:\n`;
-          comment += `- 0: Top-level navigation only — /index.html, /guide/guides.html, ...\n`;
-          comment += `- 1: All first-level subdirectories — /guide/\*.html, /developer/\*.html, ...\n`;
-          comment += `- 2: All second-level subdirectories — /guide/attestation/\*.html, ...\n\n`;
-          comment += `| Page | Accessibility | Performance | Best Practices | SEO |\n`;
-          comment += `|------|---------------|-------------|----------------|-----|\n`;
-          comment += `${scoresTable}\n\n`;
-          comment += `</details>\n\n`;
-
-          await github.rest.issues.createComment({
-            owner: context.repo.owner,
-            repo: context.repo.repo,
-            issue_number: context.issue.number,
-            body: comment
-          }); 
+            comment += `For a thorough audit, run the **Lighthouse check** workflow manually (Actions → Lighthouse check → Run workflow) with depth 0–2, or add the \`lighthouse:full\` label for depth 2 on the next validate run.\n\n`;
+            comment += `| Page | Accessibility | Performance | Best Practices | SEO |\n`;
+            comment += `|------|---------------|-------------|----------------|-----|\n`;
+            comment += `${scoresTable}\n\n`;
+            comment += `</details>\n\n`;
+
+            await github.rest.issues.createComment({
+              owner: context.repo.owner,
+              repo: context.repo.repo,
+              issue_number: prNumber,
+              body: comment,
+            });
diff --git a/.github/workflows/publish-llm-markdown.yaml b/.github/workflows/publish-llm-markdown.yaml
index e5500fe568..3bb4b307bc 100644
--- a/.github/workflows/publish-llm-markdown.yaml
+++ b/.github/workflows/publish-llm-markdown.yaml
@@ -39,10 +39,8 @@ jobs:
         with:
           version: ${{ vars.QUARTO_VERSION }}
 
-      - name: Install Poetry
-        run: |
-          curl -sSL https://install.python-poetry.org | python3 -
-          echo "$HOME/.local/bin" >> $GITHUB_PATH
+      - name: Set up uv
+        uses: astral-sh/setup-uv@v5
 
       - name: Generate Python library docs
         run: |
diff --git a/.github/workflows/validate-docs-site.yaml b/.github/workflows/validate-docs-site.yaml
index 309a7b302f..f9a7fc80f6 100644
--- a/.github/workflows/validate-docs-site.yaml
+++ b/.github/workflows/validate-docs-site.yaml
@@ -5,6 +5,7 @@ on:
     types: [opened, synchronize, ready_for_review]
 
 permissions:
+  actions: write
   issues: write
   pull-requests: write
 
@@ -65,6 +66,9 @@ jobs:
           src/backend/templates/documentation/model_documentation
         sparse-checkout-cone-mode: true
 
+    - name: Set up uv
+      uses: astral-sh/setup-uv@v5
+
     - name: Verify copyright headers
       run: |
         cd site
@@ -75,11 +79,6 @@ jobs:
       with:
         version: pre-release
 
-    - name: Install Poetry
-      run: |
-        curl -sSL https://install.python-poetry.org | python3 -
-        echo "$HOME/.local/bin" >> $GITHUB_PATH
-
     - name: Generate Python library docs
       run: |
         cd site/_source/validmind-library
@@ -91,8 +90,7 @@ jobs:
 
     - name: Generate template schema docs
       run: |
-        pip install json-schema-for-humans
-        BACKEND_ROOT=site/_source/backend python scripts/generate_template_schema_docs.py
+        BACKEND_ROOT=site/_source/backend uv run --with json-schema-for-humans python scripts/generate_template_schema_docs.py
 
     - name: Populate installation
       run: cp -r site/_source/installation/site/installation site/installation
@@ -164,15 +162,48 @@ jobs:
             body: comment
           });
 
+    - name: Trigger Lighthouse check
+      uses: actions/github-script@v6
+      with:
+        script: |
+          await github.rest.actions.createWorkflowDispatch({
+            owner: context.repo.owner,
+            repo: context.repo.repo,
+            workflow_id: 'lighthouse-check.yaml',
+            ref: context.payload.pull_request.head.ref,
+            inputs: {
+              mode: 'changed',
+              depth: '0',
+              pr_number: String(context.issue.number),
+            },
+          });
+          console.log(`Dispatched Lighthouse check for PR #${context.issue.number}`);
+
     - name: Install pandoc
       run: |
         sudo apt-get update
         sudo apt-get install -y pandoc
 
+    - name: Verify chatbot product map is up to date
+      run: |
+        python3 site/scripts/generate_chatbot_product_map.py
+        git diff --exit-code site/llm/chatbot-product-map.md site/llm/chatbot-product-map-frontend-snapshot.json
+
+    - name: Test chatbot product map generator
+      run: python3 -m unittest discover -s site/scripts -p 'test_generate_chatbot_product_map.py' -v
+
     - name: Validate LLM markdown render
       run: bash llm/render.sh && bash llm/clean.sh
       working-directory: site
 
+    - name: Verify LLM corpus includes product map and docs IA hub
+      run: |
+        test -f site/llm/_llm-output/chatbot-product-map.md
+        test -f site/llm/_llm-output/AGENTS.md
+        test -f site/llm/_llm-output/about/using-the-documentation.md
+        test ! -f site/llm/_llm-output/about/contributing/validmind-community.md
+        test ! -d site/llm/_llm-output/about/contributing/style-guide
+
     # Release headroom and shrink before final lightweight steps & post-job
     - name: Release reserve & shrink
       if: always()
diff --git a/AGENTS.md b/AGENTS.md
index b1c662e0e7..52f3c75e8c 100644
--- a/AGENTS.md
+++ b/AGENTS.md
@@ -6,7 +6,7 @@ This repository contains the source files for [ValidMind's documentation site](h
 
 For an overview of the documentation structure and how to navigate it, see:
 
-**[Using the documentation](https://docs.validmind.ai/about/contributing/using-the-documentation.html)**
+**[Using the documentation](https://docs.validmind.ai/about/using-the-documentation.html)**
 
 This page explains:
 - How the documentation is organized
@@ -32,6 +32,16 @@ If you are an AI agent embedded in ValidMind, your capabilities are documented h
 
 This page describes what the assistant can and cannot do, including context-aware features and current limitations.
 
+## Product UI mapping
+
+The in-app assistant (Valerie) also ingests **`chatbot-product-map.md`** in the LLM corpus. That file maps **platform routes** (for example `/settings/workflows`, `/model-inventory`, `/dashboard`) to documentation URLs and section hints.
+
+Route and help-link data from the product UI is vendored as **`site/llm/chatbot-product-map-frontend-snapshot.json`**. Regenerate it with `make -C site refresh-chatbot-product-map` when frontend routes or `helpLink` values change (requires a local `validmind/frontend` checkout).
+
+Use the map when the user’s question is tied to where they are in the product — especially **Settings**, where the UI groups features differently than the documentation sidebars (Configuration, Workflows, Inventory, and so on).
+
+For documentation organized by topic, continue to use **Using the documentation** (above) and the section table in this file.
+
 ## File format
 
 Documentation is written in Quarto Markdown (`.qmd`). Key conventions:
diff --git a/README.md b/README.md
index 8de8105fa5..d35a5c978f 100644
--- a/README.md
+++ b/README.md
@@ -174,6 +174,19 @@ The script reads from:
 
 Output: Content is injected directly into `site/guide/templates/customize-document-templates.qmd` between marker comments.
 
+#### Chatbot product map and LLM corpus
+
+The in-app assistant (Valerie) uses generated files under `site/llm/`, including `chatbot-product-map.md` (platform routes mapped to docs URLs and section headings). CI regenerates that map and fails if it is out of date with your changes.
+
+If you edit `.qmd` files that affect linked docs or headings (for example FAQ or guide pages referenced from the product UI), regenerate and commit the map before opening or updating a pull request:
+
+```bash
+cd site
+make generate-chatbot-product-map
+```
+
+If product routes or in-app help links changed, use `make refresh-chatbot-product-map` instead (requires a local `validmind/frontend` checkout). See [`site/llm/README.md`](site/llm/README.md) for the full LLM render pipeline, snapshot maintenance, and when to refresh each artifact.
+
 #### Stylesheet organization (IN PROGRESS)
 
 The site uses a modular stylesheet architecture to maintain organized and maintainable styles:
@@ -212,7 +225,7 @@ When constructing links, refer to the `.qmd` file as Quarto will properly render
 
 | Correct | Incorrect |
 |---|---|
-| `[Quickstart — Model Development](get-started/developer/quickstart-developer.qmd)` | `[Quickstart — Model Development](get-started/developer/quickstart-developer.html)` |
+| `[Quickstart — Development](get-started/developer/quickstart-developer.qmd)` | `[Quickstart — Development](get-started/developer/quickstart-developer.html)` |
 
 When constructing filepaths, including while using [Quarto's Includes](https://quarto.org/docs/authoring/includes.html) (single-sourcing feature), you'll also want start with the root directory whenever possible as this minimizes usage of unclear relative paths: 
 
@@ -379,24 +392,22 @@ Similarly, http://localhost:4444/ in your browsers should show an all green logo
 
 ## Configuring Lighthouse checks
 
-Lighthouse is an open-source tool that audits web pages for accessibility, performance, best practices, and SEO. We automatically run Lighthouse against PR preview sites to enable a better, accessible documentation for everyone.
+Lighthouse is an open-source tool that audits web pages for accessibility, performance, best practices, and SEO. We automatically run Lighthouse against PR preview sites when **Validate docs site** finishes deploying a preview (it dispatches the Lighthouse workflow on the PR branch).
 
-By default, Lighthouse checks only the top-level pages in our site navigation, such as `/index.html`, `/guide/guides.html`, `/developer/validmind-library.html`, and so forth. You can configure this behavior in the workflow:
+**Default (every PR):** Lighthouse audits only HTML pages that correspond to files changed under `site/` in the pull request. If you change shared layout files (`_quarto.yml`, `theme.scss`, `_variables.yml`, `_extensions/`, and similar), it falls back to the root navigation pages (`index.html`, `guide/guides.html`, and so on).
 
-```sh
-env:
-  # To change the default depth level:
-  # 0 — Top-level navigation only (e.g. /index.html, /guide/guides.html, /developer/validmind-library.html, etc.)
-  # 1 — All first-level subdirectories (e.g. /guide/*.html)
-  # 2 — All second-level subdirectories (e.g. /guide/attestation/*.html)
-  # Note: While the crawler technically supports deeper levels, expect the workflow to take >2-12 hours to complete
-  DEFAULT_DEPTH: '0'
-```
+**Thorough audit:**
+
+- Add the `lighthouse:full` label to a PR to run a depth-2 sitemap audit on the next successful validate run.
+- Or run the **Lighthouse check** workflow manually from Actions → **Run workflow**, set the PR number, and choose depth `0` (root pages), `1` (first-level sections), or `2` (second-level). Depths above zero can take hours; use them on feature branches only.
+
+The PR comment lists audited URLs, the commit SHA, and accessibility scores (required: ≥ 0.9 per page).
 
 **Tips:**
 
-- On the first run, the workflow waits for a preview site to become available. For subsequent runs, it checks the currently available site, which may be behind HEAD. The PR comment shows which commit SHA was checked — rerun the check if needed.
-- Use folder depths greater than zero only on working branches when you need a thorough site audit. Deeper checks take 2-12 hours to complete and significantly slow down the CI/CD pipeline. Do not merge depth changes to `main`.
+- Lighthouse starts only after validate succeeds, so it no longer polls for up to 45 minutes.
+- If a PR changes only CI or repo metadata (no `site/` pages), Lighthouse skips with an informational comment.
+- Re-run validate (or push a commit) if the commit SHA in the preview comment does not match the commit you expect to be audited.
 
 ## Monitoring
 
diff --git a/site/Makefile b/site/Makefile
index d3372f286c..22f6027d50 100644
--- a/site/Makefile
+++ b/site/Makefile
@@ -9,12 +9,11 @@ SRC_ROOT := _source
 SRC_DIR := $(SRC_ROOT)/validmind-library
 DEST_DIR_NB := notebooks
 DEST_DIR_PYTHON := validmind
-DEST_DIR_TESTS := tests
 SRC_ROOT := _source
 SRC_DIR := $(SRC_ROOT)/validmind-library
 
 # Define .PHONY target for help section
-.PHONY: help add-copyright clean clone copy-installation copy-release-notes delete-demo-branch deploy-demo-branch deploy-prod deploy-staging docker-build docker-serve docker-site docker-site-lite docs-site execute generate-sitemap get-api-json get-source kind-serve kind-stop kind-restart kind-logs notebooks python-docs release-notes render-llm template-schema-docs test-descriptions verify-copyright yearly-releases
+.PHONY: help add-copyright clean clone copy-installation copy-release-notes delete-demo-branch deploy-demo-branch deploy-prod deploy-staging docker-build docker-serve docker-site docker-site-lite docs-site execute generate-chatbot-product-map refresh-chatbot-product-map generate-sitemap get-api-json get-source kind-serve kind-stop kind-restart kind-logs notebooks python-docs release-notes render-llm template-schema-docs verify-copyright yearly-releases
 
 # Help section
 help:
@@ -39,10 +38,12 @@ help:
 	@echo "  docker-site              Get source, render site with Docker profile, execute notebooks"
 	@echo "  docker-site-lite         Get source and render site with Docker profile (skips notebook execution)"
 	@echo "  docs-site                Get all source files and render the production docs site with Quarto"
+	@echo "  generate-chatbot-product-map  Generate product-to-docs map (from committed frontend snapshot)"
+	@echo "  refresh-chatbot-product-map   Re-extract frontend snapshot + map (requires ../frontend)"
 	@echo "  generate-sitemap         Generate a sitemap for the static HTML site"
 	@echo "  execute                  Execute a Jupyter Notebook or notebook directory"
 	@echo "  get-api-json             Download Swagger JSON specs from ValidMind APIs into reference/"
-	@echo "  get-source               Get all source files (clean, clone, copy-installation, copy-release-notes, notebooks, python-docs, test-descriptions, get-api-json)"
+	@echo "  get-source               Get all source files (clean, clone, copy-installation, copy-release-notes, notebooks, python-docs, get-api-json)"
 	@echo "  kind-serve               Set up Kind cluster for ValidMind docs"
 	@echo "  kind-stop                Stop Kind cluster for ValidMind docs"
 	@echo "  kind-restart             Restart Kind cluster for ValidMind docs"
@@ -53,7 +54,6 @@ help:
 	@echo "                           Examples: TAG=cmvm/25.07 or TAG=validmind-library/v2.8.22"
 	@echo "  template-schema-docs     Generate template schema documentation from backend"
 	@echo "  render-llm               Render site to GFM markdown for LLM ingestion (mirrors CI)"
-	@echo "  test-descriptions        Copy the ValidMind tests docs into tests/"
 	@echo "  verify-copyright         Verify that all .qmd and .yml/.yaml files have copyright headers"
 	@echo "  yearly-releases          Collate releases by year into a listing landing and update releases sidebar"
 
@@ -177,12 +177,12 @@ execute:
 	elif [ "$$PROFILE_CHOICE" = "3" ]; then PROFILE="exe-prod"; \
 	else echo "Invalid choice"; exit 1; fi; \
 	echo "Select FILE_PATH:"; \
-	echo "1) notebooks/EXECUTED/model_development"; \
-	echo "2) notebooks/EXECUTED/model_validation"; \
+	echo "1) notebooks/EXECUTED/development"; \
+	echo "2) notebooks/EXECUTED/validation"; \
 	echo "3) Enter custom filepath"; \
 	read -p "Enter choice [1-3]: " FILE_CHOICE; \
-	if [ "$$FILE_CHOICE" = "1" ]; then FILE_PATH="notebooks/EXECUTED/model_development"; \
-	elif [ "$$FILE_CHOICE" = "2" ]; then FILE_PATH="notebooks/EXECUTED/model_validation"; \
+	if [ "$$FILE_CHOICE" = "1" ]; then FILE_PATH="notebooks/EXECUTED/development"; \
+	elif [ "$$FILE_CHOICE" = "2" ]; then FILE_PATH="notebooks/EXECUTED/validation"; \
 	elif [ "$$FILE_CHOICE" = "3" ]; then read -p "Enter custom FILE_PATH: " CUSTOM_FILE_PATH; FILE_PATH="$$CUSTOM_FILE_PATH"; \
 	else echo "Invalid choice"; exit 1; fi; \
 	read -p "Enter VM_API_HOST (default: https://api.prod.validmind.ai/api/v1/tracking): " INPUT_VM_API_HOST; \
@@ -284,7 +284,7 @@ get-api-json:
 	@curl -s -o reference/rapidoc-min.js "https://unpkg.com/rapidoc/dist/rapidoc-min.js" || echo "Failed to fetch RapiDoc library"
 
 # Get all source files
-get-source: clean clone copy-installation copy-release-notes notebooks python-docs test-descriptions template-schema-docs
+get-source: clean clone copy-installation copy-release-notes notebooks python-docs template-schema-docs
 
 # Requires that you've run `make docker-build`
 kind-serve:
@@ -324,12 +324,12 @@ notebooks:
 	@rm -f notebooks.zip
 	@rm -rf $(DEST_DIR_NB)/ && mkdir -p $(DEST_DIR_NB)
 	@cp -r $(SRC_DIR)/notebooks/. $(DEST_DIR_NB)/
-	@echo "Duplicating all files from notebooks/tutorials/model_development/ for execution"
-	@mkdir -p notebooks/EXECUTED/model_development/
-	@cp -r notebooks/tutorials/model_development/* notebooks/EXECUTED/model_development/
-	@echo "Duplicating all files from notebooks/tutorials/model_validation/ for execution"
-	@mkdir -p notebooks/EXECUTED/model_validation/
-	@cp -r notebooks/tutorials/model_validation/* notebooks/EXECUTED/model_validation/
+	@echo "Duplicating all files from notebooks/tutorials/development/ for execution"
+	@mkdir -p notebooks/EXECUTED/development/
+	@cp -r notebooks/tutorials/development/* notebooks/EXECUTED/development/
+	@echo "Duplicating all files from notebooks/tutorials/validation/ for execution"
+	@mkdir -p notebooks/EXECUTED/validation/
+	@cp -r notebooks/tutorials/validation/* notebooks/EXECUTED/validation/
 	@echo "Copying LICENSE into notebooks ..."
 	@cp -r $(SRC_DIR)/LICENSE $(DEST_DIR_NB)/
 	@rm -rf $(DEST_DIR_NB)/code_sharing
@@ -430,16 +430,6 @@ template-schema-docs:
 	@python -m pip install -q json-schema-for-humans
 	@BACKEND_ROOT=$(SRC_ROOT)/backend python ../scripts/generate_template_schema_docs.py
 
-test-descriptions:
-	@echo "\nUpdating test descriptions source ..."
-	@cd _source/validmind-library && make install && poetry run python scripts/extract_descriptions.py validmind/tests
-	@cd ../../
-	@rm -rf $(DEST_DIR_TESTS)
-	@mkdir -p $(DEST_DIR_TESTS)
-	@cp -r $(SRC_DIR)/build/_test_descriptions/validmind/tests/. $(DEST_DIR_TESTS)
-	@echo "Copying _metadata.yml into tests/ ..."
-	@cp developer/_metadata.yml $(DEST_DIR_TESTS)/_metadata.yml
-
 verify-copyright:
 	@echo "\nVerifying copyright headers in .qmd and .yml/.yaml files ..."
 	@cd .. && python site/scripts/verify_copyright_qmd.py
@@ -451,6 +441,14 @@ yearly-releases:
 	git status | grep -v 'release-scripts/'
 	quarto preview
 
+# Generate product-to-documentation map for chatbot RAG (uses committed frontend snapshot)
+generate-chatbot-product-map:
+	@python3 scripts/generate_chatbot_product_map.py
+
+# Refresh vendored frontend snapshot from a local validmind/frontend checkout
+refresh-chatbot-product-map:
+	@python3 scripts/generate_chatbot_product_map.py --from-frontend
+
 # Render site to GFM markdown for LLM ingestion
 render-llm:
 	@echo "\nRendering site to GFM markdown for LLM ingestion ..."
diff --git a/site/_quarto.yml b/site/_quarto.yml
index 28da8c4f4e..977562cd82 100644
--- a/site/_quarto.yml
+++ b/site/_quarto.yml
@@ -95,7 +95,7 @@ website:
         - text: "Model risk management"
           file: about/use-cases/model-risk-management.qmd
           contents:
-          - about/use-cases/sr-11-7.qmd
+          - about/use-cases/sr-26-2.qmd
           - about/use-cases/ss1-23.qmd
           - about/use-cases/e-23.qmd
         - text: "---"
@@ -103,7 +103,7 @@ website:
         - text: "Library and platform"
           file: about/library-and-platform.qmd
           contents:
-          - about/overview-model-documentation.qmd
+          - about/overview-documentation.qmd
           - about/overview-llm-features.qmd
           - text: "Deployment options"
             file: about/deployment/deployment-options.qmd
@@ -125,7 +125,7 @@ website:
         - text: "Software license agreement"
           file: about/fine-print/license-agreement.qmd
         - text: "---"
-        - about/contributing/using-the-documentation.qmd
+        - about/using-the-documentation.qmd
 
     - title: "Support"
       contents:
diff --git a/site/about/contributing/style-guide/conventions.qmd b/site/about/contributing/style-guide/conventions.qmd
index 351ed06336..17fc6e2c78 100644
--- a/site/about/contributing/style-guide/conventions.qmd
+++ b/site/about/contributing/style-guide/conventions.qmd
@@ -125,7 +125,7 @@ Column 2, 50% wide
 
 Sometimes, it's helpful to highlight a call to action with a button that takes you to a topic or to a notebook on JupyterHub. 
 
-Change any Markdown link into a our theme-styled button by appending `{.button}`:
+Change any Markdown link into one of our theme-styled buttons by appending `{.button}`:
 
 :::: {.flex .flex-wrap .justify-around}
 
@@ -167,8 +167,8 @@ Using a markdown button also enables you to link to to the `.qmd` path instead o
     ```markdown
     <!-- IN THE BODY OF YOUR CONTENT -->
     - The record is registered in the inventory.[^1]
-    - You've already customized your model lifecycle statuses for use in workflows.[^2]
-    - Workflows have already been set up for use with your models.[^3]
+    - You've already customized your record stages for use in workflows.[^2]
+    - Workflows have already been set up for use with your records.[^3]
     - You are assigned a role that has access to complete actions set up by workflows.[^5]
 
     <!-- AT THE END OF YOUR .QMD PAGE -->
@@ -344,7 +344,7 @@ Use backticks to enclose keyboard commands, parameters, field values, and file n
 
 | Correct | Incorrect | 
 |------|-----|
-|   Learn how to store model identifier credentials in a `.env` file instead of using inline credentials.  |  Learn how to store model identifier credentials in a ".env" file instead of using inline credentials.  |
+|   Learn how to store record identifier credentials in a `.env` file instead of using inline credentials.  |  Learn how to store record identifier credentials in a ".env" file instead of using inline credentials.  |
 |   For example, the `classifier_full_suite` test suite runs tests from the `tabular_dataset` and `classifier` test suites to fully document the data and model sections for binary classification model use cases. |  For example, the "classifier_full_suite" test suite runs tests from the "tabular_dataset" and "classifier" test suites to fully document the data and model sections for binary classification model use cases.  |
 | Under When these conditions are met, you are able to set both `AND` and `OR` conditions. | Under When these conditions are met, you are able to set both "AND" and "OR" conditions.|
 : **Backtick** examples {.hover}
@@ -359,7 +359,7 @@ Use backticks to enclose keyboard commands, parameters, field values, and file n
 : **Mathematical formula** examples {.hover}
 
 ## Proper nouns
-In the context of model risk management, proper nouns include specific models, laws, or regulations, such as "Basel IV" or "SR 11-7." These refer to specific frameworks or guidelines and you spell them with initial capital letters or exactly as indicated by official sources.
+In the context of model risk management, proper nouns include specific models, laws, or regulations, such as "Basel IV" or "SR 26-2." These refer to specific frameworks or guidelines and you spell them with initial capital letters or exactly as indicated by official sources.
 
 - Terms that are not proper nouns include general concepts such as "model validation," "stress testing," "risk assessment," and "backtesting." 
 - These are common terms in the field and are not capitalized unless starting a sentence.
@@ -380,7 +380,7 @@ Within our documentation (`https://docs.validmind.ai/`), you are able to referen
 
 | Product Name | Variable Key | Description |
 |---:|---|---|
-| {{< var validmind.product >}} | `{{{< var validmind.product >}}}` | Comphrensive suite of tools with a {{< var vm.developer >}} for documenting and testing models, alongside a {{< var vm.platform >}} hosting cloud-based tools, APIs, databases, and validation engines. |
+| {{< var validmind.product >}} | `{{{< var validmind.product >}}}` | Comprehensive suite of tools with a {{< var vm.developer >}} for documenting and testing records (such as models), alongside a {{< var vm.platform >}} hosting cloud-based tools, APIs, databases, and validation engines. |
 | {{< var validmind.developer >}} |  `{{{< var validmind.developer >}}}` | Open-source library that connects to the  {{< var validmind.platform >}}. |
 | {{< var validmind.platform >}} |  `{{{< var validmind.platform >}}}` | Hosted multi-tenant architecture that includes a cloud-based web interface. |
 | {{< var validmind.api >}} | `{{{< var validmind.api >}}}` | Used to make calls to the {{< var validmind.developer >}}.[^21] |
@@ -438,7 +438,7 @@ From  **{{< fa gear >}} Settings** in the {{< var validmind.platform >}}, <br>yo
 - Set up your organization
 - Onboard new users
 - Manage roles, groups and <br>permissions
-- Configure the model inventory
+- Configure the inventory
 - Manage templates and workflows
 - And much more!
 
diff --git a/site/about/contributing/style-guide/voice-and-tone.qmd b/site/about/contributing/style-guide/voice-and-tone.qmd
index 60b20dcbd4..f43495e50b 100644
--- a/site/about/contributing/style-guide/voice-and-tone.qmd
+++ b/site/about/contributing/style-guide/voice-and-tone.qmd
@@ -47,7 +47,7 @@ Behind every page, there’s a person. In every word, lies an opportunity to win
 | Correct | Incorrect | 
 |------|-----|
 |   **User acknowledgement:** Documenting artifacts can be difficult and tedious for even the most seasoned of validators.  |  **User dismissal:** For experienced validators, documenting artifacts is a breeze.  |
-| **Success toast:** Nice work — you’ve successfully registered your first model! | **Inappropriate humor:** We lost your model documentation, oops! Here, have a pony! (e.g. error message for serious issue) |
+| **Success toast:** Nice work — you’ve successfully registered your first record! | **Inappropriate humor:** We lost your documentation, oops! Here, have a pony! (e.g. error message for serious issue) |
 : **Empathy & humor** examples {.hover}
 
 ### Be positive
@@ -82,7 +82,7 @@ Address the reader directly by using the second person.
 
 | Correct | Incorrect | 
 |------|-----|
-|   After completing this quickstart, you will be able to view your test results as part of your model documentation right in the {{< var validmind.platform >}}.  |  After completing this quickstart, the model developer will be able to view the test results as part of the model documentation right in the {{< var validmind.platform >}}.   |
+|   After completing this quickstart, you will be able to view your test results as part of your documentation right in the {{< var validmind.platform >}}.  |  After completing this quickstart, the developer will be able to view the test results as part of the documentation right in the {{< var validmind.platform >}}.   |
 : **2nd person** examples {.hover}
 
 ### Avoid stiff formality
@@ -92,7 +92,7 @@ Address the reader directly by using the second person.
 
 | Correct | Incorrect | 
 |------|-----|
-|   Once you’ve registered the model, you can then grab the unique code snippet that will have been generated for you to use in the next step.  |  First, you must register the model as this will generate a unique code snippet that needs to be copied. Then, you need to retrieve the code snippet so that you can make use of it in the following step.  |
+|   Once you’ve registered the record, you can then grab the unique code snippet that will have been generated for you to use in the next step.  |  First, you must register the record as this will generate a unique code snippet that needs to be copied. Then, you need to retrieve the code snippet so that you can make use of it in the following step.  |
 : **Informal language** examples {.hover}
 
 ### Focus on teamwork
diff --git a/site/about/contributing/validmind-community.qmd b/site/about/contributing/validmind-community.qmd
index bc0996e66b..8dc36167ef 100644
--- a/site/about/contributing/validmind-community.qmd
+++ b/site/about/contributing/validmind-community.qmd
@@ -11,7 +11,7 @@ aliases:
   - /about/join-community.html
 ---
 
-Work with financial models, in model risk management (MRM), or are simply enthusiastic about artificial intelligence (AI) and machine learning and how these tools are actively shaping our futures within the finance industry and beyond? Congratulations — you're already part of the {{< var vm.product >}} community! Come learn and play with us.
+Work with financial models, in model risk management (MRM), in AI governance, or are simply enthusiastic about artificial intelligence (AI) and machine learning and how these tools are actively shaping our futures within the finance industry and beyond? Congratulations — you're already part of the {{< var vm.product >}} community! Come learn and play with us.
 
 ::: {.callout}
 
diff --git a/site/about/deployment/deployment-options.qmd b/site/about/deployment/deployment-options.qmd
index 9dab1db881..acb49defa8 100644
--- a/site/about/deployment/deployment-options.qmd
+++ b/site/about/deployment/deployment-options.qmd
@@ -26,23 +26,23 @@ Choose the {{< var vm.product >}} deployment option that best suits your organiz
 
 ![{{< var vm.product >}} architecture overview](validmind-architecture-overview.png){fig-alt="An image showing the ValidMind architecture"}
 
-In your own environment, model developers can continue to run models using your existing tools for data science and model development, such as Python, Jupyter Notebooks, and R, accessing data from sources such as Google Cloud Storage, Amazon S3, and Snowflake.
+In your own environment, developers can continue to run records (such as models) using your existing tools for data science and development, such as Python, Jupyter Notebooks, and R, accessing data from sources such as Google Cloud Storage, Amazon S3, and Snowflake.
 
-These models are then integrated with the {{< var validmind.developer >}}, which communicates with the {{< var validmind.platform >}} via our {{< var validmind.api >}}.
+These records are then integrated with the {{< var validmind.developer >}}, which communicates with the {{< var validmind.platform >}} via our {{< var validmind.api >}}.
 
 The {{< var validmind.platform >}} provides:
 
-- **Model inventory** — Centralized tracking and organization of models, accessible by developers, validators, and executives.
+- **Inventory** — Centralized tracking and organization of records, accessible by developers, validators, and executives.
 
 - **Documentation & validation engine** — Automated testing and documentation, with validation processes, ensuring compliance with regulations and internal policies.
 
 - **Template management** — Allows for easy creation, customization, and reuse of document templates.
 
-- **{{< var vm.product >}} dashboard** — A user-friendly interface providing insights, status updates, and governance reporting for model risk.
+- **{{< var vm.product >}} dashboard** — A user-friendly interface providing insights, status updates, and governance reporting for risk.
 
 ## Security & data privacy
 
-We ensure data security through strong data isolation, encryption, and role-based access controls.[^1] Personal identifiable information and customer data are not stored in model documentation. For more information, see our data privacy policy.[^2]
+We ensure data security through strong data isolation, encryption, and role-based access controls.[^1] Personally identifiable information and customer data are not stored in documentation. For more information, see our data privacy policy.[^2]
 
 ## Secure access
 
diff --git a/site/about/deployment/system-access-requirements.qmd b/site/about/deployment/system-access-requirements.qmd
index 9e0275968d..37586d99bf 100644
--- a/site/about/deployment/system-access-requirements.qmd
+++ b/site/about/deployment/system-access-requirements.qmd
@@ -10,7 +10,7 @@ Allow list the following domains in your organization’s firewall to ensure you
 
 ## ValidMind Library Python API access
 
-To use our documentation automation tools and test suites for model developers and validators:
+To use our documentation automation tools and test suites for developers and validators:
 
 ```html
 *.validmind.ai
diff --git a/site/about/fine-print/data-privacy-policy.qmd b/site/about/fine-print/data-privacy-policy.qmd
index 734d2c7f6a..2bb274fdc2 100644
--- a/site/about/fine-print/data-privacy-policy.qmd
+++ b/site/about/fine-print/data-privacy-policy.qmd
@@ -38,16 +38,16 @@ Understanding our policies shouldn’t feel like deciphering code, so we’ve ma
 
 The key points of our data privacy policy include:
 
-- **No personal identifiable information in documentation** — When the {{< var validmind.developer >}} generates documentation, it ensures that no personally identifiable information (PII) is included. This practice is a critical part of our commitment to protecting your privacy and maintaining the confidentiality of your data.
+- **No personally identifiable information in documentation** — When the {{< var validmind.developer >}} generates documentation, it ensures that no personally identifiable information (PII) is included. This practice is a critical part of our commitment to protecting your privacy and maintaining the confidentiality of your data.
 
-- **No storage of customer data** — {{< var vm.product >}} does not retain any customer datasets or models. This policy is in place in order to protect your data privacy and security. By not storing this information, {{< var vm.product >}} minimizes the risk of unauthorized access or data breaches.
+- **No storage of customer data** — {{< var vm.product >}} does not retain any customer datasets or records (models). This policy is in place in order to protect your data privacy and security. By not storing this information, {{< var vm.product >}} minimizes the risk of unauthorized access or data breaches.
 
 We believe it is important for users of {{< var vm.product >}}'s products to understand these practices as they reflect our dedication to data security and privacy.
 
 ::: {.callout-important}
 ## {{< var vm.product >}} does NOT: 
-- Include any personal identifiable information (PII) when generating documentation reports.
-- Store any customer datasets or models. 
+- Include any personally identifiable information (PII) when generating documentation reports.
+- Store any customer datasets or records (models). 
 :::
 
 ## Do you comply with the SOC 2 security standard?
@@ -64,13 +64,13 @@ The {{< var validmind.vpv >}} option provides all our features and services but
 
 Access is available through AWS PrivateLink, Azure Private Link, or GCP Private Service Connect, all of which provide private connectivity between {{< var vm.product >}} and your on-premises network without exposing your traffic to the public internet. 
 
-## What model assets are imported into documentation?
+## What record (model) assets are imported into documentation?
 
 When you generate documentation or run tests, {{< var vm.product >}} imports the following assets into the documentation via our {{< var validmind.api >}} endpoint integration:
 
 ![Artifacts imported into the documentation via our {{< var vm.api >}}](overview-api-integration.jpg){width=80% fig-alt="A representation of assets imported into the documentation via our Python API"}
 
-- Metadata about datasets and models, used to look up programmatic documentation content, such as the stored definition for _common logistic regression limitations_ when a logistic regression model has been passed to the {{< var vm.product >}} test suite to be run.
+- Metadata about datasets and records, used to look up programmatic documentation content, such as the stored definition for _common logistic regression limitations_ when a logistic regression model has been passed to the {{< var vm.product >}} test suite to be run.
 - Quality and performance metrics collected from datasets and models.
 - Output from tests and test suites that have been run.
 - Images, plots, visuals that were generated as part of extracting metrics and running tests.
diff --git a/site/about/glossary/_ai-governance.qmd b/site/about/glossary/_ai-governance.qmd
new file mode 100644
index 0000000000..4b9324e7c6
--- /dev/null
+++ b/site/about/glossary/_ai-governance.qmd
@@ -0,0 +1,42 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+AI ethics
+: A set of principles and practices guiding the responsible design, development, and deployment of AI systems. Common tenets include fairness, transparency, accountability, privacy, and human well-being.
+
+AI lifecycle
+: The end-to-end stages an AI system progresses through, including problem framing, data collection, model development, validation, deployment, monitoring, and retirement. Each stage carries distinct governance requirements.
+
+AI risk
+: The potential for adverse outcomes — financial, reputational, ethical, regulatory, or societal — arising from the design, deployment, or use of AI systems. AI risk extends beyond traditional model risk to include concerns such as bias, opacity, misuse, and unintended consequences.
+
+algorithmic accountability
+: The principle that organizations must take responsibility for the outcomes of the AI systems they deploy, including documenting decisions, monitoring performance, and providing mechanisms to identify and remediate harm.
+
+bias, algorithmic bias
+: Systematic errors or unfair outcomes in AI system results that disproportionately affect specific groups. Sources include unrepresentative training data, flawed assumptions in system design, or feedback loops introduced during deployment. Detecting and mitigating bias is a core AI governance activity.
+
+<span id="eu-ai-act">EU AI Act</span>
+: A regulatory framework introduced by the European Union that classifies AI systems by risk tier^[**European Union:** [Regulation (EU) 2024/1689: Artificial Intelligence Act](https://eur-lex.europa.eu/eli/reg/2024/1689/oj)] — prohibited, high-risk, limited-risk, and minimal-risk — and imposes proportionate obligations such as risk management, data governance, transparency, human oversight, and conformity assessment.
+
+explainability
+: The degree to which the internal mechanics or outputs of an AI system can be understood by humans. Explainability is a core requirement for high-risk AI systems and supports accountability, debugging, and regulatory review.
+
+fairness
+: The principle that AI systems should produce equitable outcomes across individuals and groups. Fairness assessments are a routine part of bias evaluation and impact assessment within AI governance programs.
+
+ISO/IEC 42001
+: An international management system standard for artificial intelligence published jointly by the International Organization for Standardization (ISO) and the International Electrotechnical Commission (IEC). Provides requirements for establishing, implementing, maintaining, and continually improving an AI management system within an organization.
+
+model card, system card
+: A standardized document that summarizes an AI system's intended use, training data, performance characteristics, limitations, and ethical considerations. Model and system cards support transparency and informed deployment decisions.^[**Refer also to:** [documentation](#documentation)]
+
+NIST AI Risk Management Framework (AI RMF)
+: A voluntary framework published by the U.S. National Institute of Standards and Technology to help organizations manage risks associated with AI. Organized around four core functions: govern, map, measure, and manage.
+
+responsible AI
+: An umbrella approach to designing, building, and deploying AI systems in ways that are ethical, transparent, accountable, fair, and aligned with human values and societal expectations.
+
+transparency
+: The disclosure of meaningful information about an AI system's design, data, capabilities, limitations, and decision-making processes to relevant stakeholders. Transparency supports trust, accountability, and informed oversight.
diff --git a/site/about/glossary/_ai.qmd b/site/about/glossary/_ai.qmd
index 5ef7bba2ff..b2b90b0106 100644
--- a/site/about/glossary/_ai.qmd
+++ b/site/about/glossary/_ai.qmd
@@ -5,40 +5,48 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 Refer to [IBM's series on artificial intelligence](https://www.ibm.com/think/artificial-intelligence) for more in-depth resources.
 
 AI governance
-: The organizational framework for directing and overseeing how AI is designed, deployed, and used. It sets policy, accountability, and decision rights, covering ethics, compliance, risk appetite, lifecycle controls, and ongoing oversight across people, process, and technology.
+: The organizational framework for directing and overseeing how AI is designed, deployed, and used. It sets policy, accountability, and decision rights, covering ethics, compliance, risk appetite, lifecycle controls, and ongoing oversight across people, process, and technology.^[**Refer also to:** [AI governance](#ai-governance)]
 
 AI system
-: A combination of software, algorithms, and data designed to perform tasks that typically require human intelligence. In AI governance, an AI system is the primary unit of management, distinct from individual models.
+: A combination of software, algorithms, and data designed to perform tasks that typically require human intelligence. In AI governance, an AI system is the primary unit of management, distinct from individual records (such as models).[^ai-system]
 
 AI use case
 : A specific application or deployment of AI technology to solve a business problem or achieve an objective. Use cases are often the unit of oversight in AI governance frameworks.
 
 artificial intelligence (AI)
-: Artificial intelligence is a broad term used to classify machines that mimic human intelligence and human cognitive functions like problem-solving and learning. 
+: Artificial intelligence is a broad term used to classify machines that mimic human intelligence and human cognitive functions like problem-solving and learning.
 
 deep-learning
-: A subset of machine learning that uses multi-layered neural networks (deep neural networks) to simulate the complex decision-making power of the human brain. 
+: A subset of machine learning that uses multi-layered neural networks (deep neural networks) to simulate the complex decision-making power of the human brain.
 
 generative AI (GenAI)
 : Generative AI refers to deep-learning models that can generate high-quality text, images, and other content based on the data they were trained on.
 
 human oversight
-: Controls and processes ensuring human involvement in AI-driven decisions. Required by regulations like the EU AI Act for high-risk AI systems to enable human intervention and override capabilities.
+: Controls and processes ensuring human involvement in AI-driven decisions. Required by regulations like the EU AI Act for high-risk AI systems to enable human intervention and override capabilities.^[**Refer also to:** [EU AI Act](./glossary.qmd#eu-ai-act)]
 
 impact assessment
 : An evaluation of the potential risks, harms, and consequences associated with deploying an AI system. Impact assessments are a core artifact in AI governance programs.
 
 large language model (LLM)
-: Advanced types of artificial intelligence models designed to understand, generate, and interact with human language at a sophisticated level, such as ChatGPT.^[[ChatGPT](https://chat.openai.com)]
+: An advanced type of artificial intelligence model designed to understand, generate, and interact with human language at a sophisticated level, such as ChatGPT.^[[ChatGPT](https://chat.openai.com)]
 
-machine learning
-: Machine learning is a subset of artificial intelligence that allows for optimization. It helps make predictions that minimize the errors that arise from merely guessing. 
+machine learning (ML)
+: Machine learning is a subset of artificial intelligence that allows for optimization. It helps make predictions that minimize the errors that arise from merely guessing.
 
 risk tier
-: A classification level assigned to an AI system based on its potential impact and risk. The EU AI Act defines tiers including prohibited, high-risk, limited-risk, and minimal-risk categories.
+: A classification level assigned to an AI system based on its potential impact and risk. The EU AI Act defines tiers including prohibited, high-risk, limited-risk, and minimal-risk categories.^[**Refer also to:** [EU AI Act](./glossary.qmd#eu-ai-act)]
 
-traditional statistical models
-: Mathematical frameworks used to analyze and make inferences from data. These models are foundational in statistics and serve to explain relationships, predict outcomes, and guide decision-making across various fields, such as economics, biology, engineering, and social sciences.
+traditional statistical model
+: A mathematical framework used to analyze and make inferences from data. Traditional statistical models are foundational in statistics and serve to explain relationships, predict outcomes, and guide decision-making across various fields, such as economics, biology, engineering, and social sciences.
 
 use case owner
 : The individual accountable for an AI use case within an organization. Responsible for decisions about AI deployment, compliance, and ongoing oversight.
+
+
+<!-- ADDITIONAL FOOTNOTES -->
+
+[^ai-system]: **Refer to:**
+
+    - [record](#records)
+    - [model](#models)
diff --git a/site/about/glossary/_attestation.qmd b/site/about/glossary/_attestation.qmd
index 2ca29bdacf..75271ae84e 100644
--- a/site/about/glossary/_attestation.qmd
+++ b/site/about/glossary/_attestation.qmd
@@ -2,29 +2,29 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-attestation 
-: A formal process where attestation participants certify key model information at a specific time. Attestation is part of your audit trail and confirms that governance, documentation, and control requirements are met.
+attestation
+: A formal process where attestation participants certify key record (model) information at a specific time. Attestation is part of your audit trail and confirms that governance, documentation, and control requirements are met.
 
 attestation instance
-: The invocation of the attestation process on the {{< var validmind.platform >}}. Created when the attestation is triggered by the schedule you set up, it includes a snapshot with record activity and artifacts, questionnaire responses and review status, forming a full record of the review and approval process. 
+: The invocation of the attestation process on the {{< var validmind.platform >}}. Created when the attestation is triggered by the schedule you set up, it includes a snapshot with record activity and artifacts, questionnaire responses, and review status, forming a full record of the review and approval process.
 
 attestation participant
-: A user who participates in the attestation workflow as a submitter, reviewer, or approver. Submitters are assigned from model stakeholders; reviewers and approvers are assigned from organizational roles.
+: A user who participates in the attestation workflow as a submitter, reviewer, or approver. Submitters are assigned from inventory record stakeholders; reviewers and approvers are assigned from organizational roles.
 
-attestation period  
-: The time window during which attestation is active, with fixed start and end dates. Each period creates an unchanging model snapshot. Periods are usually scheduled quarterly or annually and can align with regulatory or internal cycles.
+attestation period
+: The time window during which attestation is active, with fixed start and end dates. Each period creates an unchanging record (model) snapshot. Periods are usually scheduled quarterly or annually and can align with regulatory or internal cycles.
 
-attestation questionnaire  
-: A structured form that submitters use to confirm model status, documentation and compliance. It supports formatted inputs like checkboxes and text fields, serving as both a compliance check and formal review record.
+attestation questionnaire
+: A structured form that submitters use to confirm record (model) status, documentation, and compliance. It supports formatted inputs like checkboxes and text fields, serving as both a compliance check and formal review record.
 
-execution schedule  
+execution schedule
 : The mechanism, manual or automated, that starts the attestation process based on set periods. It creates attestation instances, triggers snapshots and begins the workflow for attestation participants.
 
 group
-: An organizational unit that associates models with specific teams or functions. When reviewers or approvers are assigned by role, they can only act on models within groups they belong to — resulting in one attestation submission per model owner per group.
+: An organizational unit that associates records (models) with specific teams or functions. When reviewers or approvers are assigned by role, they can only act on records within groups they belong to — resulting in one attestation submission per owner per group.
 
 inventory scope
-: The filter conditions that define which models are included in an attestation. Scope can be set using rules based on model fields, stages, or custom attributes.
+: The filter conditions that define which records (models) are included in an attestation. Scope can be set using rules based on fields, stages, or custom attributes.
 
-snapshot  
-: A fixed capture of model data at a specific time. It includes optional custom fields and related artifacts and stays unchanged throughout the attestation, ensuring historical accuracy.
\ No newline at end of file
+snapshot
+: A fixed capture of record (model) data at a specific time. It includes optional custom fields and related artifacts and stays unchanged throughout the attestation, ensuring historical accuracy.
\ No newline at end of file
diff --git a/site/about/glossary/_developer-tools.qmd b/site/about/glossary/_developer-tools.qmd
index 0381ba6ff1..9dd5cb07bd 100644
--- a/site/about/glossary/_developer-tools.qmd
+++ b/site/about/glossary/_developer-tools.qmd
@@ -14,9 +14,9 @@ Decorators are a simpler way for users to run their own code as a {{< var vm.pro
 {{< include key_concepts/_parameters.qmd >}}
 
 pip
-: A package manager for Python, used to install and manage software packages written in the Python programming language. 
+: A package manager for Python, used to install and manage software packages written in the Python programming language.
 
-{{< var vm.product >}} uses the `pip` command to install the Python client library that is part of the {{< var validmind.developer >}} so that model developers can make use of its features.
+{{< var vm.product >}} uses the `pip` command to install the Python client library that is part of the {{< var validmind.developer >}} so that developers can make use of its features.
 
 JupyterHub
 : A multi-user server provides a platform for users to interactively work with data science and scientific computing tools in a collaborative environment. 
@@ -33,4 +33,4 @@ Jupyter Notebook
 GitHub
 : A cloud-based platform that provides hosting for software development and version control using Git. GitHub^[[GitHub](https://github.com/)] offers collaboration tools such as bug tracking, feature requests, task management, and continuous integration pipelines. 
 
-{{< var vm.product >}} uses GitHub to share [pen-source software^[**GitHub:** [validmind](https://github.com/validmind/)] with you.
+{{< var vm.product >}} uses GitHub to share open-source software^[**GitHub:** [validmind](https://github.com/validmind/)] with you.
diff --git a/site/about/glossary/_documentation.qmd b/site/about/glossary/_documentation.qmd
new file mode 100644
index 0000000000..fc4a038cd3
--- /dev/null
+++ b/site/about/glossary/_documentation.qmd
@@ -0,0 +1,23 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+<!-- IF A DOCUMENTATION CONCEPT NEEDS TO BE ADDED:
+
+1. Create a new file under the `about/glossary/documentation` folder with the following structure `_doc-feature.qmd` (the `_` is mandatory for Quarto to retrieve the file as a single-source embed: https://quarto.org/docs/authoring/includes.html)
+2. Embed it below in ABC order with the structure `{{< include documentation/_doc-feature.qmd >}}` 
+
+These instructions update the documentation concept on `working-with-documentation.qmd` as well as the glossary. 
+
+-->
+
+{{< include documentation/_doc-intro.qmd >}}
+
+{{< include documentation/_conceptual-soundness.qmd >}}
+
+{{< include documentation/_data-preparation.qmd >}}
+
+{{< include documentation/_model-development.qmd >}}
+
+{{< include documentation/_monitoring-governance.qmd >}}
+
diff --git a/site/about/glossary/_model-documentation.qmd b/site/about/glossary/_model-documentation.qmd
deleted file mode 100644
index b0c983236b..0000000000
--- a/site/about/glossary/_model-documentation.qmd
+++ /dev/null
@@ -1,23 +0,0 @@
-<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-Refer to the LICENSE file in the root of this repository for details.
-SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
-
-<!-- IF A MODEL DOCUMENTATION CONCEPT NEEDS TO BE ADDED:
-
-1. Create a new file under the `about/glossary/model_documentation` folder with the following structure `_doc-feature.qmd` (the `_` is mandatory for Quarto to retrieve the file as a single-source embed: https://quarto.org/docs/authoring/includes.html)
-2. Embed it below in ABC order with the structure `{{< include model_documentation/_doc-feature.qmd >}}` 
-
-These instructions update the documentation concept on `working-with-documentation.qmd` as well as the glossary. 
-
--->
-
-{{< include model_documentation/_doc-intro.qmd >}}
-
-{{< include model_documentation/_conceptual-soundness.qmd >}}
-
-{{< include model_documentation/_data-preparation.qmd >}}
-
-{{< include model_documentation/_model-development.qmd >}}
-
-{{< include model_documentation/_monitoring-governance.qmd >}}
-
diff --git a/site/about/glossary/_models.qmd b/site/about/glossary/_models.qmd
index 0bc6ee8e3f..8c9ce74f80 100644
--- a/site/about/glossary/_models.qmd
+++ b/site/about/glossary/_models.qmd
@@ -4,14 +4,13 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 #### Models
 
-model
-: SR 11-7^[[SR 11-7: Guidance on Model Risk Management](https://www.federalreserve.gov/supervisionreg/srletters/sr1107.htm)] defines a model as a "quantitative method, system, or approach that applies statistical, economic, financial, or mathematical theories, techniques, and assumptions to process input data into quantitative estimates."
+{{< include /about/glossary/key_concepts/_docs.qmd >}}
+
+{{< include /about/glossary/key_concepts/_models.qmd >}}
 
 model development
 : An iterative process in which many models are derived, tested, and built upon until a model fitting the desired criteria is achieved.
 
-{{< include key_concepts/_docs.qmd >}}
-
 <!-- VISIBLE ONLY ON PAGES THAT HAVE A CUSTOM METADATA TAG:
 
 ```includes:
@@ -19,7 +18,7 @@ model development
 ``` -->
 
 :::: {.content-visible when-format="html" when-meta="includes.glossary"}
-model inventory^[**Refer also to:** [{{< var vm.product >}} model inventory](./glossary.qmd#platform-model-inventory)]
+model inventory^[**Refer also to:** [inventory](./glossary.qmd#inventory)]
 : A systematic and organized record of all quantitative and qualitative models used within an organization. This inventory facilitates oversight, tracking, and assessment by listing each model's purpose, characteristics, owners, validation status, and associated risks.
 
 ::::
diff --git a/site/about/glossary/_mrm.qmd b/site/about/glossary/_mrm.qmd
index 4872d9f341..31835071a4 100644
--- a/site/about/glossary/_mrm.qmd
+++ b/site/about/glossary/_mrm.qmd
@@ -13,27 +13,27 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 3rd line of defense
 : Typically an internal audit function responsible for providing an independent and comprehensive review of the risk management processes and controls that the first two lines have implemented. 
 
-model developer
+model developer, developer
 : Responsible for the design, implementation, and maintenance of models to ensure they are fit-for-purpose, accurate, and aligned with business requirements. As subject matter experts, they collaborate with model validators and other business units, ensuring the models are conceptually sound and robust. 
 
-model governance
+model governance, governance
 : A framework of policies, procedures, and standards established to oversee the lifecycle of models within an organization. Ensures that models are developed, validated, implemented, and retired in a controlled and consistent manner, promoting accountability, transparency, and adherence to regulatory requirements.
 
-model implementation
+model implementation, implementation
 : A collaborative effort among model developers and model owners. Model implementation includes a formalized implementation plan and associated procedures, a review of results, and a record of model change procedures. 
 
-model owner
+model owner, owner
 : Responsible for coordinating model development, model implementation, ongoing model monitoring and maintaining the model’s administration, such as model documentation and model risk reporting.
 
-model user
+model user, user
 : Those who rely on the model’s outputs to inform business decisions. 
 
-model validation
+model validation, validation
 : A systematic process to evaluate and verify that a model is performing as intended, accurately represents the phenomena it is designed to capture, and is appropriate for its specified purpose. This assessment encompasses a review of the model's conceptual soundness, data integrity, calibration, and performance outcomes, as well as testing against out-of-sample datasets. 
     
 Within model risk management, model validation ensures that potential risks associated with model errors, misuse, or misunderstanding are identified and mitigated.
 
-model validator
+model validator, validator
 : Responsible for conducting independent assessments of models to ensure their accuracy, reliability, and appropriateness for intended purposes. The role involves evaluating a model's conceptual soundness, data integrity, calibration methods, and overall performance, typically using out-of-sample datasets. 
 
 Model validators identify potential risks and weaknesses, ensuring that models within an organization meet established standards and regulatory requirements, and provide recommendations to model developers for improvements or modifications.
diff --git a/site/about/glossary/_validmind-features.qmd b/site/about/glossary/_validmind-features.qmd
index 2be12d5923..4d3cc46369 100644
--- a/site/about/glossary/_validmind-features.qmd
+++ b/site/about/glossary/_validmind-features.qmd
@@ -8,16 +8,26 @@ client library, Python client library
 : Enables the interaction of your development environment with the {{< var validmind.platform >}} as part of the {{< var validmind.developer >}}.
 
 content block
-: Content blocks provide you with sections that are part of a template, and are used in model documentation, validation reports, ongoing monitoring reports, and custom document types.^[[Work with content blocks](/guide/documentation/work-with-content-blocks.qmd)]
+: A modular document template component. Content blocks are used to populate text and test results in documentation, validation reports, ongoing monitoring reports, and custom document types.^[[Work with content blocks](/guide/documentation/work-with-content-blocks.qmd)]
 
 documentation automation
-: A core benefit of {{< var vm.product >}} that allows for the automatic creation of model documentation using predefined templates and test suites.
+: A core benefit of {{< var vm.product >}} that allows for the automatic creation of documentation using predefined templates and test suites.[^test-suite]
 
-<span id="platform-model-inventory">model inventory</span>
-: A feature of the {{< var validmind.platform >}} where you can track, manage, and oversee the lifecycle of models. Covers the full model lifecycle, including customizable approval workflows for different user roles, status and activity tracking, and periodic revalidation. 
+<span id="inventory">inventory</span>
+: A feature of the {{< var validmind.platform >}} where you can track, manage, and oversee the lifecycle of your records (such as models). Covers the full record lifecycle, including customizable approval workflows for different user roles, status and activity tracking, and periodic revalidation.
+
+{{< include key_concepts/_records.qmd >}}
 
 {{< include key_concepts/_template.qmd >}}
 
 {{< include key_concepts/_test.qmd >}}
 
-{{< include key_concepts/_test-suite.qmd >}}
\ No newline at end of file
+{{< include key_concepts/_test-suite.qmd >}}
+
+
+<!-- ADDITIONAL FOOTNOTES -->
+
+[^test-suite]: **Refer to:**
+
+    - [document template](/about/glossary/glossary.qmd#document-template)
+    - [test suite](/about/glossary/glossary.qmd#test-suite)
\ No newline at end of file
diff --git a/site/about/glossary/_validmind.qmd b/site/about/glossary/_validmind.qmd
index fcba5f96cc..b9d29c8ff5 100644
--- a/site/about/glossary/_validmind.qmd
+++ b/site/about/glossary/_validmind.qmd
@@ -4,10 +4,10 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 #### {{< var validmind.product >}}
 
-These two features are intertwined and work in tandem to help streamline your model lifecycle.
+These two features are intertwined and work in tandem to help streamline your risk management lifecycles.
 
 <span id="framework">{{< var validmind.developer >}} ({{< var vm.developer >}})</span>
-: An open-source^[**{{< var vm.product >}} GitHub:** [`validmind-library`](https://github.com/validmind/validmind-library/)] suite of documentation tools and test suites designed to document models, test models for weaknesses, and identify overfit areas. Enables automating the generation of model documentation by uploading documentation and test results to the {{< var validmind.platform >}}.
+: An open-source^[**{{< var vm.product >}} GitHub:** [`validmind-library`](https://github.com/validmind/validmind-library/)] suite of documentation tools and test suites designed to document records (such as models), test records for weaknesses, and identify overfit areas. Enables automating the generation of documentation by uploading documentation and test results to the {{< var validmind.platform >}}.
 
 <span id="platform">{{< var validmind.platform >}} ({{< var vm.platform >}})</span>
-: A hosted multi-tenant architecture^[[Log into {{< var vm.product >}}](/guide/access/log-in-to-validmind.qmd)] that includes the {{< var vm.product >}} cloud-based web interface, APIs, databases, documentation and validation engine, and various internal services. 
+: A hosted multi-tenant architecture^[[Log into {{< var vm.product >}}](/guide/access/log-in-to-validmind.qmd)] that includes the {{< var vm.product >}} cloud-based web interface, APIs, databases, documentation and validation engine, and various internal services.
diff --git a/site/about/glossary/documentation/_conceptual-soundness.qmd b/site/about/glossary/documentation/_conceptual-soundness.qmd
new file mode 100644
index 0000000000..1dae64104f
--- /dev/null
+++ b/site/about/glossary/documentation/_conceptual-soundness.qmd
@@ -0,0 +1,6 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+conceptual soundness
+: Establishes the foundation of a selected record (such as a model), covering the overview, intended use and business use case, regulatory requirements, limitations, and the rationale behind selection. It emphasizes purpose, scope, and constraints, which are crucial for stakeholders to understand applicability and limitations.
diff --git a/site/about/glossary/model_documentation/_data-preparation.qmd b/site/about/glossary/documentation/_data-preparation.qmd
similarity index 88%
rename from site/about/glossary/model_documentation/_data-preparation.qmd
rename to site/about/glossary/documentation/_data-preparation.qmd
index 9a5b539e85..84646b6c75 100644
--- a/site/about/glossary/model_documentation/_data-preparation.qmd
+++ b/site/about/glossary/documentation/_data-preparation.qmd
@@ -3,4 +3,4 @@ Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 data preparation
-: Details the data description, including dataset summary, data quality tests, descriptive statistics, correlations and interactions, and feature selection and engineering. It provides transparency into the data used for training, ensuring that the record such as a model is built on a solid and relevant dataset.
\ No newline at end of file
+: Details the data description, including dataset summary, data quality tests, descriptive statistics, correlations and interactions, and feature selection and engineering. It provides transparency into the data used for training, ensuring that the record (such as a model) is built on a solid and relevant dataset.
\ No newline at end of file
diff --git a/site/about/glossary/model_documentation/_doc-intro.qmd b/site/about/glossary/documentation/_doc-intro.qmd
similarity index 100%
rename from site/about/glossary/model_documentation/_doc-intro.qmd
rename to site/about/glossary/documentation/_doc-intro.qmd
diff --git a/site/about/glossary/model_documentation/_model-development.qmd b/site/about/glossary/documentation/_model-development.qmd
similarity index 81%
rename from site/about/glossary/model_documentation/_model-development.qmd
rename to site/about/glossary/documentation/_model-development.qmd
index 5acf1242eb..1c7eafc727 100644
--- a/site/about/glossary/model_documentation/_model-development.qmd
+++ b/site/about/glossary/documentation/_model-development.qmd
@@ -3,4 +3,4 @@ Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 model development, development
-: Discusses the training, evaluation, explainability, interpretability, and diagnosis, including weak spots, overfit regions, and robustness. This section is vital for understanding how the record such as a model was developed, how it performs, and its areas of strength and weakness.
+: Discusses the training, evaluation, explainability, interpretability, and diagnosis, including weak spots, overfit regions, and robustness. This section is vital for understanding how the record (such as a model) was developed, how it performs, and its areas of strength and weakness.
diff --git a/site/about/glossary/documentation/_monitoring-governance.qmd b/site/about/glossary/documentation/_monitoring-governance.qmd
new file mode 100644
index 0000000000..05ccf5390e
--- /dev/null
+++ b/site/about/glossary/documentation/_monitoring-governance.qmd
@@ -0,0 +1,6 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+monitoring and governance
+: Focuses on the ongoing monitoring plan, implementation, and governance plan for the record (such as a model). It outlines strategies for maintaining the record's performance over time and ensuring that it remains compliant with regulatory requirements and ethical standards.
\ No newline at end of file
diff --git a/site/about/glossary/glossary.qmd b/site/about/glossary/glossary.qmd
index cbf0c8ab03..43167cf368 100644
--- a/site/about/glossary/glossary.qmd
+++ b/site/about/glossary/glossary.qmd
@@ -17,32 +17,39 @@ includes:
 This glossary of terms provides short definitions for technical terms you find commonly used in our product documentation grouped by terms related to:
 
 - [{{< var vm.product >}}](#validmind)
-- [Artificial intelligence](#artificial-intelligence)
-- [Models and model risk management](#models-and-model-risk-management)
-- [Model documentation](#model-documentation)
+- [Artificial intelligence (AI) governance](#artificial-intelligence-ai-governance)
+- [Model risk management](#model-risk-management)
+- [Documentation](#documentation)
 - [Validation reports](#validation-reports)
 - [Ongoing monitoring](#ongoing-monitoring)
 - [Attestations](#attestations)
 - [Integrations](#integrations)
 - [Developer tools](#developer-tools)
+<br><br>
 
 ## {{< var vm.product >}}
 
 {{< include _validmind.qmd >}}
 {{< include _validmind-features.qmd >}}
 
-## Artificial intelligence
+## Artificial intelligence (AI) governance
+
+#### AI
 
 {{< include _ai.qmd >}}
 
-## Models and model risk management
+#### AI governance
+
+{{< include _ai-governance.qmd >}}
+
+## Model risk management
 
 {{< include _models.qmd >}}
 {{< include _mrm.qmd >}}
 
-## Model documentation
+## Documentation
 
-{{< include _model-documentation.qmd >}}
+{{< include _documentation.qmd >}}
 
 ## Validation reports
 
diff --git a/site/about/glossary/key_concepts/_docs.qmd b/site/about/glossary/key_concepts/_docs.qmd
index 0ff2fa8d76..886d9f2f20 100644
--- a/site/about/glossary/key_concepts/_docs.qmd
+++ b/site/about/glossary/key_concepts/_docs.qmd
@@ -2,7 +2,12 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-model documentation
-: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. 
-    
-Within the realm of model risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model's application.
\ No newline at end of file
+<span id="documentation"></span>
+
+documentation, model documentation
+: A structured and detailed account pertaining to a record (such as a model), encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses.
+
+:::: {.content-visible when-format="html" when-meta="includes.glossary"}
+Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.
+
+::::
\ No newline at end of file
diff --git a/site/about/glossary/key_concepts/_inputs.qmd b/site/about/glossary/key_concepts/_inputs.qmd
index 0c45358b5e..bc148ade75 100644
--- a/site/about/glossary/key_concepts/_inputs.qmd
+++ b/site/about/glossary/key_concepts/_inputs.qmd
@@ -5,7 +5,19 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 inputs
 : Objects to be evaluated and documented in the {{< var validmind.developer >}}. They can be any of the following:
 
-  - **model**: A single model that has been initialized in {{< var vm.product >}}. Refer to the [`vm.init_model()` function](/validmind/validmind.qmd#init_model){target="_blank"} for more information.
-  - **dataset**: Single dataset that has been initialized in {{< var vm.product >}}. Refer to the [`vm.init_dataset()` function](/validmind/validmind.qmd#init_dataset){target="_blank"} for more information.
-  - **models**: A list of {{< var vm.product >}} models - usually this is used when you want to compare multiple models in your custom tests.
-  - **datasets**: A list of {{< var vm.product >}} datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.ipynb))
\ No newline at end of file
+:::: {.content-visible when-format="html" when-meta="includes.glossary"}
+  - **model**: A single record (such as a model) that has been initialized in {{< var vm.product >}}. Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with {{< var vm.product >}}.^[**Refer to:** [`init_model()`](/validmind/validmind.qmd#init_model){target="_blank"}]
+  - **dataset**: A single dataset that has been initialized in {{< var vm.product >}}.^[**Refer to:** [`init_dataset()`](/validmind/validmind.qmd#init_dataset){target="_blank"}]
+  - **models**: A list of {{< var vm.product >}} records — usually this is used when you want to compare multiple records in your custom tests.
+  - **datasets**: A list of {{< var vm.product >}} datasets — usually this is used when you want to compare multiple datasets in your custom tests.^[**Learn more:** [Run tests with multiple datasets](/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.ipynb)]
+  
+::::
+
+:::: {.content-visible when-format="html" unless-meta="includes.glossary"}
+  - **model**: A single record (such as a model) that has been initialized in {{< var vm.product >}}. Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with {{< var vm.product >}}. Refer to the [`vm.init_model()` function](/validmind/validmind.qmd#init_model){target="_blank"} for more information.
+  - **dataset**: A single dataset that has been initialized in {{< var vm.product >}}. Refer to the [`vm.init_dataset()` function](/validmind/validmind.qmd#init_dataset){target="_blank"} for more information.
+  - **models**: A list of {{< var vm.product >}} records — usually this is used when you want to compare multiple records in your custom tests.
+  - **datasets**: A list of {{< var vm.product >}} datasets — usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.ipynb))
+
+::::
+
diff --git a/site/about/glossary/key_concepts/_key-concepts.qmd b/site/about/glossary/key_concepts/_key-concepts.qmd
index 4e2fe9c64d..73a4f68bab 100644
--- a/site/about/glossary/key_concepts/_key-concepts.qmd
+++ b/site/about/glossary/key_concepts/_key-concepts.qmd
@@ -6,20 +6,28 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 1. Create a new file under the `about/glossary/key_concepts` folder with the following structure `_concept.qmd` (the `_` is mandatory for Quarto to retrieve the file as a single-source embed: https://quarto.org/docs/authoring/includes.html)
 2. Include it below with the structure `{{< include /about/glossary/key_concepts/_concept.qmd >}}`
-3. In the `about/glossary` folder, locate the correct section file it belongs to (e.g. `_ai.qmd`) and embed it there as well in ABC order with the structure `{{< include key_concepts/_concept.qmd >}}` 
+3. In the `about/glossary` folder, locate the correct section file it belongs to (e.g. `_ai.qmd`) and embed it there as well in ABC order with the structure `{{< include key_concepts/_concept.qmd >}}`
 
 These instructions update the key concept on anywhere the key concepts are reference as well as within the glossary.
 
 -->
 
+{{< include /about/glossary/key_concepts/_records.qmd >}}
+
+{{< include /about/glossary/key_concepts/_models.qmd >}}
+
 {{< include /about/glossary/key_concepts/_docs.qmd >}}
 
 {{< include /about/glossary/key_concepts/_report.qmd >}}
 
+{{< include /about/glossary/monitoring/_ongoing-monitoring.qmd >}}
+
 {{< include /about/glossary/key_concepts/_template.qmd >}}
 
 {{< include /about/glossary/key_concepts/_test.qmd >}}
 
+{{< include /about/glossary/key_concepts/_test-suite.qmd >}}
+
 {{< include /about/glossary/key_concepts/_metrics.qmd >}}
 
 {{< include /about/glossary/key_concepts/_inputs.qmd >}}
@@ -28,4 +36,3 @@ These instructions update the key concept on anywhere the key concepts are refer
 
 {{< include /about/glossary/key_concepts/_outputs.qmd >}}
 
-{{< include /about/glossary/key_concepts/_test-suite.qmd >}}
\ No newline at end of file
diff --git a/site/about/glossary/key_concepts/_metrics.qmd b/site/about/glossary/key_concepts/_metrics.qmd
index 53dd1223f7..d95bb3588d 100644
--- a/site/about/glossary/key_concepts/_metrics.qmd
+++ b/site/about/glossary/key_concepts/_metrics.qmd
@@ -2,7 +2,16 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
+:::: {.content-visible when-format="html" when-meta="includes.glossary"}
 metrics, custom metrics
-: Metrics are a subset of tests that do not have thresholds. Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered via the {{< var validmind.developer >}} to be used with the {{< var validmind.platform >}}.
+: Metrics are a subset of tests that do not have thresholds. Custom metrics are functions that you define to evaluate your record (such as a model) or dataset. These functions can be registered via the {{< var validmind.developer >}} to be used with the {{< var validmind.platform >}}.
 
-In the context of {{< var vm.product >}}'s Jupyter Notebooks, metrics and tests can be thought of as interchangeable concepts. 
\ No newline at end of file
+In the context of {{< var vm.product >}}'s Jupyter Notebooks, metrics and tests can be thought of as interchangeable concepts.^[**Refer also to:** [test](/about/glossary/glossary.qmd#tests)]
+::::
+
+:::: {.content-visible when-format="html" unless-meta="includes.glossary"}
+metrics, custom metrics
+: Metrics are a subset of tests that do not have thresholds. Custom metrics are functions that you define to evaluate your record (such as a model) or dataset. These functions can be registered via the {{< var validmind.developer >}} to be used with the {{< var validmind.platform >}}.
+
+In the context of {{< var vm.product >}}'s Jupyter Notebooks, metrics and tests can be thought of as interchangeable concepts.
+::::
\ No newline at end of file
diff --git a/site/about/glossary/key_concepts/_models.qmd b/site/about/glossary/key_concepts/_models.qmd
new file mode 100644
index 0000000000..15bdf932df
--- /dev/null
+++ b/site/about/glossary/key_concepts/_models.qmd
@@ -0,0 +1,17 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+:::: {.content-visible when-format="html" when-meta="includes.glossary"}
+model
+: SR 26-2^[[SR 26-2: Interagency Guidance on Model Risk Management for Banking Organizations](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm)] (which supersedes SR 11-7) defines a model as a "complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates." Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model.
+
+Within {{< var vm.product >}}, a model is a type of record tracked in the inventory.^[**Refer also to:** [record](/about/glossary/glossary.qmd#records)]
+::::
+
+:::: {.content-visible when-format="html" unless-meta="includes.glossary"}
+model
+: SR 26-2 (which supersedes SR 11-7) defines a model as a "complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates." Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model.
+
+Within {{< var vm.product >}}, a model is a type of record tracked in the inventory.
+::::
\ No newline at end of file
diff --git a/site/about/glossary/key_concepts/_records.qmd b/site/about/glossary/key_concepts/_records.qmd
new file mode 100644
index 0000000000..174f514997
--- /dev/null
+++ b/site/about/glossary/key_concepts/_records.qmd
@@ -0,0 +1,16 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+:::: {.content-visible when-format="html" when-meta="includes.glossary"}
+<span id="records">record</span>
+: A tool tracked in the {{< var validmind.platform >}} inventory, such as a model.^[**Refer also to:** [model](/about/glossary/glossary.qmd#models)] Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.
+
+::::
+
+:::: {.content-visible when-format="html" unless-meta="includes.glossary"}
+record
+: A tool tracked in the {{< var validmind.platform >}} inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.
+::::
+
+
diff --git a/site/about/glossary/key_concepts/_report.qmd b/site/about/glossary/key_concepts/_report.qmd
index 42157729e9..c5bf7b6960 100644
--- a/site/about/glossary/key_concepts/_report.qmd
+++ b/site/about/glossary/key_concepts/_report.qmd
@@ -5,4 +5,7 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 validation report
 : A formal document produced after a model validation process, outlining the artifacts, assessments, and recommendations related to a specific model's performance, appropriateness, and limitations. Provides a comprehensive review of the model's conceptual framework, data sources and integrity, calibration methods, and performance outcomes. 
 
-Within model risk management, the validation report is crucial for ensuring transparency, demonstrating regulatory compliance, and offering actionable insights for model refinement or adjustments.
\ No newline at end of file
+:::: {.content-visible when-format="html" when-meta="includes.glossary"}
+Within model risk management, the validation report is crucial for ensuring transparency, demonstrating regulatory compliance, and offering actionable insights for model refinement or adjustments.
+
+::::
\ No newline at end of file
diff --git a/site/about/glossary/key_concepts/_template.qmd b/site/about/glossary/key_concepts/_template.qmd
index 6a47859219..7c035e586b 100644
--- a/site/about/glossary/key_concepts/_template.qmd
+++ b/site/about/glossary/key_concepts/_template.qmd
@@ -10,16 +10,18 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 :::: {.content-visible when-format="html" when-meta="includes.glossary"}
 document template
-: Lays out the structure of model documents, segmented into various sections and sub-sections, and function as test suites to help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default {{< var vm.product >}} document types[^default-documents] as well as custom document types.
+: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite to help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default {{< var vm.product >}} document types[^default-documents] as well as custom document types.
 
-<span id="documentation-template">documentation template^[**Refer also to:** [Model documentation](/about/glossary/glossary.qmd#model-documentation)]
-: A default {{< var vm.product >}} document type that serves as a standardized framework for developing and documenting models, including sections designated for model details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across model documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.
+<span id="documentation-template">documentation template</span>^[**Refer also to:** [documentation](/about/glossary/glossary.qmd#documentation)]
+: A default {{< var vm.product >}} document template that serves as a standardized framework for developing and documenting records (such as models), including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.
 
-<span id="validation-report-template">validation report template^[**Refer also to:** [Validation reports](/about/glossary/glossary.qmd#validation-reports)]
-: A default {{< var vm.product >}} document type that serves as a standardized framework for conducting and documenting model validation, including sections designated for attaching test results, evidence, or artifacts (findings). By outlining required documentation, recommended analyses, and expected validation tests, validation report templates ensure consistency and completeness across validation reports and help guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.
+{{< var vm.product >}} documentation templates function as test suites by defining the structure of your documentation, specifying the tests that should be run, and determining how the results should be displayed.
 
-<span id="monitoring-template">monitoring template, monitoring report template^[**Refer also to:** [Ongoing monitoring](/about/glossary/glossary.qmd#ongoing-monitoring)]
-: A default {{< var vm.product >}} document type that serves as a standardized framework for ongoing model monitoring, including sections designated for test results, performance metrics, and drift analyses. By outlining required monitoring checks and expected routine tests, monitoring templates ensure consistency and completeness across monitoring reports and help guide model owners through a systematic monitoring process while promoting early detection of model performance degradation.
+<span id="validation-report-template">validation report template</span>^[**Refer also to:** [validation reports](/about/glossary/glossary.qmd#validation-reports)]
+: A default {{< var vm.product >}} document template that serves as a standardized framework for conducting and documenting validation, including sections designated for attaching test results, evidence, or artifacts (findings). By outlining required documentation, recommended analyses, and expected validation tests, validation report templates ensure consistency and completeness across validation reports and help guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.
+
+<span id="monitoring-template">monitoring template, monitoring report template</span>^[**Refer also to:** [ongoing monitoring](/about/glossary/glossary.qmd#ongoing-monitoring)]
+: A default {{< var vm.product >}} document template that serves as a standardized framework for ongoing monitoring, including sections designated for test results, performance metrics, and drift analyses. By outlining required monitoring checks and expected routine tests, monitoring templates ensure consistency and completeness across monitoring reports and help guide owners through a systematic monitoring process while promoting early detection of performance degradation.
 
 ::::
 
@@ -31,16 +33,16 @@ document template
 
 :::: {.content-visible when-format="html" unless-meta="includes.glossary"}
 document template
-: Lays out the structure of model documents, segmented into various sections and sub-sections, and function as test suites to help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default {{< var vm.product >}} document types as well as custom document types.
+: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite to help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default {{< var vm.product >}} document types as well as custom document types.
 
-<span id="documentation-template">documentation template
-: A default {{< var vm.product >}} document type that serves as a standardized framework for developing and documenting models, including sections designated for model details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across model documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.
+documentation template
+: A default {{< var vm.product >}} document type that serves as a standardized framework for developing and documenting records (such as models), including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.
 
-<span id="validation-report-template">validation report template
-: A default {{< var vm.product >}} document type that serves as a standardized framework for conducting and documenting model validation, including sections designated for attaching test results, evidence, or artifacts (findings). By outlining required documentation, recommended analyses, and expected validation tests, validation report templates ensure consistency and completeness across validation reports and help guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.
+validation report template
+: A default {{< var vm.product >}} document type that serves as a standardized framework for conducting and documenting validation, including sections designated for attaching test results, evidence, or artifacts (findings). By outlining required documentation, recommended analyses, and expected validation tests, validation report templates ensure consistency and completeness across validation reports and help guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.
 
-<span id="monitoring-template">monitoring template, monitoring report template
-: A default {{< var vm.product >}} document type that serves as a standardized framework for ongoing model monitoring, including sections designated for test results, performance metrics, and drift analyses. By outlining required monitoring checks and expected routine tests, monitoring templates ensure consistency and completeness across monitoring reports and help guide model owners through a systematic monitoring process while promoting early detection of model performance degradation.
+monitoring template, monitoring report template
+: A default {{< var vm.product >}} document type that serves as a standardized framework for ongoing monitoring, including sections designated for test results, performance metrics, and drift analyses. By outlining required monitoring checks and expected routine tests, monitoring templates ensure consistency and completeness across monitoring reports and help guide owners through a systematic monitoring process while promoting early detection of performance degradation.
 
 ::::
 
diff --git a/site/about/glossary/key_concepts/_test-suite.qmd b/site/about/glossary/key_concepts/_test-suite.qmd
index b1d2289365..59024193bc 100644
--- a/site/about/glossary/key_concepts/_test-suite.qmd
+++ b/site/about/glossary/key_concepts/_test-suite.qmd
@@ -2,7 +2,13 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-test suite
-: A collection of tests which are run together to generate model documentation end-to-end for specific use cases. 
+:::: {.content-visible when-format="html" when-meta="includes.glossary"}
+
+<span id="test-suite">test suite</span>
+: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases.^[**Learn more:** [test_suites](/validmind/validmind/test_suites.qmd)]
+::::
 
-For example, the [`classifier_full_suite`](/validmind/validmind/test_suites/classifier.qmd#classifierfullsuite){target="_blank"} test suite runs tests from the [`tabular_dataset`](/validmind/validmind/test_suites/tabular_datasets.qmd){target="_blank"} and [`classifier`](/validmind/validmind/test_suites/classifier.qmd){target="_blank"} test suites to fully document the data and model sections for binary classification model use cases.
\ No newline at end of file
+:::: {.content-visible when-format="html" unless-meta="includes.glossary"}
+test suite
+: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [test_suites](/validmind/validmind/test_suites.qmd))
+::::
\ No newline at end of file
diff --git a/site/about/glossary/key_concepts/_test.qmd b/site/about/glossary/key_concepts/_test.qmd
index 6708c16a77..c4ead6e4b3 100644
--- a/site/about/glossary/key_concepts/_test.qmd
+++ b/site/about/glossary/key_concepts/_test.qmd
@@ -2,7 +2,7 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-test
-: A function contained in the {{< var vm.developer >}}, designed to run a specific quantitative test on the dataset or model. Test results are sent to the {{< var validmind.platform >}} to generate the model documentation according to the template that is associated with the documentation.
+<span id="tests">test</span>
+: A function contained in the {{< var vm.developer >}}, designed to run a specific quantitative test on the dataset or record (such as a model). Test results are logged to the {{< var validmind.platform >}}, where they are attached to documents.
 
-Tests are the building blocks of {{< var vm.product >}}, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.
\ No newline at end of file
+Tests are the building blocks of {{< var vm.product >}}, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.
\ No newline at end of file
diff --git a/site/about/glossary/model_documentation/_conceptual-soundness.qmd b/site/about/glossary/model_documentation/_conceptual-soundness.qmd
deleted file mode 100644
index b173ee9f63..0000000000
--- a/site/about/glossary/model_documentation/_conceptual-soundness.qmd
+++ /dev/null
@@ -1,6 +0,0 @@
-<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-Refer to the LICENSE file in the root of this repository for details.
-SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
-
-conceptual soundness
-: Establishes the foundation of a selected record such as a model, covering the overview, intended use and business use case, regulatory requirements, limitations, and the rationale behind selection. It emphasizes purpose, scope, and constraints, which are crucial for stakeholders to understand applicability and limitations.
diff --git a/site/about/glossary/model_documentation/_monitoring-governance.qmd b/site/about/glossary/model_documentation/_monitoring-governance.qmd
deleted file mode 100644
index 9d6426d097..0000000000
--- a/site/about/glossary/model_documentation/_monitoring-governance.qmd
+++ /dev/null
@@ -1,6 +0,0 @@
-<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-Refer to the LICENSE file in the root of this repository for details.
-SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
-
-monitoring and governance
-: Focuses on the record such as a model’s ongoing monitoring plan, implementation, and governance plan. It outlines strategies for maintaining the performance over time and ensuring that it remains compliant with regulatory requirements and ethical standards.
\ No newline at end of file
diff --git a/site/about/glossary/monitoring/_backtesting.qmd b/site/about/glossary/monitoring/_backtesting.qmd
index 77a7e5cfe5..e642f0cef0 100644
--- a/site/about/glossary/monitoring/_backtesting.qmd
+++ b/site/about/glossary/monitoring/_backtesting.qmd
@@ -2,5 +2,5 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-backtesting  
-: Comparing a model's predictions against actual outcomes to verify its predictive power and reliability.
+backtesting
+: Comparing a record's predictions against actual outcomes to verify its predictive power and reliability.
diff --git a/site/about/glossary/monitoring/_compliance-and-regulatory-adherence.qmd b/site/about/glossary/monitoring/_compliance-and-regulatory-adherence.qmd
index 2f1b50ff63..a0b9e89f71 100644
--- a/site/about/glossary/monitoring/_compliance-and-regulatory-adherence.qmd
+++ b/site/about/glossary/monitoring/_compliance-and-regulatory-adherence.qmd
@@ -3,4 +3,4 @@ Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 compliance and regulatory adherence  
-: Ensuring that the model continues to meet evolving regulatory requirements and standards.
\ No newline at end of file
+: Ensuring that the record (such as a model) continues to meet evolving regulatory requirements and standards.
\ No newline at end of file
diff --git a/site/about/glossary/monitoring/_model-drift.qmd b/site/about/glossary/monitoring/_model-drift.qmd
index 3023bc8ffc..84272e38da 100644
--- a/site/about/glossary/monitoring/_model-drift.qmd
+++ b/site/about/glossary/monitoring/_model-drift.qmd
@@ -2,5 +2,5 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-model drift  
-: Changes in data patterns, input distributions, or model behavior that may indicate a degradation in model performance over time.
+model drift, drift
+: Changes in data patterns, input distributions, or the behavior of a record (such as a model) that may indicate a degradation in performance over time.
diff --git a/site/about/glossary/monitoring/_model-performance.qmd b/site/about/glossary/monitoring/_model-performance.qmd
index 90d343f912..bf3dd4c6cb 100644
--- a/site/about/glossary/monitoring/_model-performance.qmd
+++ b/site/about/glossary/monitoring/_model-performance.qmd
@@ -2,5 +2,5 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-model performance
-: The measure of a model's accuracy, stability, and robustness in achieving its intended outcomes, which is regularly evaluated through monitoring after deployment to ensure ongoing reliability.
\ No newline at end of file
+model performance, performance
+: The measure of a record's accuracy, stability, and robustness in achieving its intended outcomes, which is regularly evaluated through monitoring after deployment to ensure ongoing reliability.
\ No newline at end of file
diff --git a/site/about/glossary/monitoring/_ongoing-monitoring.qmd b/site/about/glossary/monitoring/_ongoing-monitoring.qmd
index 818f5ac5f9..da04e6c99d 100644
--- a/site/about/glossary/monitoring/_ongoing-monitoring.qmd
+++ b/site/about/glossary/monitoring/_ongoing-monitoring.qmd
@@ -2,5 +2,5 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-ongoing monitoring
-: A periodic report assessing the tool such as a model's performance and compliance over time, ensuring it remains valid under changing conditions.
\ No newline at end of file
+ongoing monitoring, ongoing monitoring report, ongoing monitoring plan, monitoring plan
+: A comprehensive and structured periodic report assessing the record's performance and compliance over time, ensuring it remains valid under changing conditions. Monitoring includes key elements such as data sources, inputs, performance metrics, and periodic evaluations, ensuring transparency and visibility of the record's performance in the production environment.
\ No newline at end of file
diff --git a/site/about/glossary/monitoring/_recalibrating-models.qmd b/site/about/glossary/monitoring/_recalibrating-models.qmd
index 252a8ac653..9c1f2285d9 100644
--- a/site/about/glossary/monitoring/_recalibrating-models.qmd
+++ b/site/about/glossary/monitoring/_recalibrating-models.qmd
@@ -2,5 +2,5 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-recalibrating models  
-: The process of adjusting a model to account for detected drift or changes in the underlying data or environment.
+recalibrating models, recalibrating
+: The process of adjusting a record (such as a model) to account for detected drift or changes in the underlying data or environment.
diff --git a/site/about/glossary/monitoring/_reporting-and-governance.qmd b/site/about/glossary/monitoring/_reporting-and-governance.qmd
index e0908f6ce2..d0152b7056 100644
--- a/site/about/glossary/monitoring/_reporting-and-governance.qmd
+++ b/site/about/glossary/monitoring/_reporting-and-governance.qmd
@@ -2,5 +2,5 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-reporting and governance  
+reporting and governance 
 : The documentation of monitoring artifacts and communication to stakeholders to support decision-making and maintain transparency.
diff --git a/site/about/glossary/validation_reports/_artifacts.qmd b/site/about/glossary/validation_reports/_artifacts.qmd
index fc3c7cfe8b..5f27365aef 100644
--- a/site/about/glossary/validation_reports/_artifacts.qmd
+++ b/site/about/glossary/validation_reports/_artifacts.qmd
@@ -3,4 +3,4 @@ Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 artifacts (previously findings)
-: Observations or issues identified during validation, including any deviations from expected performance or standards. Artifacts are organized by type — default types include Validation Issue, Policy Exception, and Limitation. Custom artifact types such as Change Management Record can be created to track other categories relevant to your organization.
\ No newline at end of file
+: Observations or issues identified during validation, including any deviations from expected performance or standards. Artifacts are organized by type — default types provided by {{< var vm.product >}} include Validation Issue, Policy Exception, and Limitation. Custom artifact types can be created to track other categories relevant to your organization.
\ No newline at end of file
diff --git a/site/about/glossary/validation_reports/_report-intro.qmd b/site/about/glossary/validation_reports/_report-intro.qmd
index ed19217e3a..3525a01e55 100644
--- a/site/about/glossary/validation_reports/_report-intro.qmd
+++ b/site/about/glossary/validation_reports/_report-intro.qmd
@@ -2,4 +2,4 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-A validation report is a comprehensive review that evaluates a record's accuracy, performance, and suitability for its intended purpose. It encompasses the process of risk assessment, identifying areas of potential error or risk within the record's components, such as data inputs and algorithms. The report follows established validation guidelines to ensure consistency and adherence to internal and regulatory standards.
\ No newline at end of file
+A validation report is a comprehensive and structured review evaluating a record's accuracy, performance, and suitability for its intended purpose. A report follows established validation guidelines to ensure consistency and adherence to internal and regulatory standards. It encompasses the process of risk assessment, identifies areas of potential error or risk within the record's components, and supports transparency, regulatory compliance, and informed decision-making by documenting the validator's independent review and conclusions.
\ No newline at end of file
diff --git a/site/about/glossary/validation_reports/_risk-areas.qmd b/site/about/glossary/validation_reports/_risk-areas.qmd
index 34169742e5..323a642ca1 100644
--- a/site/about/glossary/validation_reports/_risk-areas.qmd
+++ b/site/about/glossary/validation_reports/_risk-areas.qmd
@@ -3,4 +3,4 @@ Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 model risk areas, risk areas
-: Specific components or aspects of a record such as a model where risk might be present, such as data inputs, algorithms, or implementation.
\ No newline at end of file
+: Specific components or aspects of a record (such as a model) where risk might be present, such as data inputs, algorithms, or implementation.
\ No newline at end of file
diff --git a/site/about/glossary/validation_reports/_risk-assessment.qmd b/site/about/glossary/validation_reports/_risk-assessment.qmd
index b862511921..39ec545370 100644
--- a/site/about/glossary/validation_reports/_risk-assessment.qmd
+++ b/site/about/glossary/validation_reports/_risk-assessment.qmd
@@ -3,4 +3,4 @@ Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 model risk assessment, risk assessment
-: The process of identifying and evaluating risks associated with the use and potential errors in a record such as a model.
\ No newline at end of file
+: The process of identifying and evaluating risks associated with the use and potential errors in a record (such as a model).
\ No newline at end of file
diff --git a/site/about/glossary/validation_reports/_validation-guidelines.qmd b/site/about/glossary/validation_reports/_validation-guidelines.qmd
index 77930799af..2ac7b8baf0 100644
--- a/site/about/glossary/validation_reports/_validation-guidelines.qmd
+++ b/site/about/glossary/validation_reports/_validation-guidelines.qmd
@@ -3,4 +3,4 @@ Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 validation guidelines
-: Established standards or procedures for conducting thorough and consistent validations, usually aligned with principles within specific tools such as models or AI risk frameworks.
\ No newline at end of file
+: Established standards or procedures for conducting thorough and consistent validations, usually aligned with principles within specific records (such as models) or AI risk frameworks.
\ No newline at end of file
diff --git a/site/about/library-and-platform.qmd b/site/about/library-and-platform.qmd
index 7f776107c8..ed0bcf2cf9 100644
--- a/site/about/library-and-platform.qmd
+++ b/site/about/library-and-platform.qmd
@@ -12,7 +12,7 @@ listing:
     sort: false
     fields: [title, description]
     contents:
-    - overview-model-documentation.qmd
+    - overview-documentation.qmd
     - overview-llm-features.qmd
     - deployment-options.qmd
     - system-access-requirements.qmd
@@ -24,21 +24,21 @@ listing:
 
 #### 1. {{< var validmind.developer >}}
 
-The *{{< var validmind.developer >}}* is a Python library of tools and methods designed to automate generating model documentation and running validation tests. The {{< var vm.developer >}} is designed to be platform agnostic and integrates with your existing development environment. 
+The *{{< var validmind.developer >}}* is a Python library of tools and methods designed to automate generating documentation and running validation tests. The {{< var vm.developer >}} is designed to be platform agnostic and integrates with your existing development environment.
 
    For Python developers, a single installation command provides access to all the functions:
-    
+
    ```python
    %pip install validmind
    ```
 
 #### 2. {{< var validmind.platform >}}
 
-The *{{< var validmind.platform >}}* is an easy-to-use web-based interface that enables you to track the model lifecycle:
+The *{{< var validmind.platform >}}* is an easy-to-use web-based interface that enables you to track your risk management lifecycles:
 
 - Customize workflows to adhere to and oversee your governance processes.
 - Review and edit the documentation and test metrics generated by the {{< var vm.developer >}}.
-- Collaborate with and capture feedback from model developers and model validators.
+- Collaborate with and capture feedback from developers and validators.
 - Generate validation reports and approvals.
 
 :::
diff --git a/site/about/overview-model-documentation.qmd b/site/about/overview-documentation.qmd
similarity index 63%
rename from site/about/overview-model-documentation.qmd
rename to site/about/overview-documentation.qmd
index 59e462e4aa..7954b36a9e 100644
--- a/site/about/overview-model-documentation.qmd
+++ b/site/about/overview-documentation.qmd
@@ -2,10 +2,11 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Automated model testing & documentation"
+title: "Automated testing & documentation"
 date: last-modified
 aliases:
   - /guide/overview-model-documentation.html
+  - /about/overview-model-documentation.html
 listing:
   id: quickstart
   type: grid
@@ -17,40 +18,40 @@ listing:
     - path: ../developer/validmind-library.qmd
 # INVISIBLE SPACE REQUIRED TO ENSURE THAT THE DESCRIPTION DOESN'T HAVE EXTRA PADDING DUE TO THE VARIABLE
       title: "{{< var validmind.developer >}}&#8203;"
-      description: "The {{< var validmind.developer >}} streamlines model development and validation by automating testing."
+      description: "The {{< var validmind.developer >}} streamlines development and validation by automating testing."
   fields: [title, description]
 ---
 
 
 
-The {{< var validmind.developer >}} streamlines the process of documenting various types of models. {{< var vm.product >}} automates the documentation process, ensuring that your model documentation and testing aligns with regulatory and compliance standards.
+The {{< var validmind.developer >}} streamlines the process of documenting various types of records, such as models. {{< var vm.product >}} automates the documentation process, ensuring that your documentation and testing align with regulatory and compliance standards.
 
 ::: {.attn}
 
 ## {{< fa code >}} The {{< var validmind.developer >}}
 
-The {{< var validmind.developer >}} is a Python library and documentation engine designed to streamline the process of documenting various types of models, including traditional statistical models, legacy systems, artificial intelligence/machine learning models, and large language models (LLMs). 
+The {{< var validmind.developer >}} is a Python library and documentation engine designed to streamline the process of documenting various types of records, including traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and more.
 
-It offers model developers a systematic approach to documenting and testing risk models with repeatability and consistency, ensuring alignment with regulatory and compliance standards.
+It offers developers a systematic approach to documenting and testing records with repeatability and consistency, ensuring alignment with regulatory and compliance standards.
 
 <!-- Using the variable in alt text messes up the image display  -->
 
 ![The two main components of {{< var vm.product >}}: the {{< var validmind.developer >}} that integrates with your existing developer environment, and the {{< var validmind.platform >}}](/about/deployment/validmind-architecture-overview.png){fig-alt="An image showing the two main components of ValidMind: the ValidMind Library that integrates with your existing developer environment, and the ValidMind Platform"}
 
-The {{< var validmind.developer >}} consists of a client-side library, a {{< var vm.api >}} integration for models and testing, and validation tests that streamline the model development process. Implemented as a series of independent libraries in Python and R, our {{< var vm.developer >}} ensures compatibility and flexibility with diverse sets of developer environments and requirements.
+The {{< var validmind.developer >}} consists of a client-side library, a {{< var vm.api >}} integration for records (models) and testing, and validation tests that streamline the development process. Implemented as a series of independent libraries in Python and R, our {{< var vm.developer >}} ensures compatibility and flexibility with diverse sets of developer environments and requirements.
 
 With the {{< var validmind.developer >}}, you can:
 
-- **Automate documentation** — Add comprehensive documentation as metadata while you build models to be shared with model validators, streamlining and speeding up the process.
+- **Automate documentation** — Add comprehensive documentation as metadata while you build records to be shared with validators, streamlining and speeding up the process.
 - **Run test suites** — Identify potential risks for a diverse range of statistical and AI/LLM/ML models by assessing data quality, model outcomes, robustness, and explainability.
-- **Integrate with your development environment** — Seamlessly incorporate the {{< var validmind.developer >}} into your existing model development environment, connecting to your existing model code and data sets.
-- **Upload documentation data** — Send qualitative and quantitative test data to the {{< var validmind.platform >}}[^1] to generate the model documentation for review and approval, fostering effective collaboration with model reviewers and validators.
+- **Integrate with your development environment** — Seamlessly incorporate the {{< var validmind.developer >}} into your existing development environment, connecting to your existing code and data sets.
+- **Upload documentation data** — Send qualitative and quantitative test data to the {{< var validmind.platform >}}[^1] to generate the documentation for review and approval, fostering effective collaboration with reviewers and validators.
 
 :::
 
 ## Simple installation
 
-Install the {{< var vm.developer >}} with: 
+Install the {{< var vm.developer >}} with:
 
 ```python
 %pip install validmind
@@ -64,8 +65,8 @@ Install the {{< var vm.developer >}} with:
 
 What the {{< var validmind.developer >}} offers:
 
-- Generates documentation artifacts utilizing the context of the model and dataset, the model's metadata, and the chosen documentation template.
-- Can be easily imported into your local model development environment. The supported platforms include Python and R.
+- Generates documentation artifacts utilizing the context of the record (such as a model) and dataset, the record's metadata, and the chosen documentation template.
+- Can be easily imported into your local development environment. The supported platforms include Python and R.
 - Dual-licensed — The {{< var vm.developer >}} is available as open-source under AGPL v3 license and also with a commercial software license.
 
 :::
@@ -79,18 +80,18 @@ vm.init(model="MODEL_IDENTIFIER")
 ```
 
 ```python
-vm_dataset = vm. log_dataset(
+vm_dataset = vm.log_dataset(
       df,
       "training",
       targets=targets,
 )
-vm. run_dataset_tests(df, vm_dataset=vm_dataset)
+vm.run_dataset_tests(df, vm_dataset=vm_dataset)
 ```
 
 ```python
-vm. Log_model (model)
-vm. log_training_metrics (model, x_train, y_train)
-vm. run_model_tests (model, x_test, y_test)
+vm.log_model (model)
+vm.log_training_metrics (model, x_train, y_train)
+vm.run_model_tests (model, x_test, y_test)
 ```
 
 :::
@@ -100,12 +101,12 @@ vm. run_model_tests (model, x_test, y_test)
 
 How the {{< var validmind.developer >}} works:
 
-- The tests and functions are executed automatically, following pre-configured templates tailored for specific model use cases. This ensures that minimum documentation requirements are consistently fulfilled.
+- The tests and functions are executed automatically, following pre-configured templates tailored for specific use cases. This ensures that minimum documentation requirements are consistently fulfilled.
 - The {{< var vm.developer >}} integrates with ETL/data processing pipelines using connector interfaces. This enables the extraction of relationships between raw data sources and their corresponding post-processed datasets, such as those preloaded session instances received from platforms like Spark and Snowflake.
 
 ## Extensible by design
 
-{{< var vm.product >}} supports various model types, including:[^2]
+{{< var vm.product >}} supports various record (model) types, including:[^2]
 
 - Traditional machine learning models (ML) such as tree-based models and neural network models.
 - Natural language processing models (NLP) for text analysis and understanding.
@@ -114,25 +115,25 @@ How the {{< var validmind.developer >}} works:
 
 {{< var vm.product >}} is designed to be highly extensible to cater to our customers' specific requirements. You can expand its functionality in the following ways:
 
-- You can easily add support for new models and data types by defining new classes within the {{< var validmind.developer >}}. We provide templates to guide you through this process.[^3] 
-- To include custom tests in the library, you can define new functions. We offer templates to help you create these custom tests.[^4] 
-- You have the flexibility to integrate third-party test libraries seamlessly. These libraries can be hosted either locally within your infrastructure or remotely, for example, on GitHub. Leverage additional testing capabilities and resources as needed.[^5] 
+- You can easily add support for new records and data types by defining new classes within the {{< var validmind.developer >}}. We provide templates to guide you through this process.[^3]
+- To include custom tests in the library, you can define new functions. We offer templates to help you create these custom tests.[^4]
+- You have the flexibility to integrate third-party test libraries seamlessly. These libraries can be hosted either locally within your infrastructure or remotely, for example, on GitHub. Leverage additional testing capabilities and resources as needed.[^5]
 
 ## {{< var validmind.api >}} integration
 
 {{< var vm.product >}} imports the following artifacts into the documentation via our {{< var validmind.api >}} integration:
 
-- Metadata about datasets and models, used to lookup programmatic documentation content, such as the stored definition for _common logistic regression limitations_ when a logistic regression model has been passed to the {{< var vm.product >}} test plan to be run.
-- Quality and performance metrics collected from datasets and models.
-- Output from test and test suites that have been run.
+- Metadata about datasets and records (models), used to look up programmatic documentation content, such as the stored definition for _common logistic regression limitations_ when a logistic regression model has been passed to the {{< var vm.product >}} test plan to be run.
+- Quality and performance metrics collected from datasets and records.
+- Output from tests and test suites that have been run.
 - Images, plots, visuals that were generated as part of extracting metrics and running tests.
 
 ![Artifacts imported into the documentation via our {{< var vm.api >}}](fine-print/overview-api-integration.jpg){width=90% fig-alt="A representation of artifacts imported into the documentation via our Python API"}
 
 ::: {.callout-important}
-## {{< var vm.product >}} does NOT: 
-- Send any personal identifiable information (PII) when generating documentation reports.
-- Store any customer datasets or models. 
+## {{< var vm.product >}} does NOT:
+- Send any personally identifiable information (PII) when generating documentation reports.
+- Store any customer datasets or records.
 :::
 
 ## Ready to try out {{< var vm.product >}}?
@@ -144,9 +145,9 @@ How the {{< var validmind.developer >}} works:
 
 <!-- FOOTNOTES -->
 
-[^1]: [Model risk management](overview-model-risk-management.qmd)
+[^1]: [Model risk management](use-cases/model-risk-management.qmd)
 
-[^2]: [Supported models and frameworks](/developer/supported-models-and-frameworks.qmd)
+[^2]: [Supported records and frameworks](/developer/supported-records-and-frameworks.qmd)
 
 [^3]: [Customize document templates](/guide/templates/customize-document-templates.qmd)
 
diff --git a/site/about/overview-llm-features.qmd b/site/about/overview-llm-features.qmd
index 2dc6c1d19d..202c7e1217 100644
--- a/site/about/overview-llm-features.qmd
+++ b/site/about/overview-llm-features.qmd
@@ -6,7 +6,7 @@ title: "Large language model features"
 date: last-modified
 ---
 
-{{< var vm.product >}} offers several specialized features that use large language models (LLMs) to streamline model risk management and ensure regulatory compliance. Here's how we approach these features and what you need to know.
+{{< var vm.product >}} offers several specialized features that use large language models (LLMs) to streamline risk management and ensure regulatory compliance. Here's how we approach these features and what you need to know.
 
 ::: {.attn}
 ## {{< fa list-check >}} Our philosophy
@@ -30,7 +30,7 @@ Our testing methodologies and philosophy around testing are readily available, a
 
 ## Our features
 
-{{< var vm.product >}} enhances model documentation, testing, and compliance workflows, providing your team with tools for effective model governance.
+{{< var vm.product >}} enhances documentation, testing, and compliance workflows, providing your team with tools for effective risk governance.
 
 
 ::: {.column-margin .pl3 .pt6}
@@ -54,13 +54,13 @@ Why it matters
 ::: {.w-50-ns .pl2 .pr2}
 ### Qualitative checks
 
-Leverages metadata from the model inventory, test outcomes, and additional data provided to create qualitative sections within model documentation. 
+Leverages metadata from the inventory, test outcomes, and additional data provided to create qualitative sections within documentation.
 <br>
 <br>
 
 ::: {.feature}
 Why it matters
-: Qualitative checks ensure that essential contextual information is accurately documented and aligned with the model's purpose and scope.
+: Qualitative checks ensure that essential contextual information is accurately documented and aligned with the record's purpose and scope.
 :::
 
 :::
@@ -72,7 +72,7 @@ Why it matters
 ::: {.w-50-ns .pr2}
 ### Risk assessment
 
-Using data from test results, generates a tailored risk assessment for each section of model documentation. This feature aids in identifying potential risks based on the model’s performance and results.
+Using data from test results, generates a tailored risk assessment for each section of documentation. This feature aids in identifying potential risks based on the record's performance and results.
 
 ::: {.feature}
 Why it matters
@@ -85,7 +85,7 @@ Why it matters
 ::: {.w-50-ns .pl2 .pr2}
 ### {{< var validmind.checker >}}
 
-Reviews documents such as model documentation or validation reports to ensure documents aligns with relevant regulatory requirements.
+Reviews documents, such as documentation or validation reports, to ensure they align with relevant regulatory requirements.
 <br>
 <br>
 
@@ -97,7 +97,7 @@ Why it matters
 <!-- NR Nov 2024 Uncomment when available -->
 <!-- ### Section checker
 
-Assesses each part of the model documentation for adherence to internal guidelines and policies. This tool supports consistent documentation standards across the organization, promoting uniformity in compliance practices. -->
+Assesses each part of the documentation for adherence to internal guidelines and policies. This tool supports consistent documentation standards across the organization, promoting uniformity in compliance practices. -->
 :::
 
 ::::
@@ -120,7 +120,7 @@ These documents detail our [AI usage policy](https://validmind.com/about/legal/a
 ::: {.w-50-ns .pr3}
 ### Try it yourself
 
-Discover how {{< var vm.product >}}’s LLM-powered platform, purpose-built for model risk management teams, enables streamlined and confident testing, documentation, validation, and governance of generative AI models and processes.
+Discover how {{< var vm.product >}}’s LLM-powered platform, purpose-built for risk management teams, enables streamlined and confident testing, documentation, validation, and governance of generative AI systems and processes.
 
 [Request a Demo](https://validmind.com/request-demo/){.button .button-green}
 
diff --git a/site/about/overview-model-risk-management.qmd b/site/about/overview-model-risk-management.qmd
deleted file mode 100644
index 81a6d137ed..0000000000
--- a/site/about/overview-model-risk-management.qmd
+++ /dev/null
@@ -1,226 +0,0 @@
----
-# Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-# Refer to the LICENSE file in the root of this repository for details.
-# SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Model risk management"
-date: last-modified
-aliases:
-  - /guide/overview-model-risk-management.html
-listing:
-  id: quickstart
-  type: grid
-  grid-columns: 2
-  # image-height: 100%
-  contents:
-    - path: ../get-started/get-started.qmd
-      title: "Get started"
-      description: "Our quickstarts are the quickest and easiest way to try out our product features."
-  fields: [title, description, reading-time]
----
-
-The {{< var validmind.platform >}} offers an integrated solution to manage validation reports, track artifacts, and report on model risk compliance across your model portfolio. {{< var vm.product >}} enables your organization to monitor and manage models effectively, focusing on mitigating risks, maintaining governance, and ensuring compliance throughout the entire enterprise. 
-
-::: {.attn}
-
-## {{< fa laptop-code >}} The {{< var validmind.platform >}} 
-
-The {{< var validmind.platform >}} provides a comprehensive suite of tools, guidelines, and best practices. You use {{< var vm.product >}} to review and evaluate models and model documentation to ensure they comply with organizational and regulatory requirements.
-
-<!-- Using the variable in alt text messes up the image display  -->
-
-![The two main components of {{< var vm.product >}}. The {{< var validmind.developer >}} that integrates with your existing developer environment, and the {{< var validmind.platform >}}.](overview-platform.png){width=80% fig-alt="An image showing the two main components of ValidMind. The ValidMind Library that integrates with your existing developer environment, and the ValidMind Platform."}
-
-The {{< var vm.platform >}} employs a multi-tenant architecture, hosting the cloud-based user interface, APIs, databases, and internal services. The design ensures efficient resource utilization and offers a highly scalable solution for organizations of varying sizes.
-
-With the {{< var vm.platform >}}, you can:
-
-- **Track your model inventory**[^1] — Manage the model lifecycle, track the workflow status for models, plan for upcoming validation dates, and more.
-- **Work on validation initiatives**[^2] — Collaborate with developers and validators to review documentation, add artifacts, keep track of review statuses, and generate validation reports.
-- **Configure workflows**[^3] — Set up the {{< var validmind.platform >}} to follow your existing model risk management processes, manage statuses for different parts of the workflow, and get an end-to-end view of workflows and who is involved.
-- **Use, create, or edit tests, test suites, and templates**[^4] — Create and/or configure required validation tests, test suites, and document templates for specific model use cases, tailoring it to your own specific needs.
-- **Integrate with your stack**[^5] — Import and export model documentation and validation reports.
-
-:::
-
-## Regulatory requirements
-
-{{< var vm.product >}} is designed to cater to the regulatory compliance and model risk management (MRM) requirements of financial institutions, facilitating enhanced compliance with government regulations, policies concerning MRM, and emerging legislations addressing AI model risk, including risks associated with the use of large language models (LLMs).
-
-Examples of regulations or policies include:
-
-:::: {.flex .flex-wrap .justify-around}
-
-::: {.w-75-ns}
-
-### SR 11-7: Guidance on Model Risk Management
-
-The Supervisory Guidance on model risk management issued by the Board of Governors of the Federal Reserve System and the Office of the Comptroller of the Currency in the United States in 2011. It provides comprehensive guidance to financial institutions on developing and maintaining a robust model risk management framework, covering aspects like model development, implementation, use, and validation. 
-
-:::
-
-::: {.w-20-ns .content-center}
-
-![Board of Governors Federal Reserve logo](federal-reserve.svg){width=70% fig-alt="Board of Governors Federal Reserve logo"}
-
-:::
-
-::::
-
-SR 11-7 is widely recognized and has become a benchmark in the industry for model risk management practices. 
-
-SR 11-7 outlines these core requirements: 
- 
-Model Risk Management
-: - Identify and mitigate risks associated with incorrect or inappropriate model usage, outputs, or implementation errors.
-- Encourage "effective challenge" to identify model limitations and propose necessary changes.
-- Consider materiality in model risk management based on the extent of model usage and its impact on the organization's financial condition.
-
-Model Development, Implementation, and Use
-: - Develop with a clear statement of purpose, sound design, theory, and logic.
-- Assess rigorously data quality and relevance, robust methodologies, and appropriate documentation.
-- Test to ensure accuracy, robustness, stability, and to evaluate limitations and assumptions.
-
-Model Validation
-: - Be an integral part for managing model risk, ensuring models perform as intended.
-- Identify and address potential errors or misuses.
-
-Governance, Policies, and Controls
-: - Establish a sound governance framework to oversee model risk management.
-- Implement policies and controls for appropriate use and validation of models.
-
-The regulation also mandates ongoing monitoring and periodic reviews to ensure models remain valid and effective.
-
-:::: {.flex .flex-wrap .justify-around}
-
-::: {.w-20-ns .content-center}
-
-![Bank of England logo](bank-of-england.svg){fig-alt="Bank of England logo"}
-
-:::
-
-::: {.w-75-ns}
-
-### SS1/23 – Model Risk Management Principles for Banks
-
-A policy issued by the Prudential Regulation Authority (PRA) in the UK. It encapsulates the final model risk management principles following feedback on the earlier consultation paper CP6/22. The statement provides guidelines for banks in the UK on managing model risk effectively, with particular emphasis on strategic planning and technical capabilities. 
-
-:::
-
-::::
-
-It outlines principles and amendments, like clarifications on model complexity factors, senior management function responsibilities, and inclusion of dynamic adjustments in model change management, aiming to standardize MRM practices across UK banks and foster the safe adoption of emerging technologies, such as machine learning, artificial intelligence, and large language models (LLMs). 
-
-SS1/23 outlines these core principles:
-
-Model Identification and Model Risk Classification
-: - Ensure a structured approach to accurately identify and categorize models within the model risk management (MRM) framework.
-- Facilitate the proper management and oversight of models, aiding in the alignment of model risk management efforts with organizational risks and objectives.
-
-Governance
-: - Establish a structured oversight mechanism for effective model risk management, delineating clear responsibilities and authorities.
-- Ensure accountability, transparency, and effective communication within the organization regarding model risks and controls.
-
-Model Development, Implementation, and Use
-: - Emphasize the correct development, deployment, and utilization of models as per the guidelines laid down in the MRM framework.
-- Ensure models are developed and utilized in a manner consistent with their intended purposes and within acceptable risk boundaries.
-
-Independent Model Validation
-: - Stress the importance of independent validation to ascertain model performance, accuracy, and identify potential issues.
-- Provide an objective assessment of models to ensure they are functioning as intended and to identify any potential areas of improvement or correction.
-
-Model Risk Mitigants
-: - Underline the necessity for measures to mitigate risks associated with model use, including the identification and implementation of controls.
-- Help in reducing the potential adverse impact of model risks on the organization’s financial condition, reputation, and regulatory compliance.
-
-The regulation encourages a proportionate application of these principles based on the size and complexity of the institution.
-
-### Around the globe 
-
-Other, similar guidelines and policies that {{< var vm.product >}} is designed to help you with include:
-
-:::: {.flex .flex-wrap .justify-around}
-
-::: {.w-50-ns}
-
-#### Guideline-E23: Enterprise-Wide Model Risk Management for Deposit-Taking Institutions
-
-Issued by the Office of the Superintendent of Financial Institutions (OSFI) in Canada, it outlines minimum prudent practices for model development, review, approval, use, and modification​​.
-
-:::
-
-::: {.w-40-ns}
-
-#### Principles for Model Risk Management
-
-Issued by the Financial Services Agency (FSA) in Japan in June 2021, this document was finalized after a consultation period and outlines principles for managing model risk​​​.
-
-:::
-
-::::
-
-::: {.callout title="Read more:"}
-- [SR 11-7](https://www.federalreserve.gov/supervisionreg/srletters/sr1107.htm)
-- [SS1/23](https://www.bankofengland.co.uk/prudential-regulation/publication/2023/may/model-risk-management-principles-for-banks-ss)
-- [Guideline-E23](https://www.osfi-bsif.gc.ca/Eng/fi-if/rg-ro/gdn-ort/gl-ld/Pages/e23.aspx)
-- [Principles for Model Risk Management](https://www.fsa.go.jp/common/law/ginkou/pdf_03.pdf)
-
-:::
-
-### Meeting regulatory requirements with {{< var vm.product >}}
-
- As a robust tool for implementing Model Risk Management (MRM) best practices, including the _three lines of defense_, {{< var vm.product >}} significantly aids organizations in adhering to the regulatory guidelines set forth by SR 11-7 and SS1/23. 
-
-:::: {.flex .flex-wrap .justify-around}
-
-::: {.w-40-ns}
-
-First line of defense — model developers
-: {{< var vm.product >}} offers a suite of tools for model developers, facilitating thorough documentation and rigorous testing of models, aligning with the regulatory expectations of both SR 11-7 and SS1/23, particularly for models under regulatory purview.
-
-Second line of defense — model validators
-: {{< var vm.product >}} empowers model validators with the ability to independently validate models ensuring adherence to the organization's MRM principles throughout the model lifecycle, a core requirement of these regulations.
-
-Third line of defense — auditors
-: Enabling internal and external audits provides an independent and objective assurance to the organization by assessing the robustness of controls within the model risk management framework. It evaluates how well the first and second lines of defense are functioning, ensuring adherence to regulatory and organizational standards, thereby promoting a robust model risk management environment. 
-
-Model inventory
-: The {{< var vm.product >}} **{{< fa cubes >}} Inventory** encapsulates a centralized repository for all models, aiding in streamlined tracking, management, and monitoring, simplifying compliance with the inventory mandates specified in SR 11-7 and SS1/23.
-
-:::
-
-::: {.w-50-ns}
-Lifecycle management and custom workflows
-: {{< var vm.product >}}’s capabilities extend to effective model lifecycle management through configurable workflows. This structured approach to managing model risks across various lifecycle stages significantly aids in meeting the rigorous management and oversight expectations set by SR 11-7 and SS1/23.
-
-Model documentation automation
-: By automating model documentation through configurable templates and test plans, {{< var vm.product >}} ensures consistent and accurate documentation capture, directly aligning with the documentation standards stipulated in these regulatory guidelines.
-
-Model validation and approval
-: With automated validation features and comprehensive risk assessment tools, {{< var vm.product >}} aligns with the effective validation criteria and thorough risk evaluation mandates of SR 11-7 and SS1/23.
-
-Communication and tracking
-: The built-in communication and tracking functionality of {{< var vm.product >}} facilitates seamless collaboration and understanding among stakeholders regarding model usage, limitations, and risks, fostering a collaborative environment as encouraged by these regulations.
-
-By integrating these features, {{< var vm.product >}} provides a comprehensive suite of tools that not only simplifies the path to compliance with SR 11-7 and SS1/23 but also embeds a culture of rigorous and transparent model risk management within the organization.
-
-:::
-
-::::
-
-## Ready to try out {{< var vm.product >}}?
-
-:::{#quickstart}
-:::
-
-
-<!-- FOOTNOTES -->
-
-[^1]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd)
-
-[^2]: [Preparing validation reports](/guide/validation/preparing-validation-reports.qmd)
-
-[^3]: [Setting up workflows](/guide/workflows/setting-up-workflows.qmd)
-
-[^4]: [Working with document templates](/guide/templates/working-with-document-templates.qmd)
-
-[^5]: [Export documents](/guide/reporting/export-documents.qmd)
\ No newline at end of file
diff --git a/site/about/overview.qmd b/site/about/overview.qmd
index 8b1ef72853..af7f860745 100644
--- a/site/about/overview.qmd
+++ b/site/about/overview.qmd
@@ -32,7 +32,7 @@ aliases:
   - /about.html
 ---
 
-{{< var vm.product >}} is the system of record for AI governance. You use {{< var vm.product >}} to model the full lifecycle of AI systems, models, use cases, and tools, along with their dependencies, and automates the governance and documentation you build on top.
+{{< var vm.product >}} is the system of record for AI governance. You use {{< var vm.product >}} to model the full lifecycle of AI systems, records (such as models), use cases, and tools, along with their dependencies, and to automate the governance and documentation you build on top.
 
 Flexible by design, the {{< var vm.platform >}} lets you define your own inventory hierarchy, dependencies, and governance rules, powered by {{< var vm.product >}}’s documentation automation, workflows, and analytics.
 
@@ -40,7 +40,7 @@ Flexible by design, the {{< var vm.platform >}} lets you define your own invento
 
 ::: {.column-margin}
 ::: {.image-container}
-<!-- Using the variable in alt text messes up the image display  -->
+<!-- Using the variable in alt text messes up the image display -->
 ![](/assets/img/admin-diagram.png)
 ![](/assets/img/developer-diagram.png)
 ![](/assets/img/validator-diagram.png)
@@ -56,7 +56,8 @@ Flexible by design, the {{< var vm.platform >}} lets you define your own invento
 
 ## {{< fa hand-point-right >}} Ready to try out {{< var vm.product >}}?
 
+:::{#validmind-next-steps}
 :::
 
-:::{#validmind-next-steps}
 :::
+
diff --git a/site/about/use-cases/eu-ai-act.qmd b/site/about/use-cases/eu-ai-act.qmd
index a33f793e66..02639a6180 100644
--- a/site/about/use-cases/eu-ai-act.qmd
+++ b/site/about/use-cases/eu-ai-act.qmd
@@ -28,7 +28,7 @@ The EU AI Act categorizes AI systems by risk level:
 
 ### Harmonization with other standards
 
-The EU AI Act requirements overlap with existing model risk management frameworks. Organizations already following SR 11-7, SS1/23, or E-23 can  leverage existing documentation and controls but must also comply with the EU AI Act requirements.
+The EU AI Act requirements overlap with existing model risk management frameworks. Organizations already following SR 26-2, SS1/23, or E-23 can leverage existing documentation and controls but must also comply with the EU AI Act requirements.
 
 ## 1. Risk management system implementation (Article 9)
 
@@ -230,14 +230,14 @@ Integrate all components into a complete compliance workflow addressing Articles
 
 [^3]: [Setting up workflows](/guide/workflows/setting-up-workflows.qmd)
 
-[^4]: [Install and initialize the {{< var validmind.developer >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd)
+[^4]: [Install and initialize the {{< var validmind.developer >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd)
 
  [^5]:
 [Run tests and test suites](/developer/how-to/testing-overview.qmd)
 
 [^6]: [Work with document templates](/guide/templates/working-with-document-templates.qmd)
 
-[^7]: [Test descriptions](/developer/test-descriptions.qmd)
+[^7]: [{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd)
 
 [^8]: [Work with content blocks](/guide/documentation/work-with-content-blocks.qmd)
 
diff --git a/site/about/use-cases/model-risk-management.qmd b/site/about/use-cases/model-risk-management.qmd
index cae973dca0..b5d0926c25 100644
--- a/site/about/use-cases/model-risk-management.qmd
+++ b/site/about/use-cases/model-risk-management.qmd
@@ -4,6 +4,9 @@
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
 title: "Model risk management"
 date: last-modified
+aliases:
+  - /about/overview-model-risk-management.html
+  - /guide/overview-model-risk-management.html
 listing:
   id: quickstart
   type: grid
@@ -126,19 +129,19 @@ Lifecycle
 
 {{< var vm.product >}} is designed to help organizations comply with MRM regulatory requirements:
 
-### SR 11-7 (United States)
+### SR 26-2 (United States)
 
 :::: {.columns}
 
 ::: {.column width="70%" .pr3}
 
-The Supervisory Guidance on model risk management was issued by the Board of Governors of the Federal Reserve System and the Office of the Comptroller of the Currency. It provides comprehensive guidance on designing and maintaining a robust MRM framework.
+*Interagency Guidance on Model Risk Management for Banking Organizations* was issued jointly by the Board of Governors of the Federal Reserve System, the Federal Deposit Insurance Corporation, and the Office of the Comptroller of the Currency. It supersedes SR 11-7 and sets expectations for a risk-based MRM program — including a narrowed model definition, materiality-based tiering, strong ongoing monitoring and outcomes analysis, and a comprehensive enterprise inventory.
 
 :::
 
 ::: {.column width="30%" .pl3}
 
-[SR 11-7 implementation guide](sr-11-7.qmd){.button}
+[SR 26-2 implementation guide](sr-26-2.qmd){.button}
 
 :::
 
diff --git a/site/about/use-cases/sr-11-7.qmd b/site/about/use-cases/sr-11-7.qmd
deleted file mode 100644
index ad4b573fda..0000000000
--- a/site/about/use-cases/sr-11-7.qmd
+++ /dev/null
@@ -1,226 +0,0 @@
----
-# Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-# Refer to the LICENSE file in the root of this repository for details.
-# SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "SR 11-7"
-date: last-modified
----
-
-Implement SR 11-7 compliance using {{< var vm.product >}}.
-
-{{< include _use-case-summary.qmd >}}
-
-## Overview
-
-SR 11-7 (Supervisory Guidance on Model Risk Management)[^1] provides comprehensive guidance to financial institutions on developing and maintaining a robust model risk management framework. By emphasizing the three lines of defense model and the concept of "effective challenge" — SR 11-7 ensures that models are rigorously questioned and tested.
-
-This guide is organized around the expectations for the three main areas outlined in SR 11-7:
-
-1. Model development, implementation, and use
-
-2. Model validation
-
-3. Governance, policies, and controls
-
-## 1. Model inventory setup
-
-#### Purpose
-
-Establish a comprehensive model inventory aligned to SR 11-7 requirements.
-
-### Steps
-
-1. Establish model definition criteria:
-
-   - Define what constitutes a model in your organization.
-   - Document inclusion and exclusion criteria.
-   - Classify models by type and purpose.
-
-2. Configure inventory fields:[^2]
-
-   - Set up materiality and tiering fields.
-   - Add fields for model purpose and business use.
-   - Configure risk rating classifications.
-
-3. Populate the inventory:[^3]
-
-   - Register existing models.
-   - Document model ownership and stakeholders.
-   - Track model lifecycle status.
-
-## 2. Model development documentation
-
-#### Purpose
-
-Document models according to SR 11-7 development standards.
-
-### Steps
-
-1. Configure document templates:[^4]
-
-   - Select or create templates aligned to SR 11-7.
-   - Include sections for purpose, design, theory, and logic.
-
-2. Document purpose, design, theory, and logic:[^5]
-
-   - Clearly state the model's intended use.
-   - Document the theoretical basis.
-   - Explain design choices and methodology.
-
-3. Document data quality and relevance:
-
-   - Assess and document data sources.
-   - Evaluate data quality and limitations.
-   - Document data transformations.
-
-4. Track assumptions and limitations:
-
-   - Document all model assumptions.
-   - Identify known limitations.
-   - Establish conditions under which the model should not be used.
-
-## 3. Testing and outcomes analysis
-
-#### Purpose
-
-Test models for accuracy, robustness, and stability per SR 11-7 requirements.
-
-### Steps
-
-1. Run automated testing using the {{< var validmind.developer >}}:[^6]
-
-   - Execute accuracy tests.
-   - Run robustness and stability tests.
-   - Document test results.
-
-2. Perform sensitivity analysis and benchmarking:
-
-   - Test model sensitivity to input changes.
-   - Compare against benchmarks or challenger models.
-   - Document performance boundaries.
-
-3. Evaluate limitations and assumptions:
-
-   - Test assumption validity.
-   - Identify conditions where performance degrades.
-   - Document testing coverage.
-
-## 4. Independent validation (effective challenge)
-
-#### Purpose
-
-Implement independent validation aligned to SR 11-7's "effective challenge" concept.
-
-### Steps
-
-1. Configure validation workflows:
-
-   - Set up validation initiation triggers.
-   - Define validation scope and requirements.
-   - Establish independence requirements.
-
-2. Prepare validation reports:[^7]
-
-   - Use validation report templates.
-   - Document validation activities.
-   - Summarize findings and conclusions.
-
-3. Track findings and remediation:[^8]
-
-   - Document validation findings.
-   - Assign remediation owners.
-   - Track remediation progress.
-
-## 5. Ongoing monitoring and periodic review
-
-#### Purpose
-
-Implement ongoing monitoring per SR 11-7 requirements.
-
-### Steps
-
-1. Set up monitoring workflows:[^9]
-
-   - Configure monitoring frequency.
-   - Define monitoring metrics.
-   - Establish escalation procedures.
-
-2. Configure performance tracking and alerts:
-
-   - Set up performance dashboards.
-   - Configure threshold-based alerts.
-   - Document alert response procedures.
-
-3. Schedule periodic reviews:[^10]
-
-   - Establish review frequency by model tier.
-   - Configure review reminders.
-   - Document review requirements.
-
-## 6. Governance, policies, and controls
-
-#### Purpose
-
-Establish governance framework aligned to SR 11-7.
-
-### Steps
-
-1. Configure role-based access:[^11]
-
-   - Set up roles for three lines of defense.
-   - Configure permissions by role.
-   - Ensure appropriate segregation of duties.
-
-2. Configure approval workflows:[^12]
-
-   - Set up model approval processes.
-   - Define approval authorities.
-   - Configure escalation paths.
-
-3. Enable audit trail and compliance reporting:[^12]
-
-   - Configure activity logging.
-   - Set up compliance dashboards.
-   - Generate audit reports.
-
-## Implementation checklist
-
-- [x] Model definition criteria established
-- [x] Model inventory configured and populated
-- [x] Document templates aligned to SR 11-7
-- [x] Testing framework implemented
-- [x] Validation workflows configured
-- [x] Ongoing monitoring established
-- [x] Three lines of defense roles configured
-- [x] Approval workflows in place
-- [x] Audit trail enabled
-
-
-<!-- FOOTNOTES -->
-
-[^1]:
-
-   **Board of Governors of the Federal Reserve System:**<br>
-   [SR 11-7: Guidance on Model Risk Management](https://www.federalreserve.gov/supervisionreg/srletters/sr1107.htm)
-
-[^2]: [Manage inventory fields](/guide/inventory/manage-inventory-fields.qmd)
-
-[^3]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd)
-
-[^4]: [Working with document templates](/guide/templates/working-with-document-templates.qmd)
-
-[^5]: [Working with documentation](/guide/documentation/working-with-documentation.qmd)
-
-[^6]: [Run tests and test suites](/developer/how-to/testing-overview.qmd)
-
-[^7]: [Preparing validation reports](/guide/validation/preparing-validation-reports.qmd)
-
-[^8]: [Working with artifacts](/guide/validation/working-with-artifacts.qmd)
-
-[^9]: [Ongoing monitoring](/guide/monitoring/ongoing-monitoring.qmd)
-
-[^10]: [Setting up workflows](/guide/workflows/setting-up-workflows.qmd)
-
-[^11]: [Manage permissions](/guide/configuration/manage-permissions.qmd)
-
-[^12]: [Working with analytics](/guide/reporting/working-with-analytics.qmd)
diff --git a/site/about/use-cases/sr-26-2.qmd b/site/about/use-cases/sr-26-2.qmd
new file mode 100644
index 0000000000..a37fd2e594
--- /dev/null
+++ b/site/about/use-cases/sr-26-2.qmd
@@ -0,0 +1,210 @@
+---
+# Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+# Refer to the LICENSE file in the root of this repository for details.
+# SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
+title: "SR 26-2"
+date: last-modified
+aliases:
+  - /about/use-cases/sr-11-7.html
+---
+
+Implement SR 26-2 compliance using {{< var vm.product >}}.
+
+{{< include _use-case-summary.qmd >}}
+
+## Overview
+
+SR 26-2 (*Interagency Guidance on Model Risk Management for Banking Organizations*)[^1] was issued jointly by the Board of Governors of the Federal Reserve System, the Federal Deposit Insurance Corporation, and the Office of the Comptroller of the Currency. It supersedes SR 11-7 and reframes U.S. banking agencies’ expectations for model risk management (MRM).
+
+SR 26-2 keeps core themes from prior guidance — sound development, independent validation, governance, and effective challenge — while emphasizing a risk-based posture: a narrower definition of what counts as a model, an explicit materiality framework, stronger ongoing monitoring and outcomes analysis, and an enterprise model inventory that supports concentration and dependency visibility.
+
+::: {.callout title="Generative and agentic AI"}
+SR 26-2 explicitly excludes generative AI and agentic AI from its scope because these technologies are novel and rapidly evolving. Underlying MRM principles — including materiality, ongoing monitoring, and effective challenge — still apply when you govern those systems alongside traditional models.
+:::
+
+This guide organizes platform actions around four priorities that align with SR 26-2:
+
+1. **Distinguish models from non-models** — Focus MRM on *complex quantitative methods* that apply statistical, economic, or financial theory, rather than on simple arithmetic, purely deterministic rules, or software without substantive theoretical underpinning.
+
+2. **Assess and tier models by materiality** — Use model exposure and model purpose so high-materiality models receive commensurate rigor while lower-materiality models can use more automated governance where appropriate.
+
+3. **Emphasize ongoing monitoring and outcomes analysis** — Treat continuous performance tracking, outcomes testing, and escalation as first-class obligations, not only point-in-time validation events.
+
+4. **Maintain a comprehensive model inventory** — Keep enterprise visibility into models, dependencies, concentrations, and aggregate risk.
+
+## 1. Distinguish models from non-models
+
+#### Purpose
+
+Apply a clear, documented definition of *model* versus *non-model* so MRM effort targets SR 26-2 scope.
+
+### Steps
+
+1. Document inclusion and exclusion criteria:
+
+   - Define which methods count as models under SR 26-2’s narrowed definition.
+   - Record exclusions (for example, simple spreadsheets, deterministic rules without quantitative theory) and the rationale.
+
+2. Align inventory registration rules:[^2]
+
+   - Configure inventory fields that capture model type, theoretical basis, and intended analytical use.
+   - Ensure non-models are not inadvertently treated as in-scope models.
+
+3. Review the portfolio periodically:
+
+   - Re-evaluate borderline tools when business use or complexity changes.
+   - Update documentation when classification decisions change.
+
+## 2. Assess and tier models by materiality
+
+#### Purpose
+
+Implement SR 26-2’s materiality lens — combining exposure and purpose — so controls scale with risk.
+
+### Steps
+
+1. Configure materiality and tiering fields:[^2]
+
+   - Map organizational tiers to exposure and purpose dimensions.
+   - Align tiering to validation depth, monitoring frequency, and approval paths.
+
+2. Document purpose and business use:[^3]
+
+   - Capture how each model affects decisions, capital, liquidity, or customers.
+   - Link materiality to reporting and committee oversight where required.
+
+3. Apply tier-aware workflows:[^10]
+
+   - Automate reminders and approvals based on tier.
+   - Route high-materiality models to stricter documentation and validation templates.
+
+## 3. Ongoing monitoring, testing, and outcomes analysis
+
+#### Purpose
+
+Meet SR 26-2’s heightened expectations for continuous insight into model performance and outcomes, complementing periodic validation.
+
+### Steps
+
+1. Run automated testing in the {{< var validmind.developer >}}:[^6]
+
+   - Execute accuracy, robustness, and stability tests on a defined cadence.
+   - Store results as evidence for monitoring and review.
+
+2. Configure monitoring and alerts:[^9]
+
+   - Define metrics, thresholds, and escalation paths by materiality tier.
+   - Integrate outcomes analysis (for example, performance drift, decision quality) into review cycles.
+
+3. Schedule periodic reviews with monitoring context:[^10]
+
+   - Combine monitoring dashboards, incidents, and validation history in each review.
+   - Document conclusions and required actions.
+
+## 4. Model development documentation
+
+#### Purpose
+
+Document models so development choices, data, theory, and limitations are transparent and reviewable.
+
+### Steps
+
+1. Configure document templates:[^4]
+
+   - Align sections to SR 26-2 expectations for purpose, design, theory, and logic.
+   - Tier template depth by materiality.
+
+2. Document purpose, design, theory, and logic:[^5]
+
+   - State intended use and decisions supported.
+   - Explain methodology, key assumptions, and known limitations.
+
+3. Document data quality and relevance:
+
+   - Record data sources, transformations, and quality assessments.
+   - Highlight data gaps that affect reliability.
+
+## 5. Independent validation (effective challenge)
+
+#### Purpose
+
+Preserve effective challenge for in-scope models — independent validation that identifies limitations and supports sound use.
+
+### Steps
+
+1. Configure validation workflows:
+
+   - Define independence rules and scope by materiality.
+   - Trigger validation when models change tier or materiality drivers shift.
+
+2. Prepare validation reports:[^7]
+
+   - Use templates that capture findings, limitations, and conditions of use.
+   - Tie conclusions to monitoring metrics where applicable.
+
+3. Track findings and remediation:[^8]
+
+   - Assign owners, due dates, and retest evidence.
+   - Close the loop into monitoring and inventory metadata.
+
+## 6. Governance, policies, and controls
+
+#### Purpose
+
+Operate a governance framework — policies, roles, approvals, and auditability — that matches SR 26-2’s risk-based MRM program.
+
+### Steps
+
+1. Configure role-based access:[^11]
+
+   - Map the three lines of defense to platform roles.
+   - Enforce segregation of duties for high-materiality models.
+
+2. Configure approval workflows:[^10]
+
+   - Encode model approvals, exceptions, and retirements.
+   - Maintain an audit trail for supervisory and internal review.
+
+3. Enable audit trail and compliance reporting:[^12]
+
+   - Use activity logs and analytics for evidence of control operation.
+   - Export reports for committees and audits.
+
+## Implementation checklist
+
+- [x] Model versus non-model criteria documented and reflected in the inventory
+- [x] Materiality and tiering configured with purpose and exposure fields
+- [x] Ongoing monitoring, alerts, and outcomes analysis in place
+- [x] Development documentation templates aligned to SR 26-2
+- [x] Validation workflows and effective challenge operating by tier
+- [x] Governance roles, approvals, and audit evidence configured
+
+
+<!-- FOOTNOTES -->
+
+[^1]:
+
+   **Board of Governors of the Federal Reserve System, FDIC, and OCC:**<br>
+   [SR 26-2: Interagency Guidance on Model Risk Management for Banking Organizations](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (April 17, 2026; supersedes SR 11-7)
+
+[^2]: [Manage inventory fields](/guide/inventory/manage-inventory-fields.qmd)
+
+[^3]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd)
+
+[^4]: [Working with document templates](/guide/templates/working-with-document-templates.qmd)
+
+[^5]: [Working with documentation](/guide/documentation/working-with-documentation.qmd)
+
+[^6]: [Run tests and test suites](/developer/how-to/testing-overview.qmd)
+
+[^7]: [Preparing validation reports](/guide/validation/preparing-validation-reports.qmd)
+
+[^8]: [Working with artifacts](/guide/validation/working-with-artifacts.qmd)
+
+[^9]: [Ongoing monitoring](/guide/monitoring/ongoing-monitoring.qmd)
+
+[^10]: [Setting up workflows](/guide/workflows/setting-up-workflows.qmd)
+
+[^11]: [Manage permissions](/guide/configuration/manage-permissions.qmd)
+
+[^12]: [Working with analytics](/guide/reporting/working-with-analytics.qmd)
diff --git a/site/about/contributing/using-the-documentation.qmd b/site/about/using-the-documentation.qmd
similarity index 82%
rename from site/about/contributing/using-the-documentation.qmd
rename to site/about/using-the-documentation.qmd
index 4757f97f7b..39f59870e6 100644
--- a/site/about/contributing/using-the-documentation.qmd
+++ b/site/about/using-the-documentation.qmd
@@ -4,9 +4,11 @@
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
 title: "Using the documentation"
 date: last-modified
+aliases:
+  - /about/contributing/using-the-documentation.html
 ---
 
-This documentation site helps you learn {{< var vm.product >}}, implement it in your organization, govern your AI/ML models, and operate the platform day to day.
+This documentation site helps you learn {{< var vm.product >}}, implement it in your organization, govern your AI/ML records (models), and operate the platform day to day.
 
 ## How to use this site
 
@@ -25,7 +27,7 @@ Introduces the platform, its use cases, and deployment options.
 
 - [About {{< var vm.product >}}](/about/overview.qmd) — Platform overview and capabilities
 - [AI governance](/about/use-cases/ai-governance.qmd) — EU AI Act compliance and risk classification
-- [Model risk management](/about/use-cases/model-risk-management.qmd) — SR 11-7, SS1/23, and E-23 compliance
+- [Model risk management](/about/use-cases/model-risk-management.qmd) — SR 26-2, SS1/23, and E-23 compliance
 - [Library and platform](/about/library-and-platform.qmd) — How the {{< var validmind.developer >}} and {{< var validmind.platform >}} work together
 - [Deployment options](/about/deployment/deployment-options.qmd) — Multi-tenant cloud vs. Virtual Private {{< var vm.product >}}
 
@@ -35,7 +37,7 @@ Introduces the platform, its use cases, and deployment options.
 
 Role-based quickstarts to help you begin using {{< var vm.product >}} quickly.
 
-- [Developer quickstart](/get-started/developer/quickstart-developer.qmd) — Set up your environment and document your first model
+- [Developer quickstart](/get-started/developer/quickstart-developer.qmd) — Set up your environment and document your first record (model)
 - [Validator quickstart](/get-started/validator/quickstart-validator.qmd) — Review documentation and prepare validation reports
 - [Administrator quickstart](/get-started/administrator/quickstart-administrator.qmd) — Configure users, roles, and organization settings
 
@@ -49,14 +51,14 @@ Step-by-step instructions for platform tasks, organized by feature area.
 |---------|--------|---------------|
 | [Access](/guide/guides.qmd#access) | Signing up for and logging into {{< var vm.product >}} | Register, sign in via SSO, recover access |
 | [Configuration](/guide/guides.qmd#configuration) | Setting up your organization and users | Add users, create groups, assign roles and permissions |
-| [Integrations](/guide/integrations/managing-integrations.qmd) | Connecting {{< var vm.product >}} to external systems | Manage secrets, configure connections, link external models |
-| [Workflows](/guide/guides.qmd#workflows) | Automating model lifecycle processes | Configure workflow steps, manage transitions, set up approvals |
-| [Inventory](/guide/guides.qmd#inventory) | Managing your model and record inventory | Register records, edit fields, configure interdependencies |
+| [Integrations](/guide/integrations/managing-integrations.qmd) | Connecting {{< var vm.product >}} to external systems | Manage secrets, configure connections, link external records (models) |
+| [Workflows](/guide/guides.qmd#workflows) | Automating lifecycle processes | Configure workflow steps, manage transitions, set up approvals |
+| [Inventory](/guide/guides.qmd#inventory) | Managing your inventory of records (such as models) | Register records, edit fields, configure interdependencies |
 | [Documents & templates](/guide/templates/working-with-documents.qmd) | Creating and customizing documentation | Manage document types, customize templates, use the text block library |
-| [Model documentation](/guide/guides.qmd#model-documentation) | Authoring and collaborating on model docs | Edit content blocks, add test results, manage versions, submit for approval |
-| [Model validation](/guide/guides.qmd#model-validation) | Reviewing and validating models | Review documentation, assess compliance, manage findings and artifacts |
+| [Documentation](/guide/guides.qmd#documentation) | Authoring and collaborating on documents | Edit content blocks, add test results, manage versions, submit for approval |
+| [Validation](/guide/guides.qmd#validation) | Reviewing and validating records (models) | Review documentation, assess compliance, manage findings and artifacts |
 | [Reporting](/guide/guides.qmd#reporting) | Analyzing and exporting data | View reports, create custom analytics, export inventory and documents |
-| [Monitoring](/guide/guides.qmd#monitoring) | Tracking model performance over time | Enable monitoring, review results, set thresholds and alerts |
+| [Monitoring](/guide/guides.qmd#monitoring) | Tracking record (model) performance over time | Enable monitoring, review results, set thresholds and alerts |
 | [Attestation](/guide/guides.qmd#attestation) | Managing formal attestations | Create, submit, review, and approve attestations |
 
 ### [{{< var validmind.developer >}}](/developer/validmind-library.qmd)
@@ -65,7 +67,7 @@ Resources for developers integrating {{< var vm.product >}} into their workflows
 
 - [{{< var validmind.developer >}}](/developer/validmind-library.qmd) — Python library overview and installation
 - [Code samples](/developer/samples-jupyter-notebooks.qmd) — Jupyter notebooks for common use cases
-- [Test descriptions](/developer/test-descriptions.qmd) — Reference for available validation tests
+- [{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd) — Reference for available validation tests
 - [{{< var validmind.api >}}](/validmind/validmind.qmd) — Python API documentation
 - [Public REST API](/reference/validmind-rest-api-vm.qmd) — REST API for platform integrations
 
diff --git a/site/about/contributing/validmind-chatbot.png b/site/about/validmind-chatbot.png
similarity index 100%
rename from site/about/contributing/validmind-chatbot.png
rename to site/about/validmind-chatbot.png
diff --git a/site/developer/_sidebar.yaml b/site/developer/_sidebar.yaml
index a9d08ebe6c..399bd86069 100644
--- a/site/developer/_sidebar.yaml
+++ b/site/developer/_sidebar.yaml
@@ -10,44 +10,45 @@ website:
         # USING THE VARIABLE IN THE LINK TEXT MESSES UP THE MOBILE VIEW
         - text: "ValidMind Library"
           file: developer/validmind-library.qmd
-        - developer/supported-models-and-frameworks.qmd
+        - developer/supported-records-and-frameworks.qmd
         - text: "---"
         - text: "Quickstart"
-        - notebooks/quickstart/quickstart_model_documentation.ipynb
-        - notebooks/quickstart/quickstart_model_validation.ipynb
+        - notebooks/quickstart/quickstart_documentation.ipynb
+        - notebooks/quickstart/quickstart_validation.ipynb
         # USING THE VARIABLE IN THE LINK TEXT MESSES UP THE MOBILE VIEW & BREADCRUMB
         - section: "Install and initialize ValidMind"
           contents:
             - text: "Install and initialize the library"
-              file: developer/model-documentation/install-and-initialize-validmind-library.qmd
+              file: developer/quickstart/install-and-initialize-validmind-library.qmd
             - text: "Install and initialize the library for R"
-              file: developer/model-documentation/install-and-initialize-validmind-for-r.qmd
+              file: developer/quickstart/install-and-initialize-validmind-for-r.qmd
             - text: "Use an HTTP proxy with the library"
-              file: developer/model-documentation/use-http-proxy-with-validmind-library.qmd
-        - developer/model-documentation/store-credentials-in-env-file.qmd
+              file: developer/quickstart/use-http-proxy-with-validmind-library.qmd
+        - text: "Store credentials in `.env` files"
+          file: developer/quickstart/store-credentials-in-env-file.qmd
         - text: "---"
         - text: "End-to-End Tutorials"
         # USING THE VARIABLE IN THE LINK TEXT MESSES UP THE MOBILE VIEW & BREADCRUMB
-        - section: "Model development"
+        - section: "Development"
           contents:
             - text: "1 — Set up ValidMind Library"
-              file: notebooks/tutorials/model_development/1-set_up_validmind.ipynb
-            - text: "2 — Start model development process"
-              file: notebooks/tutorials/model_development/2-start_development_process.ipynb
+              file: notebooks/tutorials/development/1-set_up_validmind.ipynb
+            - text: "2 — Start the development process"
+              file: notebooks/tutorials/development/2-start_development_process.ipynb
             - text: "3 — Integrate custom tests"
-              file: notebooks/tutorials/model_development/3-integrate_custom_tests.ipynb
+              file: notebooks/tutorials/development/3-integrate_custom_tests.ipynb
             - text: "4 — Finalize testing & documentation"
-              file: notebooks/tutorials/model_development/4-finalize_testing_documentation.ipynb
-        - section: "Model validation"
+              file: notebooks/tutorials/development/4-finalize_testing_documentation.ipynb
+        - section: "Validation"
           contents:
             - text: "1 — Set up ValidMind Library for validation"
-              file: notebooks/tutorials/model_validation/1-set_up_validmind_for_validation.ipynb
-            - text: "2 —\u00A0Start model validation process"
-              file: notebooks/tutorials/model_validation/2-start_validation_process.ipynb
-            - text: "3 — Developing a challenger model"
-              file: notebooks/tutorials/model_validation/3-developing_challenger_model.ipynb
+              file: notebooks/tutorials/validation/1-set_up_validmind_for_validation.ipynb
+            - text: "2 — Start the validation process"
+              file: notebooks/tutorials/validation/2-start_validation_process.ipynb
+            - text: "3 — Developing a challenger"
+              file: notebooks/tutorials/validation/3-developing_potential_challenger.ipynb
             - text: "4 — Finalize validation & reporting"
-              file: notebooks/tutorials/model_validation/4-finalize_validation_reporting.ipynb
+              file: notebooks/tutorials/validation/4-finalize_validation_reporting.ipynb
         - text: "---"
         - text: "How-To"
         - text: "Run tests & test suites"
@@ -57,11 +58,10 @@ website:
               contents:
                 - notebooks/how_to/tests/explore_tests/explore_tests.ipynb
                 - notebooks/how_to/tests/explore_tests/explore_test_suites.ipynb
-                - developer/how-to/test-sandbox.qmd
             - section: "Run tests"
               contents:
-                - notebooks/how_to/tests/run_tests/1_run_dataset_based_tests.ipynb
-                - notebooks/how_to/tests/run_tests/2_run_comparison_tests.ipynb
+                - notebooks/how_to/tests/run_tests/1-run_dataset-based_tests.ipynb
+                - notebooks/how_to/tests/run_tests/2-run_comparison_tests.ipynb
                 - section: "Configuring tests"
                   contents: "notebooks/how_to/tests/run_tests/configure_tests/*.ipynb"
                 - section: "Using tests in documentation"
@@ -97,8 +97,6 @@ website:
               contents: "notebooks/use_cases/code_explainer/**/*.ipynb"
             - section: "Credit risk"
               contents: "notebooks/use_cases/credit_risk/**/*.ipynb"
-            - section: "Model validation"
-              contents: "notebooks/use_cases/model_validation/**/*.ipynb"
             - section: "NLP and LLM"
               contents: "notebooks/use_cases/nlp_and_llm/**/*.ipynb"
             - section: "Ongoing monitoring"
@@ -107,11 +105,12 @@ website:
               contents: "notebooks/use_cases/regression/**/*.ipynb"
             - section: "Time series"
               contents: "notebooks/use_cases/time_series/**/*.ipynb"
+            - section: "Validation"
+              contents: "notebooks/use_cases/validation/**/*.ipynb"
         - text: "---"
         - text: "Reference"
-        - text: "Test descriptions"
-          file: developer/test-descriptions.qmd
-          contents: tests/**
+        - text: "{{< var vm.product >}} test sandbox"
+          file: developer/how-to/test-sandbox.qmd
         - text: "{{< var validmind.api >}}"
           file: validmind/validmind.qmd
         # USING THE VARIABLE IN THE LINK TEXT MESSES UP THE MOBILE VIEW & BREADCRUMB
diff --git a/site/developer/how-to/test-sandbox.qmd b/site/developer/how-to/test-sandbox.qmd
index c9ea3a23c3..5eedac7292 100644
--- a/site/developer/how-to/test-sandbox.qmd
+++ b/site/developer/how-to/test-sandbox.qmd
@@ -2,19 +2,40 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Test sandbox <sup>[beta]{.smallcaps}</sup>"
-date: last-modified
+pagetitle: "{{< var vm.product >}} test sandbox"
+title-block-style: none
+bread-crumbs: false
+page-layout: full
 aliases:
   - /guide/test-sandbox.html
   - /developer/model-testing/test-sandbox.html
+  - /developer/test-descriptions.html
+  - /guide/test-descriptions.html
+  - /developer/model-testing/test-descriptions.html
 ---
 
-<!--- TO DO
-- Ordering of notebooks if we want them to appear in a specific sequence
---->
-Explore our interactive sandbox to see what tests are available in the {{< var validmind.developer >}} and how you can use them in your own code.
+```{=html}
+<style>
+  /* Close the gap between the pink banner and the test-sandbox iframe */
+  #title-block-header { display: none !important; }
+  #quarto-document-content { padding-top: 0 !important; margin-top: 0 !important; }
+  #quarto-document-content > .column-screen:first-child { margin-top: 0 !important; }
+  #quarto-document-content > .column-screen iframe { display: block; }
+
+  /* Hide the secondary-nav toggle bar only on desktop;
+     keep it on mobile/tablet so the sidebar remains reachable. */
+  @media (min-width: 992px) {
+    .quarto-secondary-nav { display: none !important; }
+  }
+
+  /* Quarto sidebar scroll-visibility strip under the navbar (this page only) */
+  #quarto-sidebarnav-toggle {
+    display: none !important;
+  }
+</style>
+```
 
-::: {.column-screen-right}
+::: {.column-screen}
 
 ```{=html}
 <iframe
diff --git a/site/developer/how-to/testing-overview.qmd b/site/developer/how-to/testing-overview.qmd
index 7d1511f138..129c428de9 100644
--- a/site/developer/how-to/testing-overview.qmd
+++ b/site/developer/how-to/testing-overview.qmd
@@ -24,8 +24,9 @@ listing:
     sort: false
     fields: [title, description]
     contents:
-    - test-sandbox.qmd
-    - ../test-descriptions.qmd
+    - title: "{{< var vm.product >}} test sandbox"
+      description: "Tests that are available as part of the {{< var validmind.developer >}}, grouped by type of validation or monitoring test."
+      path: test-sandbox.qmd
   - id: test-basics
     type: grid
     grid-columns: 2
@@ -33,8 +34,8 @@ listing:
     sort: false
     fields: [title, description]
     contents:
-    - ../../notebooks/how_to/tests/run_tests/1_run_dataset_based_tests.ipynb
-    - ../../notebooks/how_to/tests/run_tests/2_run_comparison_tests.ipynb
+    - ../../notebooks/how_to/tests/run_tests/1-run_dataset-based_tests.ipynb
+    - ../../notebooks/how_to/tests/run_tests/2-run_comparison_tests.ipynb
   - id: configure-tests
     type: grid
     grid-columns: 2
@@ -71,7 +72,7 @@ listing:
     - ../samples-jupyter-notebooks.qmd
 ---
 
-{{< var vm.product >}} provides many built-in tests and test suites, which help you produce documentation during stages of the model lifecycle, where you need to ensure that your work satisfies regulatory and risk management requirements.
+{{< var vm.product >}} provides many built-in tests and test suites, which help you produce documentation during stages of your risk management lifecycle, where you need to ensure that your work satisfies regulatory and risk management requirements.
 
 ::: {.callout-important collapse="false" appearance="minimal"}
 ## Quick reference
@@ -89,10 +90,10 @@ listing:
 : When running the same test multiple times with different parameters, add a `:suffix` to distinguish results, such as `validmind.data_validation.ClassImbalance:custom_threshold`.
 
 **Inputs**
-: The datasets and models your test analyzes. Pass these via `inputs={}`:
+: The datasets and records (models) your test analyzes. Pass these via `inputs={}`:
 
     - `dataset` — A VM dataset object
-    - `model` — A VM model object
+    - `model` — A VM model object, which can be any type of record
     - `datasets` / `models` — For tests comparing multiple datasets or models
 
 **Parameters**
@@ -100,9 +101,7 @@ listing:
 
     - Thresholds, such as `min_percent_threshold`, `disparity_tolerance`
     - Metrics to compute, such as `metrics=["fnr", "fpr", "tpr"]`
-    - Any setting that isn't a dataset or model
-
-Use `vm.tests.describe_test("test_id")` or check the [test descriptions](/developer/test-descriptions.qmd) page to see what parameters a test accepts.
+    - Any setting that isn't a dataset or model[^1]
 
 **Outputs**
 : Tests return results like tables and plots. Tables can be lists of dictionaries or pandas DataFrames; plots can be matplotlib or plotly figures.
@@ -118,10 +117,10 @@ Use `vm.tests.describe_test("test_id")` or check the [test descriptions](/develo
 : Test suites are collections of tests that run together. Each has an identifier like `classifier_full_suite`. Use `vm.tests.list_test_suites()` to browse available test suites.
 
 **Inputs**
-: The datasets and models the test suite analyzes. Pass these via `inputs={}`:
+: The datasets and records (models) the test suite analyzes. Pass these via `inputs={}`:
 
     - `dataset` — A VM dataset object
-    - `model` — A VM model object
+    - `model` — A VM model object, which can be any type of record
     - `datasets` / `models` — For suites comparing multiple datasets or models
 
 **Config**
@@ -139,7 +138,7 @@ Use `vm.tests.describe_test("test_id")` or check the [test descriptions](/develo
 
 ## Explore tests
 
-Start by exploring the {{< var validmind.developer >}}'s available tests and tests suites:
+Start by exploring the {{< var validmind.developer >}}'s available tests and test suites:
 
 ::: {.panel-tabset}
 
@@ -168,9 +167,9 @@ To document and validate your dataset:
 - For generic tabular datasets: use the [`tabular_dataset`](/validmind/validmind/test_suites/tabular_datasets.qmd){target="_blank"} test suite.
 - For time-series datasets: use the [`time_series_dataset`](/validmind/validmind/test_suites/time_series.qmd#timeseriesdataset){target="_blank"} test suite.
 
-### Model testing
+### Record (model) testing
 
-To document and validate your model:
+To document and validate your record:
 
 - For binary classification models: use the [`classifier`](/validmind/validmind/test_suites/classifier.qmd){target="_blank"} test suite.
 - For time series models: use the [`timeseries`](/validmind/validmind/test_suites/time_series.qmd){target="_blank"} test suite.
@@ -186,7 +185,7 @@ Use the [`classifier_full_suite`](/validmind/validmind/test_suites/classifier.qm
 
 ## Run tests
 
-Next, learn how to use the {{< var validmind.developer >}} to run tests on datasets and models:
+Next, learn how to use the {{< var validmind.developer >}} to run tests on datasets and records (models):
 
 ::: {.panel-tabset}
 
@@ -232,3 +231,7 @@ Learn more about using the other features of the {{< var validmind.developer >}}
 :::{#testing-next}
 :::
 
+<!-- FOOTNOTES -->
+
+[^1]: Use `vm.tests.describe_test("test_id")` for programmatic parameter details, or browse the [{{< var vm.product >}} test sandbox](test-sandbox.qmd).
+
diff --git a/site/developer/model-documentation/_code-snippet.qmd b/site/developer/quickstart/_code-snippet.qmd
similarity index 53%
rename from site/developer/model-documentation/_code-snippet.qmd
rename to site/developer/quickstart/_code-snippet.qmd
index b98da91b48..3ec85602e7 100644
--- a/site/developer/model-documentation/_code-snippet.qmd
+++ b/site/developer/quickstart/_code-snippet.qmd
@@ -2,4 +2,4 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-Initialize the {{< var validmind.developer >}} with the _code snippet_ unique to each model per document to connect your environment to the {{< var validmind.platform >}}, ensuring test results are uploaded to the correct model and automatically populated in the right document.
\ No newline at end of file
+Initialize the {{< var validmind.developer >}} with the _code snippet_ unique to each record (model) per document to connect your environment to the {{< var validmind.platform >}}, ensuring test results are uploaded to the correct record and automatically populated in the right document.
\ No newline at end of file
diff --git a/site/developer/model-documentation/install-and-initialize-validmind-for-r.qmd b/site/developer/quickstart/install-and-initialize-validmind-for-r.qmd
similarity index 81%
rename from site/developer/model-documentation/install-and-initialize-validmind-for-r.qmd
rename to site/developer/quickstart/install-and-initialize-validmind-for-r.qmd
index c83aa193a1..d5394b06f6 100644
--- a/site/developer/model-documentation/install-and-initialize-validmind-for-r.qmd
+++ b/site/developer/quickstart/install-and-initialize-validmind-for-r.qmd
@@ -4,6 +4,8 @@
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
 title: "Install and initialize ValidMind for R"
 date: last-modified
+aliases:
+  - /developer/model-documentation/install-and-initialize-validmind-for-r.html
 listing:
   - id: whats-next
     type: grid
@@ -13,23 +15,23 @@ listing:
     grid-columns: 2
     contents:
       - path: https://github.com/validmind/validmind-library/tree/main/notebooks/quickstart/
-        title: "Quickstart for model documentation"
-        description: "End-to-end model documentation workflow in R: load data, preprocess, train a GLM model, and run the full documentation test suite."
+        title: "Quickstart for documentation"
+        description: "End-to-end documentation workflow in R: load data, preprocess, train a GLM model, and run the full documentation test suite."
       - path: https://github.com/validmind/validmind-library/tree/main/notebooks/quickstart/
-        title: "Quickstart for model validation"
-        description: "End-to-end model validation workflow in R: load data, run data quality tests, train a champion GLM model, and run model evaluation tests."
+        title: "Quickstart for validation"
+        description: "End-to-end validation workflow in R: load data, run data quality tests, train a champion GLM model, and run model evaluation tests."
 ---
 
-Use the ValidMind R package to document and validate models built in R. The package interfaces with the {{< var validmind.developer >}} through `reticulate`, giving you access to the full Python API from R.
+Use the ValidMind R package to document and validate records (models) built in R. The package interfaces with the {{< var validmind.developer >}} through `reticulate`, giving you access to the full Python API from R.
 
 ::: {.attn}
 
 ## Prerequisites
 
 - [x] {{< var link.login >}}
-- [x] The model you want to connect to is registered in the model inventory.[^1]
-- [x] The model document has a template applied.[^2]
-- [x] You are the record owner, model validator, or another model stakeholder with write access to the model's documents.[^3]
+- [x] The record you want to connect to is registered in the inventory.[^1]
+- [x] The document you want to connect to has a template applied.[^2]
+- [x] You are the owner, validator, or another inventory record stakeholder with write access to the record's documents.[^3]
 
 :::
 
@@ -71,7 +73,7 @@ sudo dnf install R
 
 ## Install Python dependencies
 
-Install the {{< var validmind.developer >}} and `rpy2` so Python can interface with R models:
+Install the {{< var validmind.developer >}} and `rpy2` so Python can interface with records (models) built in R:
 
 ```bash
 pip install validmind rpy2
@@ -136,8 +138,8 @@ vm_r <- vm(
 
 The `document` parameter specifies which document type to associate with the session:
 
-- `"documentation"` — For model development
-- `"validation-report"` — For model validation
+- `"documentation"` — For development
+- `"validation-report"` — For validation
 
 ## Key APIs
 
diff --git a/site/developer/model-documentation/install-and-initialize-validmind-library.qmd b/site/developer/quickstart/install-and-initialize-validmind-library.qmd
similarity index 63%
rename from site/developer/model-documentation/install-and-initialize-validmind-library.qmd
rename to site/developer/quickstart/install-and-initialize-validmind-library.qmd
index da77325b88..e0eb1656f6 100644
--- a/site/developer/model-documentation/install-and-initialize-validmind-library.qmd
+++ b/site/developer/quickstart/install-and-initialize-validmind-library.qmd
@@ -10,6 +10,7 @@ aliases:
   - /guide/install-and-initialize-validmind-library.html
   - /guide/install-and-initialize-developer-framework.html
   - install-and-initialize-client-library.html
+  - /developer/model-documentation/install-and-initialize-validmind-library.html
 listing:
   - id: whats-next
     type: grid
@@ -29,12 +30,12 @@ listing:
 ## Prerequisites
 
 - [x] {{< var link.login >}}
-- [x] The model you want to connect to is registered in the model inventory.[^1]
-- [x] The model document has a template applied.[^2]
-- [x] You are the record owner, model validator, or another model stakeholder with write access to the model's documents.[^3]
+- [x] The record you want to connect to is registered in the inventory.[^1]
+- [x] The document you want to connect to has a template applied.[^2]
+- [x] You are the owner, validator, or another inventory record stakeholder with write access to the record's documents.[^3]
 
 ::: {.callout}
-The {{< var validmind.developer >}} requires access to the data sources where relevant datasets and model files are stored in order to help you run tests.
+The {{< var validmind.developer >}} requires access to the data sources where relevant datasets and record (model) files are stored in order to help you run tests.
 
 :::
 
@@ -50,25 +51,27 @@ In order to upload test results from the {{< var validmind.developer >}} to the
 | `api_host`    | The location of the {{< var vm.product >}} API  |
 | `api_key`     | The account API key                |
 | `api_secret`  | The account secret key             |
-| `document`  | The model document identifier key             |
-| `model`     | The model identifier             |
+| `document`  | The record document identifier key             |
+| `model`     | The record identifier             |
 
 ### Get your code snippet
 
-Retrieve your code snippet for your model's selected document from the {{< var validmind.platform >}}:
+Retrieve your code snippet for your record's selected document from the {{< var validmind.platform >}}:
 
 1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
-2. Select a model by clicking on it or find your model by applying a filter or searching for it.[^4]
+2. Under the [record type]{.smallcaps} drop-down, select the type of record you want to retrieve the code snippet for.[^4]
 
-3. In the left sidebar that appears for your model, click **{{< fa rocket >}} Getting Started**.
+3. Select a record by clicking on it or find your record by applying a filter or searching for it.[^5]
 
-4. Select the **[document]{.smallcaps}** you want to automatically upload test results to.[^5]
+4. In the left sidebar that appears for your record, click **{{< fa rocket >}} Getting Started**.
 
-5. Click **{{< fa regular copy >}} Copy snippet to clipboard**.
+5. Select the **[document]{.smallcaps}** you want to automatically upload test results to.[^6]
+
+6. Click **{{< fa regular copy >}} Copy snippet to clipboard**.
 
 ::: {.callout}
-## Selecting a **[document]{.smallcaps}** to connect to requires {{< var validmind.developer >}} version >=2.12.0.[^6]
+## Selecting a **[document]{.smallcaps}** to connect to requires {{< var validmind.developer >}} version >=2.12.0.[^7]
 
 A template must already be applied to your selected document to populate test results in the {{< var validmind.platform >}}. Attempting to initialize the {{< var vm.developer >}} with a document that does not have a template applied will result in an error.
 
@@ -101,13 +104,13 @@ vm.init(
 ```
 
 :::{.callout}
-To also enable monitoring, add `monitoring=True` to the `vm.init` method in your code snippet. [^7]
+To also enable monitoring, add `monitoring=True` to the `vm.init` method in your code snippet. [^8]
 :::
 
 ::: {.feature}
 #### **Automate with {{< var vm.product >}}**
 
-After you run the code snippet in your environment, the {{< var validmind.developer >}} will connect to your model and selected document in the {{< var validmind.platform >}}. Automate your workflow by using the {{< var vm.developer >}} to run tests, then seamlessly upload your test results to the {{< var vm.platform >}}.
+After you run the code snippet in your environment, the {{< var validmind.developer >}} will connect to your record and selected document in the {{< var validmind.platform >}}. Automate your workflow by using the {{< var vm.developer >}} to run tests, then seamlessly upload your test results to the {{< var vm.platform >}}.
 
 :::
 
@@ -115,7 +118,7 @@ After you run the code snippet in your environment, the {{< var validmind.develo
 
 ## Upgrade the {{< var validmind.developer >}}
 
-After installing the {{< var validmind.developer >}},[^8] you'll want to periodically make sure you are on the latest version to access any new features and other enhancements:
+After installing the {{< var validmind.developer >}},[^9] you'll want to periodically make sure you are on the latest version to access any new features and other enhancements:
 
 1. In your Jupyter Notebook or developer environment, retrieve the information for the currently installed version of the {{< var vm.developer >}}:
 
@@ -132,7 +135,7 @@ Version: 2.11.0
 ```
 :::
 
-2. If the version returned is lower than the version indicated in our production open-source code,[^9] run the following command:
+2. If the version returned is lower than the version indicated in our production open-source code,[^10] run the following command:
 
     ```python
     %pip install --upgrade validmind
@@ -152,14 +155,16 @@ Version: 2.11.0
 
 [^3]: [Manage inventory record stakeholders](/guide/inventory/edit-inventory-fields.qmd#manage-inventory-record-stakeholders)
 
-[^4]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
+[^4]: [Manage inventory record types](/guide/inventory/manage-inventory-record-types.qmd)
+
+[^5]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
 
-[^5]: [Working with documents](/guide/templates/working-with-documents.qmd)
+[^6]: [Working with documents](/guide/templates/working-with-documents.qmd)
 
-[^6]: [Upgrade the {{< var validmind.developer >}}](#upgrade-validmind)
+[^7]: [Upgrade the {{< var validmind.developer >}}](#upgrade-validmind)
 
-[^7]: [Ongoing monitoring](/guide/monitoring/ongoing-monitoring.qmd)
+[^8]: [Ongoing monitoring](/guide/monitoring/ongoing-monitoring.qmd)
 
-[^8]: [Install {{< var vm.product >}}](#install-validmind)
+[^9]: [Install {{< var vm.product >}}](#install-validmind)
 
-[^9]: **ValidMind GitHub:** [validmind-library/validmind/&lowbar;&lowbar;version&lowbar;&lowbar;.py](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py)
\ No newline at end of file
+[^10]: **ValidMind GitHub:** [validmind-library/validmind/&lowbar;&lowbar;version&lowbar;&lowbar;.py](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py)
\ No newline at end of file
diff --git a/site/developer/model-documentation/store-credentials-in-env-file.qmd b/site/developer/quickstart/store-credentials-in-env-file.qmd
similarity index 61%
rename from site/developer/model-documentation/store-credentials-in-env-file.qmd
rename to site/developer/quickstart/store-credentials-in-env-file.qmd
index 484ec10487..c59d30396e 100644
--- a/site/developer/model-documentation/store-credentials-in-env-file.qmd
+++ b/site/developer/quickstart/store-credentials-in-env-file.qmd
@@ -2,10 +2,11 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Store model credentials in `.env` files"
+title: "Store record credentials in `.env` files"
 date: last-modified
 aliases:
   - /guide/store-credentials-in-env-file.html
+  - /developer/model-documentation/store-credentials-in-env-file.html
 listing:
   - id: whats-next
     type: grid
@@ -18,7 +19,7 @@ listing:
     - ../how-to/feature-overview.qmd
 ---
 
-Learn how to store model identifier credentials in an `.env` file instead of using inline credentials, allowing you to follow best practices for security when running Jupyter Notebooks.
+Learn how to store record (model) identifier credentials in an `.env` file instead of using inline credentials, allowing you to follow best practices for security when running Jupyter Notebooks.
 
 <br>
 
@@ -26,9 +27,9 @@ Learn how to store model identifier credentials in an `.env` file instead of usi
 ::: {.callout collapse="true" appearance="minimal"}
 ### Why is it recommended to store credentials in an `.env` file?
 
-Storing credentials in a `.env` file is considered a best practice for security. Embedding credentials directly within the code makes them more susceptible to accidental exposure when sharing code or collaborating on models.
+Storing credentials in an `.env` file is considered a best practice for security. Embedding credentials directly within the code makes them more susceptible to accidental exposure when sharing code or collaborating on records.
 
-Keeping model credentials in a separate file also allows for precise access control and ensures that sensitive credentials are not publicly accessible.
+Keeping record credentials in a separate file also allows for precise access control and ensures that sensitive credentials are not publicly accessible.
 
 :::
 :::
@@ -39,10 +40,10 @@ Keeping model credentials in a separate file also allows for precise access cont
 
 - [x] {{< var link.login >}}
 - [x] The record you want to store credentials for is registered in the inventory.[^1]
-- [x] You are the record owner, model validator, or another model stakeholder with sufficient permissions to perform the tasks in this guide.[^2]
+- [x] You are the owner, validator, or another inventory record stakeholder with sufficient permissions to perform the tasks in this guide.[^2]
 
 ::: {.callout}
-Before you follow the steps on this page, we recommend that you first complete our introductory guide on how to [Install and initialize the {{< var validmind.developer >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd).
+Before you follow the steps on this page, we recommend that you first complete our introductory guide on how to [Install and initialize the {{< var validmind.developer >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd).
 
 :::
 
@@ -54,17 +55,19 @@ Before you follow the steps on this page, we recommend that you first complete o
 
 ### a. Get your code snippet
 
-In the {{< var validmind.platform >}}, retrieve the code snippet for your model:
+In the {{< var validmind.platform >}}, retrieve the code snippet for your record:
 
 i. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
-ii. Select a model by clicking on it or find your model by applying a filter or searching for it.[^3]
+ii. Under the [record type]{.smallcaps} drop-down, select the type of record you want to retrieve the code snippet for.[^3]
 
-iii. In the left sidebar that appears for your model, click **{{< fa rocket >}} Getting Started**.
+iii. Select a record by clicking on it or find your record by applying a filter or searching for it.[^4]
 
-iv. Select the **[document]{.smallcaps}** you want to automatically upload test results to.[^4]
+iv. In the left sidebar that appears for your record, click **{{< fa rocket >}} Getting Started**.
 
-v. Click **{{< fa regular copy >}} Copy snippet to clipboard**.
+v. Select the **[document]{.smallcaps}** you want to automatically upload test results to.[^5]
+
+vi. Click **{{< fa regular copy >}} Copy snippet to clipboard**.
 
 ### b. Create an `.env` file
 
@@ -72,7 +75,7 @@ i. Create a new file in the same folder as your notebook and name it `.env`.
 
    This is a hidden file, so you may need to change your settings to view it.
 
-ii. Use the code snippet from your clipboard to build the credentials in your `.env` file in the following format:[^5]
+ii. Use the code snippet from your clipboard to build the credentials in your `.env` file in the following format:[^6]
 
       ```yaml
       VM_API_HOST=<api_host>
@@ -82,7 +85,7 @@ ii. Use the code snippet from your clipboard to build the credentials in your `.
       ```
 
 ::: {.callout}
-To define the document to connect the {{< var validmind.developer >}} to, or to enable monitoring, include these in your `vm.init()` snippet within your Jupyter Notebook.[^6]
+To define the document to connect the {{< var validmind.developer >}} to, or to enable monitoring, include these in your `vm.init()` snippet within your Jupyter Notebook.[^7]
 
 :::
 
@@ -90,7 +93,7 @@ To define the document to connect the {{< var validmind.developer >}} to, or to
 
 ## 2. Use credentials in your Jupyter Notebook
 
-a. After installing the {{< var validmind.developer >}} within your Jupyter Notebook,[^7] insert this code snippet in a code cell above your model identifier credentials:
+a. After installing the {{< var validmind.developer >}} within your Jupyter Notebook,[^8] insert this code snippet in a code cell above your record (model) identifier credentials:
 
    ```python
    %load_ext dotenv
@@ -118,7 +121,7 @@ b. Remove the inline credentials from `vm.init()` after importing the {{< var vm
 
    ### With ongoing monitoring
 
-   Example updated code cell including ongoing monitoring:[^8]
+   Example updated code cell including ongoing monitoring:[^9]
 
    ```python
    %load_ext dotenv
@@ -137,13 +140,13 @@ b. Remove the inline credentials from `vm.init()` after importing the {{< var vm
    ::: {.callout}
    ## A template must already be applied to your selected document to populate test results in the {{< var validmind.platform >}}.
 
-   Selecting a document to connect to requires {{< var validmind.developer >}} version >=2.12.0.[^9] Attempting to initialize the {{< var vm.developer >}} with a document that does not have a template applied will result in an error.
+   Selecting a document to connect to requires {{< var validmind.developer >}} version >=2.12.0.[^10] Attempting to initialize the {{< var vm.developer >}} with a document that does not have a template applied will result in an error.
 
    :::
 
 c. Run the cell.
 
-   Instead of using inline credentials, this code cell will now load your model credentials from a `.env` file.
+   Instead of using inline credentials, this code cell will now load your record credentials from a `.env` file.
 
 ## What's next
 
@@ -157,11 +160,13 @@ c. Run the cell.
 
 [^2]: [Manage inventory record stakeholders](/guide/inventory/edit-inventory-fields.qmd#manage-inventory-record-stakeholders)
 
-[^3]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
+[^3]: [Manage inventory record types](/guide/inventory/manage-inventory-record-types.qmd)
+
+[^4]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
 
-[^4]: [Working with documents](/guide/templates/working-with-documents.qmd)
+[^5]: [Working with documents](/guide/templates/working-with-documents.qmd)
 
-[^5]:
+[^6]:
 
     For example, if your credentials look like this:
 
@@ -186,10 +191,10 @@ c. Run the cell.
     VM_API_MODEL=model789
     ```
 
-[^6]: [Use credentials in your Jupyter Notebook](#use-credentials-in-your-jupyter-notebook)
+[^7]: [Use credentials in your Jupyter Notebook](#use-credentials-in-your-jupyter-notebook)
 
-[^7]: [Install and initialize the {{< var validmind.developer >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd#install-validmind)
+[^8]: [Install and initialize the {{< var validmind.developer >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd#install-validmind)
 
-[^8]: [Enable monitoring](/guide/monitoring/enable-monitoring.qmd)
+[^9]: [Enable monitoring](/guide/monitoring/enable-monitoring.qmd)
 
-[^9]: [Install and initialize the {{< var validmind.developer >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd#upgrade-validmind)
+[^10]: [Install and initialize the {{< var validmind.developer >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd#upgrade-validmind)
diff --git a/site/developer/model-documentation/use-http-proxy-with-validmind-library.qmd b/site/developer/quickstart/use-http-proxy-with-validmind-library.qmd
similarity index 94%
rename from site/developer/model-documentation/use-http-proxy-with-validmind-library.qmd
rename to site/developer/quickstart/use-http-proxy-with-validmind-library.qmd
index 233e18aae8..0e31b14a1e 100644
--- a/site/developer/model-documentation/use-http-proxy-with-validmind-library.qmd
+++ b/site/developer/quickstart/use-http-proxy-with-validmind-library.qmd
@@ -4,6 +4,8 @@
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
 title: "Use an HTTP proxy with the ValidMind Library"
 date: last-modified
+aliases:
+  - /developer/model-documentation/use-http-proxy-with-validmind-library.html
 listing:
   - id: whats-next
     type: grid
@@ -12,8 +14,8 @@ listing:
     fields: [title, description]
     grid-columns: 2
     contents:
-    - ../../notebooks/quickstart/quickstart_model_documentation.ipynb
-    - ../../notebooks/quickstart/quickstart_model_validation.ipynb
+    - ../../notebooks/quickstart/quickstart_documentation.ipynb
+    - ../../notebooks/quickstart/quickstart_validation.ipynb
 ---
 
 Outbound HTTPS traffic to the ValidMind API relies on standard Python HTTP clients that honor proxy-related environment variables, which lets you work behind corporate or regional proxies without custom library configuration.
@@ -90,7 +92,7 @@ If you change proxy variables after a session has already started, restart the k
 
 <!-- FOOTNOTES -->
 
-[^1]: If you have not installed the library yet, start with [Install and initialize the {{< var validmind.developer >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd).
+[^1]: If you have not installed the library yet, start with [Install and initialize the {{< var validmind.developer >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd).
 
 [^2]: For example, refer to [aiohttp client advanced topics](https://docs.aiohttp.org/en/stable/client_advanced.html#proxy-support), [Requests proxies](https://requests.readthedocs.io/en/latest/user/advanced/#proxies), and [HTTPX proxies](https://www.python-httpx.org/advanced/proxies/).
 
diff --git a/site/developer/samples-jupyter-notebooks.qmd b/site/developer/samples-jupyter-notebooks.qmd
index 63786d527b..62e71b7928 100644
--- a/site/developer/samples-jupyter-notebooks.qmd
+++ b/site/developer/samples-jupyter-notebooks.qmd
@@ -41,15 +41,6 @@ listing:
     image-height: "100%"
     fields: [title, description, reading-time]
     contents: "../notebooks/use_cases/credit_risk/*.ipynb"
-  - id: model-validation
-    type: grid
-    grid-columns: 2
-    page-size: 4
-    image-placeholder: "jupyter-logo-rectangle.svg"
-    max-description-length: 350
-    image-height: "100%"
-    fields: [title, description, reading-time]
-    contents: "../notebooks/use_cases/model_validation/*.ipynb"
   - id: nlp-and-llm
     type: grid
     grid-columns: 2
@@ -86,6 +77,15 @@ listing:
     image-height: "100%"
     fields: [title, description, reading-time]
     contents: "../notebooks/use_cases/time_series/*.ipynb"
+  - id: validation
+    type: grid
+    grid-columns: 2
+    page-size: 4
+    image-placeholder: "jupyter-logo-rectangle.svg"
+    max-description-length: 350
+    image-height: "100%"
+    fields: [title, description, reading-time]
+    contents: "../notebooks/use_cases/validation/*.ipynb"
 fig-cap-location: top
 aliases:
   - /guide/samples-jupyter-notebooks.html
@@ -140,11 +140,6 @@ Our Jupyter Notebook code samples showcase the capabilities and features of the
 :::{#credit-risk}
 :::
 
-## Model validation
-
-:::{#model-validation}
-:::
-
 ## NLP and LLM
 
 :::{#nlp-and-llm}
@@ -165,4 +160,9 @@ Our Jupyter Notebook code samples showcase the capabilities and features of the
 :::{#time-series}
 :::
 
+## Validation
+
+:::{#validation}
+:::
+
 :::
diff --git a/site/developer/supported-models-and-frameworks.qmd b/site/developer/supported-records-and-frameworks.qmd
similarity index 88%
rename from site/developer/supported-models-and-frameworks.qmd
rename to site/developer/supported-records-and-frameworks.qmd
index ab9319d529..5704b52d0c 100644
--- a/site/developer/supported-models-and-frameworks.qmd
+++ b/site/developer/supported-records-and-frameworks.qmd
@@ -2,15 +2,16 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Supported models and frameworks"
+title: "Supported records and frameworks"
 date: last-modified
 aliases:
   - /guide/supported-models.html
   - /developer/model-documentation/supported-models.html
   - /developer/supported-models.html
   - /developer/supported-model-frameworks.html
+  - /developer/supported-models-and-frameworks.html
 listing:
-  - id: next-models
+  - id: whats-next
     type: grid
     grid-columns: 2
     max-description-length: 250
@@ -18,20 +19,22 @@ listing:
     fields: [title, description]
     contents:
     - /how-to/testing-overview.qmd
-    - test-descriptions.qmd
+    - how-to/test-sandbox.qmd
     - /how-to/feature-overview.qmd
     - samples-jupyter-notebooks.qmd
 ---
 
-Learn about the wide range of models and frameworks for testing and documentation supported by the {{< var validmind.developer >}}. Understand which frameworks are supported, what your model needs to provide for tests to run, and how to work with models that don't fit standard patterns.
+Learn about the wide range of records (such as models) and frameworks for testing and documentation supported by the {{< var validmind.developer >}}.
+
+Understand which frameworks are supported, what your record needs to provide for tests to run, and how to work with records that don't fit standard patterns.
 
 ::: {.attn}
 
-## What does _supported_ mean? 
+## What does _supported_ mean?
 
-_Supported_ here means the {{< var validmind.developer >}} provides dedicated wrappers, install options, and guidance for these models and frameworks. 
+_Supported_ here means the {{< var validmind.developer >}} provides dedicated wrappers, install options, and guidance for these records and frameworks.
 
-You can also use other code with the {{< var vm.developer >}} for models that don't fit standard framework patterns. For example, you can wrap any Python callable with `FunctionModel` or pass precomputed predictions when you don't have a model object.
+You can also use other code with the {{< var vm.developer >}} for records that don't fit standard framework patterns. For example, you can wrap any Python callable with `FunctionModel` or pass precomputed predictions when you don't have a traditional model object.
 
 :::: {.columns}
 
@@ -41,8 +44,8 @@ Framework-agnostic support
 :::
 
 ::: {.column width="50%" .pl3}
-Vendor model compatibility
-: Works with both first-party models you create and third-party models from external vendors, enabling flexible integration with both proprietary and external sources.
+Vendor record compatibility
+: Works with both first-party records you create and third-party records from external vendors, enabling flexible integration with both proprietary and external sources.
 :::
 
 ::::
@@ -149,7 +152,7 @@ ARIMA, VAR, and other statsmodels time series models.
 
 ## Frameworks
 
-The {{< var validmind.developer >}} provides wrapper classes for common frameworks. When you call `vm.init_model()`, the library automatically detects your model's framework from its module, such as `sklearn`, `torch`, or `transformers`, and selects the appropriate wrapper. You don't need to specify the wrapper class manually.
+The {{< var validmind.developer >}} provides wrapper classes for common frameworks. When you call `vm.init_model()`, the library automatically detects your record's framework from its module, such as `sklearn`, `torch`, or `transformers`, and selects the appropriate wrapper. You don't need to specify the wrapper class manually.
 
 ::: {.panel-tabset}
 ## CatBoost
@@ -227,13 +230,13 @@ pip install validmind[all]
 
 ### Test input requirements
 
-Different tests require different inputs from your model and dataset. Understanding these requirements helps you run the right tests for your use case.[^1]
+Different tests require different inputs from your record and dataset. Understanding these requirements helps you run the right tests for your use case.[^1]
 
 ::: {.panel-tabset}
 
 #### When `predict()` is required
 
-Most model tests call your model's `predict()` method to generate predictions. This includes:
+Most record tests call your record's `predict()` method to generate predictions. This includes:
 
 - Performance metrics (accuracy, precision, recall, F1)
 - Error analysis tests
@@ -248,7 +251,7 @@ Classification metrics that evaluate probability outputs require `predict_proba(
 - Calibration tests
 - Probability distribution analysis
 
-If your model doesn't have `predict_proba()`, these tests will be skipped or return an error.
+If your record doesn't have `predict_proba()`, these tests will be skipped or return an error.
 
 :::
 
@@ -280,7 +283,7 @@ flowchart LR
 
 ### Using precomputed predictions
 
-If you can't provide a model object because your model runs in a separate environment, you can pass precomputed predictions directly to the dataset:
+If you can't provide a model object because your record runs in a separate environment, you can pass precomputed predictions directly to the dataset:
 
 ```python
 vm_dataset = vm.init_dataset(
@@ -304,7 +307,7 @@ vm_dataset = vm.init_dataset(
 
 ### Dataset-only tests
 
-Some tests analyze data quality and don't require a model at all:
+Some tests analyze data quality and don't require a record at all:
 
 - Missing value analysis
 - Class imbalance detection
@@ -325,7 +328,7 @@ The library accepts multiple data formats when initializing datasets with `vm.in
 
 ## Custom model wrappers
 
-For models that don't fit standard framework patterns, use these flexible wrappers:
+For records that don't fit standard framework patterns, use these flexible wrappers:
 
 ::: {.panel-tabset}
 ### FunctionModel
@@ -518,7 +521,7 @@ Optional dependencies for specific frameworks:
 
 ## What's next
 
-:::{#next-models}
+:::{#whats-next}
 :::
 
 <!-- FOOTNOTES -->
diff --git a/site/developer/test-descriptions.qmd b/site/developer/test-descriptions.qmd
deleted file mode 100644
index fc82f7d8bc..0000000000
--- a/site/developer/test-descriptions.qmd
+++ /dev/null
@@ -1,67 +0,0 @@
----
-# Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-# Refer to the LICENSE file in the root of this repository for details.
-# SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Test descriptions"
-date: last-modified
-aliases:
-  - /guide/test-descriptions.html
-  - /developer/model-testing/test-descriptions.html
-listing:
-  - id: data-validation
-    contents: "../tests/data_validation/*.md"
-    type: grid
-    max-description-length: 250
-    page-size: 150
-    fields: [title, description]
-  - id: model-validation
-    type: grid
-    contents: "../tests/model_validation/*.md"
-    max-description-length: 250
-    page-size: 150
-    fields: [title, description]
-  - id: prompt-validation
-    contents: "../tests/prompt_validation/*.md"
-    type: grid
-    max-description-length: 250
-    page-size: 150
-    fields: [title, description]  
-  - id: ongoing-monitoring
-    contents: "../tests/ongoing_monitoring/*.md"
-    type: grid
-    max-description-length: 250
-    page-size: 150
-    fields: [title, description]  
----
-
-Tests that are available as part of the {{< var validmind.developer >}}, grouped by type of validation or monitoring test.
-
-::: {.callout}
-## {{< fa flask >}} [Try the test sandbox <sup>[beta]{.smallcaps}</sup>](how-to/test-sandbox.qmd)
-
-Explore our interactive sandbox to see what tests are available in the {{< var validmind.developer >}}.
-:::
-
-:::{.panel-tabset}
-
-## {{< fa database >}} Data validation
-
-:::{#data-validation}
-:::
-
-## {{< fa cube >}} Model validation
-
-:::{#model-validation}
-:::
-
-## {{< fa terminal >}} Prompt validation
-
-:::{#prompt-validation}
-:::
-
-## {{< fa desktop >}} Ongoing monitoring
-
-:::{#ongoing-monitoring}
-:::
-
-:::
diff --git a/site/developer/validmind-library.qmd b/site/developer/validmind-library.qmd
index 698a4b4d93..e522a4772a 100644
--- a/site/developer/validmind-library.qmd
+++ b/site/developer/validmind-library.qmd
@@ -19,42 +19,42 @@ listing:
     fields: [title, description]
     grid-columns: 2
     contents:
-    - ../notebooks/quickstart/quickstart_model_documentation.ipynb
-    - ../notebooks/quickstart/quickstart_model_validation.ipynb
-  - id: model-development
+    - ../notebooks/quickstart/quickstart_documentation.ipynb
+    - ../notebooks/quickstart/quickstart_validation.ipynb
+  - id: development
     type: grid
     grid-columns: 2
     max-description-length: 250
     contents:
-    - path: ../notebooks/tutorials/model_development/1-set_up_validmind.ipynb
+    - path: ../notebooks/tutorials/development/1-set_up_validmind.ipynb
       title: "1 — Set up the {{< var validmind.developer >}}"
       description: "Get to know {{< var vm.product >}} by setting up the {{< var validmind.developer >}} in your own environment, and registering a sample binary classification model in the {{< var validmind.platform >}} for use with this series of notebooks."
-    - path: ../notebooks/tutorials/model_development/2-start_development_process.ipynb
-      title: "2 — Start the model development process"
+    - path: ../notebooks/tutorials/development/2-start_development_process.ipynb
+      title: "2 — Start the development process"
       description: "Learn to run and log tests with a variety of methods and in different situations with the {{< var validmind.developer >}}, then add the results or evidence to your documentation for the sample model you registered."
-    - path: ../notebooks/tutorials/model_development/3-integrate_custom_tests.ipynb
+    - path: ../notebooks/tutorials/development/3-integrate_custom_tests.ipynb
       title: "3 — Integrate custom tests"
       description: "After you become familiar with the basics of the {{< var validmind.developer >}}, learn how to supplement ValidMind tests with your own and include them as additional evidence in your documentation. "
-    - path: ../notebooks/tutorials/model_development/4-finalize_testing_documentation.ipynb
+    - path: ../notebooks/tutorials/development/4-finalize_testing_documentation.ipynb
       title: "4 — Finalize testing and documentation"
-      description: "Wrap up by learning how to ensure that custom tests are included in your model's documentation template. By the end of this series, you will have a fully documented sample model ready for review."
-  - id: model-validation
+      description: "Wrap up by learning how to ensure that custom tests are included in your documentation template. By the end of this series, you will have a fully documented sample model ready for review."
+  - id: validation
     type: grid
     grid-columns: 2
     max-description-length: 250
     contents:
-    - path: ../notebooks/tutorials/model_validation/1-set_up_validmind_for_validation.ipynb
+    - path: ../notebooks/tutorials/validation/1-set_up_validmind_for_validation.ipynb
       title: "1 — Set up the {{< var validmind.developer >}} for validation"
       description: "Get to know {{< var vm.product >}} by setting up the {{< var validmind.developer >}} in your own environment, and gaining access as a validator to a sample model in the {{< var validmind.platform >}} for use with this series of notebooks."
-    - path: ../notebooks/tutorials/model_validation/2-start_validation_process.ipynb
-      title: "2 — Start the model validation process"
-      description: "Independently verify the data quality tests performed on datasets used to train the dummy champion model using tests from the {{< var validmind.developer >}}, then add the results or evidence to your validation report."
-    - path: ../notebooks/tutorials/model_validation/3-developing_challenger_model.ipynb
-      title: "3 — Developing a potential challenger model"
-      description: "After you become familiar with the basics of the {{< var validmind.developer >}}, use it to develop a potential challenger model and run thorough model comparison tests, such as performance, diagnostic, and feature importance tests."
-    - path: ../notebooks/tutorials/model_validation/4-finalize_validation_reporting.ipynb
+    - path: ../notebooks/tutorials/validation/2-start_validation_process.ipynb
+      title: "2 — Start the validation process"
+      description: "Independently verify the data quality tests performed on datasets used to train the dummy champion using tests from the {{< var validmind.developer >}}, then add the results or evidence to your validation report."
+    - path: ../notebooks/tutorials/validation/3-developing_potential_challenger.ipynb
+      title: "3 — Developing a potential challenger"
+      description: "After you become familiar with the basics of the {{< var validmind.developer >}}, use it to develop a potential challenger and run thorough comparison tests, such as performance, diagnostic, and feature importance tests."
+    - path: ../notebooks/tutorials/validation/4-finalize_validation_reporting.ipynb
       title: "4 — Finalize validation and reporting"
-      description: "Wrap up by learning how to include custom tests and verifying that all tests conducted during model development were run and reported accurately. By the end of this series, you will have a validation report complete with artifacts ready for review."
+      description: "Wrap up by learning how to include custom tests and verifying that all tests conducted during development were run and reported accurately. By the end of this series, you will have a validation report complete with artifacts ready for review."
   - id: library-features
     grid-columns: 2
     type: grid
@@ -73,7 +73,7 @@ listing:
     contents:
     - ../notebooks/use_cases/agents/document_agentic_ai.ipynb
     - ../notebooks/use_cases/credit_risk/document_excel_application_scorecard.ipynb
-    - ../notebooks/use_cases/model_validation/validate_application_scorecard.ipynb
+    - ../notebooks/use_cases/validation/validate_application_scorecard.ipynb
   - id: library-documentation
     type: grid
     grid-columns: 2
@@ -85,19 +85,19 @@ listing:
     - ../guide/documentation/work-with-content-blocks.qmd
 ---
 
-The {{< var validmind.developer >}} streamlines model development and validation by automating testing. Run tests, log those test results to the {{< var validmind.platform >}}, and have fully supported drafts of documentation or reporting ready for you to fine-tune.
+The {{< var validmind.developer >}} streamlines development and validation by automating testing. Run tests, log those test results to the {{< var validmind.platform >}}, and have fully supported drafts of documentation or reporting ready for you to fine-tune.
 
 ## What is the {{< var validmind.developer >}}?
 
-The {{< var validmind.developer >}} provides a rich collection of documentation tools and test suites, from documenting descriptions of your dataset to validation testing your models for weak spots and overfit areas. 
+The {{< var validmind.developer >}} provides a rich collection of documentation tools and test suites, from documenting descriptions of your datasets to validation testing your records (such as models) for weak spots and overfit areas.
 
-{{< var vm.product >}} offers two primary methods for automating model documentation:
+{{< var vm.product >}} offers two primary methods for automating documentation:
 
-- **Generate documentation**[^1] — Through automation, the {{< var vm.developer >}} extracts metadata from associated datasets and models for you and generates model documentation based on a template. You can also add more documentation and tests manually using the documentation editing capabilities in the {{< var validmind.platform >}}.
+- **Generate documentation**[^1] — Through automation, the {{< var vm.developer >}} extracts metadata from associated datasets and records for you and generates documentation based on a template. You can also add more documentation and tests manually using the documentation editing capabilities in the {{< var validmind.platform >}}.
 
-- **Run validation tests**[^2] — The {{< var vm.developer >}} provides a suite of validation tests for common financial services use cases. For cases where these tests do not cover everything you need, you can also extend existing test suites with your own proprietary tests or testing providers. 
+- **Run validation tests**[^2] — The {{< var vm.developer >}} provides a suite of validation tests for common financial services use cases. For cases where these tests do not cover everything you need, you can also extend existing test suites with your own proprietary tests or testing providers.
 
-The {{< var validmind.developer >}} is designed to be model agnostic. If your model is built in Python, the {{< var vm.developer >}} provides all the standard functionality you may need without requiring you to rewrite any functions.
+The {{< var validmind.developer >}} is designed to be agnostic to the type of record you work with. For example, if you have a model built with Python, the {{< var vm.developer >}} provides all the standard functionality you may need without requiring you to rewrite any functions.
 
 ::: {.callout-important collapse="true" appearance="minimal"}
 ## Key {{< var vm.product >}} concepts
@@ -110,7 +110,7 @@ The {{< var validmind.developer >}} is designed to be model agnostic. If your mo
 
 ## Quickstart
 
-After you [**sign up**](/guide/access/accessing-validmind.qmd) for {{< var vm.product >}} to get access, try our Jupyter Notebook quickstarts for model documentation or validation:
+After you [**sign up**](/guide/access/accessing-validmind.qmd) for {{< var vm.product >}} to get access, try our Jupyter Notebook quickstarts for documentation or validation:
 
 :::{#library-quickstart}
 :::
@@ -121,20 +121,20 @@ Learn how to use the {{< var validmind.developer >}} with our high-level Jupyter
 
 <span id="development"></span>
 
-#### {{< var vm.product >}} for model development
+#### {{< var vm.product >}} for development
 
-Learn how to use ValidMind for your end-to-end model documentation process based on common model development scenarios with our *ValidMind for model development* series of four introductory notebooks:
+Learn how to use ValidMind for your end-to-end documentation process based on common development scenarios with our *ValidMind for development* series of four introductory notebooks:
 
-:::{#model-development}
+:::{#development}
 :::
 
 <span id="validation"></span>
 
-#### {{< var vm.product >}} for model validation
+#### {{< var vm.product >}} for validation
 
-Learn how to use ValidMind for your end-to-end model validation process based on common scenarios with our *ValidMind for model validation* series of four introductory notebooks:
+Learn how to use ValidMind for your end-to-end validation process based on common scenarios with our *ValidMind for validation* series of four introductory notebooks:
 
-:::{#model-validation}
+:::{#validation}
 :::
 
 
@@ -142,7 +142,7 @@ Learn how to use ValidMind for your end-to-end model validation process based on
 
 :::: {.flex .flex-wrap .justify-around}
 
-Learn how to use the comprehensive out-of-the-box tests and test suites, and other features in the {{< var validmind.developer >}} that make it easy for you to automate building, documenting, validating your models and more.
+Learn how to use the comprehensive out-of-the-box tests and test suites, and other features in the {{< var validmind.developer >}} that make it easy for you to automate building, documenting, and validating your records, and more.
 
 :::{#library-features}
 :::
@@ -169,9 +169,9 @@ Examples that you can build on and adapt for your own usage include:
 :::{#code-samples}
 :::
 
-## Work with model documentation
+## Work with documentation
 
-After you have tried out the {{< var validmind.developer >}}, continue working with your model documentation in the {{< var validmind.platform >}}:[^3]
+After you have tried out the {{< var validmind.developer >}}, continue working with your documentation in the {{< var validmind.platform >}}:[^3]
 
 :::{#library-documentation}
 :::
@@ -182,8 +182,8 @@ After you have tried out the {{< var validmind.developer >}}, continue working w
 
 <!-- FOOTNOTES -->
 
-[^1]: [{{< var vm.product >}} for model development](#development)
+[^1]: [{{< var vm.product >}} for development](#development)
 
-[^2]: [{{< var vm.product >}} for model validation](#validation)
+[^2]: [{{< var vm.product >}} for validation](#validation)
 
 [^3]: [Working with documentation](/guide/documentation/working-with-documentation.qmd)
\ No newline at end of file
diff --git a/site/faq/_faq-activity.qmd b/site/faq/_faq-activity.qmd
index b950ebeccd..42dee4c34c 100644
--- a/site/faq/_faq-activity.qmd
+++ b/site/faq/_faq-activity.qmd
@@ -2,7 +2,7 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-## Is activity on models, documents, etc. logged?
+## Is activity on records, documents, etc. logged?
 
-- Yes, the {{< var validmind.platform >}}^[[Accessing {{< var vm.product >}}](/guide/access/accessing-validmind.qmd)] provides an audit trail functionality, enabling you to track or audit all the events associated with a specific model.
-- You can review a full record of comments, workflow status changes, and any other updates made to the model, including modifications to documents or test results.
\ No newline at end of file
+- Yes, the {{< var validmind.platform >}}^[[Accessing {{< var vm.product >}}](/guide/access/accessing-validmind.qmd)] provides audit trail functionality, enabling you to track or audit all the events associated with a specific record (such as a model).
+- You can review a full record of comments, workflow status changes, and any other updates made to the record, including modifications to documents or test results.
\ No newline at end of file
diff --git a/site/faq/_faq-attachments.qmd b/site/faq/_faq-attachments.qmd
index a37ad2d71b..625f325a92 100644
--- a/site/faq/_faq-attachments.qmd
+++ b/site/faq/_faq-attachments.qmd
@@ -2,11 +2,11 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-## Can we attach files to models, artifacts, or documents? 
+## Can we attach files to records, artifacts, or documents?
 
-Yes, attachment type inventory fields are available for custom use.^[[Manage inventory fields](/guide/inventory/manage-inventory-fields.qmd)] Once created, attachment type fields allow you to upload supporting files to your model.
+Yes, attachment type inventory fields are available for custom use.^[[Manage inventory fields](/guide/inventory/manage-inventory-fields.qmd)] Once created, attachment type fields allow you to upload supporting files to your record (model).
 
-- Out-of-the-box functionality is included for attaching files to model artifacts.
+- Out-of-the-box functionality is included for attaching files to artifacts.
 - You can also attach images to document content blocks and comments.
 
-By default, the [{{< fa hand >}} Customer Admin]{.bubble} role has sufficient permissions to manage model inventory fields.
\ No newline at end of file
+By default, the [{{< fa hand >}} Customer Admin]{.bubble} role has sufficient permissions to manage inventory fields.
\ No newline at end of file
diff --git a/site/faq/_faq-explainability.qmd b/site/faq/_faq-explainability.qmd
index 5d51af7799..f4fc4bcb68 100644
--- a/site/faq/_faq-explainability.qmd
+++ b/site/faq/_faq-explainability.qmd
@@ -2,18 +2,18 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-## Do you include explainability-related testing and documentation? 
-<span id="explanability"></span>
-Yes, {{< var vm.product >}} includes explainability-related testing and documentation as part of our offerings. Our approach incorporates a comprehensive suite of tests designed to evaluate model interpretability and identify potential risks, ensuring transparency and reliability in model outcomes. 
+## Do you include explainability-related testing and documentation?
+<span id="explainability"></span>
+Yes, {{< var vm.product >}} includes explainability-related testing and documentation as part of our offerings. Our approach incorporates a comprehensive suite of tests designed to evaluate interpretability and identify potential risks, ensuring transparency and reliability in outcomes.
 
-Below is an overview of our key explainability-related tests:
+Below is an overview of our key explainability-related tests,^[[{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd)] using models as an example:
 
-- **Features AUC**^[[FeaturesAUC](/tests/model_validation/FeaturesAUC.md)] — Assesses the discriminatory power of individual features in binary classification models, providing insights into how well each feature differentiates between classes. This test supports explainability by isolating the contribution of each feature to the classification task.
-- **Feature Importance**^[[FeatureImportance](/tests/model_validation/sklearn/FeatureImportance.md)] — Generates feature importance scores to identify and compare impactful features across different models and datasets. By highlighting the relative significance of features, this test clarifies how inputs influence model predictions.
-- **Overfit Diagnosis**^[[OverfitDiagnosis](/tests/model_validation/sklearn/OverfitDiagnosis.md)] — Detects potential overfitting by comparing performance between training and testing sets for specific feature segments, highlighting areas of significant deviation. This test aids explainability by revealing where model behavior is inconsistent, offering insights into its generalization capability.
-- **Permutation Feature Importance**^[[PermutationFeatureImportance](/tests/model_validation/sklearn/PermutationFeatureImportance.md)] — Measures feature significance by analyzing the impact of randomly rearranging feature values on model performance. This test quantifies the dependency of model performance on each feature, making it clear which inputs drive the predictions.
-- **SHAP Global Importance**^[[SHAPGlobalImportance](/tests/model_validation/sklearn/SHAPGlobalImportance.md)] — Uses SHAP (SHapley Additive exPlanations) values to assign global importance to features, offering a clear explanation of model outcomes and supporting risk identification. SHAP values provide a mathematically sound attribution of model predictions to specific features, enhancing interpretability.
-- **Weakspots Diagnosis**^[[WeakspotsDiagnosis](/tests/model_validation/sklearn/WeakspotsDiagnosis.md)] — Identifies and visualizes regions of suboptimal model performance across the feature space, highlighting areas that may require further attention. This test explains where and why the model struggles by connecting poor performance to specific feature regions.
+- **Features AUC** — Assesses the discriminatory power of individual features in binary classification models, providing insights into how well each feature differentiates between classes. This test supports explainability by isolating the contribution of each feature to the classification task.
+- **Feature Importance** — Generates feature importance scores to identify and compare impactful features across different models and datasets. By highlighting the relative significance of features, this test clarifies how inputs influence model predictions.
+- **Overfit Diagnosis** — Detects potential overfitting by comparing performance between training and testing sets for specific feature segments, highlighting areas of significant deviation. This test aids explainability by revealing where model behavior is inconsistent, offering insights into its generalization capability.
+- **Permutation Feature Importance** — Measures feature significance by analyzing the impact of randomly rearranging feature values on model performance. This test quantifies the dependency of model performance on each feature, making it clear which inputs drive the predictions.
+- **SHAP Global Importance** — Uses SHAP (SHapley Additive exPlanations) values to assign global importance to features, offering a clear explanation of model outcomes and supporting risk identification. SHAP values provide a mathematically sound attribution of model predictions to specific features, enhancing interpretability.
+- **Weakspots Diagnosis** — Identifies and visualizes regions of suboptimal model performance across the feature space, highlighting areas that may require further attention. This test explains where and why the model struggles by connecting poor performance to specific feature regions.
 
 ::: {.callout}
 ## When logged for documentation, each test automatically generates a comprehensive report as soon as it is executed. 
diff --git a/site/faq/_faq-images.qmd b/site/faq/_faq-images.qmd
index 2d36be4758..c84d874f14 100644
--- a/site/faq/_faq-images.qmd
+++ b/site/faq/_faq-images.qmd
@@ -2,7 +2,7 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-## Do you support including images in model documents?
+## Do you support including images in documents?
 <span id="images"></span>
 Yes, as long as you can produce the image with Python or open the image from a file, you can include it in your documents with {{< var vm.product >}}:^[[Implement custom tests](/notebooks/how_to/tests/custom_tests/implement_custom_tests.ipynb#custom-test-images)]
 
diff --git a/site/faq/_faq-model-updates.qmd b/site/faq/_faq-model-updates.qmd
deleted file mode 100644
index a9a23c7325..0000000000
--- a/site/faq/_faq-model-updates.qmd
+++ /dev/null
@@ -1,9 +0,0 @@
-<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-Refer to the LICENSE file in the root of this repository for details.
-SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
-
-## How does {{< var vm.product >}} manage updates to models?
-
-1. {{< var vm.product >}} allows model developers to re-run documentation functions with the {{< var validmind.developer >}}^[[{{< var validmind.developer >}}](/developer/validmind-library.qmd)] to capture changes in the model, such as changes in the number of features or hyperparameters. 
-2. After a model developer has made a change in their development environment, such as to a Jupyter Notebook,^[[Code samples](/developer/samples-jupyter-notebooks.qmd)] they can execute the relevant {{< var vm.product >}} documentation function to update the corresponding documentation section. 
-3. {{< var vm.product >}} will then automatically recreate the relevant figures and tables and update them in the online documentation.
\ No newline at end of file
diff --git a/site/faq/_faq-monitoring.qmd b/site/faq/_faq-monitoring.qmd
index 76d6b43827..372ac8f510 100644
--- a/site/faq/_faq-monitoring.qmd
+++ b/site/faq/_faq-monitoring.qmd
@@ -2,11 +2,11 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-## Does {{< var vm.product >}} support monitoring models after deployment?
+## Does {{< var vm.product >}} support monitoring records after deployment?
 
-Yes, {{< var vm.product >}} offers ongoing monitoring support to help you regularly assess a model’s accuracy, stability, and robustness to ensure it remains reliable after deployment: 
+Yes, {{< var vm.product >}} offers ongoing monitoring support to help you regularly assess a record’s accuracy, stability, and robustness to ensure it remains reliable after deployment:
 
-- You can enable monitoring for both new and existing models.^[[Enable monitoring](/guide/monitoring/enable-monitoring.qmd)]
-- You use the {{< var validmind.developer >}} to automatically populate the monitoring template for your model with data, providing a comprehensive view of your model’s performance over time.
+- You can enable monitoring for both new and existing records.^[[Enable monitoring](/guide/monitoring/enable-monitoring.qmd)]
+- You use the {{< var validmind.developer >}} to automatically populate the monitoring template for your record with data, providing a comprehensive view of your record’s performance over time.
 - You then access and examine these results within the {{< var validmind.platform >}}, allowing you to identify any deviations from expected performance and take corrective actions as needed.^[[Review monitoring results](/guide/monitoring/review-monitoring-results.qmd)]
 - Once generated via the {{< var validmind.developer >}}, view and add metrics over time to your ongoing monitoring reports in the {{< var validmind.platform >}}.^[[Work with metrics over time](/guide/monitoring/work-with-metrics-over-time.qmd)]
\ No newline at end of file
diff --git a/site/faq/_faq-progress-model.qmd b/site/faq/_faq-progress-workflow.qmd
similarity index 53%
rename from site/faq/_faq-progress-model.qmd
rename to site/faq/_faq-progress-workflow.qmd
index aebd3a98eb..dd9e0f62b3 100644
--- a/site/faq/_faq-progress-model.qmd
+++ b/site/faq/_faq-progress-workflow.qmd
@@ -2,8 +2,8 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-## How do I progress a model along in its lifecycle within {{< var vm.product >}}?
+## How do I progress a record along in its lifecycle within {{< var vm.product >}}?
 
-Transition a model along in the workflow, for example for review with the next set of stakeholders, by changing a model's status.
+Transition a record (such as a model) along in the workflow, for example for review with the next set of stakeholders, by changing the record's status.
 
 {{< include /guide/workflows/_transition-workflow-examples.qmd >}}
\ No newline at end of file
diff --git a/site/faq/_faq-record-updates.qmd b/site/faq/_faq-record-updates.qmd
new file mode 100644
index 0000000000..739040675e
--- /dev/null
+++ b/site/faq/_faq-record-updates.qmd
@@ -0,0 +1,9 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+## How does {{< var vm.product >}} manage updates to records?
+
+1. {{< var vm.product >}} allows developers to re-run documentation functions with the {{< var validmind.developer >}}^[[{{< var validmind.developer >}}](/developer/validmind-library.qmd)] to capture changes in the record (for example, a model), such as changes in the number of features or hyperparameters.
+2. After a developer has made a change in their development environment, such as to a Jupyter Notebook,^[[Code samples](/developer/samples-jupyter-notebooks.qmd)] they can execute the relevant {{< var vm.product >}} documentation function to update the corresponding documentation section. 
+3. {{< var vm.product >}} will then automatically recreate the relevant figures and tables and update them in the online documentation.
\ No newline at end of file
diff --git a/site/faq/_faq-tracking.qmd b/site/faq/_faq-tracking.qmd
index 82ae4cc508..2a8c460248 100644
--- a/site/faq/_faq-tracking.qmd
+++ b/site/faq/_faq-tracking.qmd
@@ -4,5 +4,5 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 ## Can I use {{< var vm.product >}} to track milestone dates?
 
-- Yes, the {{< var validmind.platform >}} includes support for custom inventory fields, including those for dates and date time — allowing you to track important dates throughout the model risk management lifecycle unique to your workflow.
+- Yes, the {{< var validmind.platform >}} includes support for custom inventory fields, including those for dates and date time — allowing you to track important dates throughout the risk management lifecycle unique to your workflow.
 - In addition, calculation type custom inventory fields can draw upon date and date time values, allowing you to automatically calculate next review, revalidation, ongoing monitoring deadlines, or any other desired date. 
diff --git a/site/faq/faq-collaboration.qmd b/site/faq/faq-collaboration.qmd
index c1901b8180..76e1dd16ac 100644
--- a/site/faq/faq-collaboration.qmd
+++ b/site/faq/faq-collaboration.qmd
@@ -4,8 +4,6 @@
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
 title: "Collaboration"
 date: last-modified
-aliases:
-  - /guide/faq-workflows.html
 listing:
   - id: faq-collaboration
     type: grid
@@ -17,15 +15,15 @@ listing:
     - ../guide/inventory/view-record-activity.qmd
     - ../guide/documentation/collaborate-with-others.qmd
     - ../guide/workflows/working-with-workflows.qmd
-categories: ["real-time collaboration", "documents","documentation", "record activity", "auditing", "workflows", "model lifecycle", "validmind platform"]
+categories: ["real-time collaboration", "documents","documentation", "record activity", "auditing", "workflows", "lifecycle", "validmind platform"]
 ---
 
 {{< include _faq-activity.qmd >}}
 
 ## What real-time collaboration features does {{< var vm.product >}} offer?
 
-- You can simultaneously edit model documents, leave and respond to comments or suggestions all within the {{< var validmind.platform >}}.
-- You can also saved named versions of edits to retain specific revisions, and any changes to model documents are automatically logged on your model's activity feed.
+- You can simultaneously edit documents, and leave and respond to comments or suggestions, all within the {{< var validmind.platform >}}.
+- You can also save named versions of edits to retain specific revisions, and any changes to documents are automatically logged on your record's activity feed.
 
 ::: {.callout}
 ## Multiple users are able to simultaneously edit documents in the {{< var validmind.platform >}}. 
@@ -33,7 +31,7 @@ categories: ["real-time collaboration", "documents","documentation", "record act
 If two users are editing the same cell within {{< var vm.platform >}}, the most recently saved version of the content will prevail. 
 :::
 
-{{< include _faq-progress-model.qmd >}}
+{{< include _faq-progress-workflow.qmd >}}
 
 
 <!-- BELOW REMOVED ON REQUEST AS PER SC-6528 -->
@@ -45,6 +43,6 @@ If two users are editing the same cell within {{< var vm.platform >}}, the most
 
 ## Learn more
 
-:::{#faq-validation}
+:::{#faq-collaboration}
 :::
 
diff --git a/site/faq/faq-documentation.qmd b/site/faq/faq-documentation.qmd
index 244940cf56..bd78fd0859 100644
--- a/site/faq/faq-documentation.qmd
+++ b/site/faq/faq-documentation.qmd
@@ -2,7 +2,7 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Model documents and templates"
+title: "Documents and templates"
 date: last-modified
 aliases:
   - /guide/faq-documentation.html
@@ -23,7 +23,7 @@ categories: ["templates", "documents", "documentation","customization", "images"
 
 {{< var vm.product >}} provides the following default template types:[^1]
 
-- Development (model documentation)
+- Development (documentation)
 - Validation (validation reports)
 - Monitoring (ongoing monitoring reports)
 
@@ -31,7 +31,7 @@ You can also create custom document types and associated templates to suit your
 
 ## Can templates be customized for our use cases?
 
-Yes, the {{< var validmind.platform >}}[^2] allows you to configure versioned templates based on document requirements for each model or lifecycle use case.
+Yes, the {{< var validmind.platform >}}[^2] allows you to configure versioned templates based on document requirements for each record (such as a model) or lifecycle use case.
 
 - {{< var vm.product >}}'s templates are fully customizable,[^3] and are complemented by the ability to manage validation guidelines.
 - You can swap between different versions of templates or apply another version of the current template.[^4]
@@ -41,17 +41,17 @@ By default, the [{{< fa hand >}} Customer Admin]{.bubble} role[^5] has sufficien
 
 ## Can documents be created right in the {{< var validmind.platform >}}?
 
-Yes, you can work with model documentation, validation reports, ongoing monitoring reports, or any other document type directly in the {{< var validmind.platform >}}, without having to first generate anything using the {{< var validmind.developer >}}.[^6]
+Yes, you can work with documentation, validation reports, ongoing monitoring reports, or any other document type directly in the {{< var validmind.platform >}}, without having to first generate anything using the {{< var validmind.developer >}}.[^6]
 
 1. Add and edit text on any document within the {{< var vm.platform >}} using our content editing toolbar.[^7]
 2. Using the {{< var vm.developer >}}, execute test suites and generate the corresponding supporting results. These results can then be added to your documents within the {{< var vm.platform >}}.[^8]
 
-## Can I run tests and log documentation without a model? 
-<span id="no-available-model"><span>
-Yes! If you do not have a model ready, or your model can't be loaded directly, or you only have access to model predictions, you can still run tests and log documentation using the {{< var validmind.developer >}} as long as you're able to load the model predictions.
+## Can I run tests and log documentation without a record?
+<span id="no-available-model"></span>
+Yes! If you do not have a record (such as a model) ready, or your record can't be loaded directly, or you only have access to predictions, you can still run tests and log documentation using the {{< var validmind.developer >}} as long as you're able to load the predictions.
 
 - Use `assign_predictions()`[^9] to load predictions from a separate file or a dataset with predictions.
-- Call `init_model()`[^10] but instead of a trained model instance, pass an `input_id` and model metadata. `ModelMetadata()`[^11] will use the provided metadata instead of trying to calculate it from the model's library. 
+- Call `init_model()`[^10] to create a model object, but instead of a trained instance, pass an `input_id` and model metadata. `ModelMetadata()`[^11] will use the provided metadata instead of trying to calculate it from the model's library.
 
 
 ::: {.column-margin}
@@ -65,8 +65,10 @@ Yes! If you do not have a model ready, or your model can't be loaded directly, o
 ```
 :::
 
-::: {.callout title="If neither a trained model instance nor metadata is provided, `init_model()` will return an error.  "}
-However, tests that need a trained model will not work with "empty" models.
+::: {.callout title="If neither a trained instance nor metadata is provided, `init_model()` will return an error."}
+- However, tests that need a trained model will not work with "empty" models.
+- Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with {{< var vm.product >}}.
+
 :::
 
 {{< include _faq-attachments.qmd >}}
diff --git a/site/faq/faq-integrations.qmd b/site/faq/faq-integrations.qmd
index f217833b1e..e1be635668 100644
--- a/site/faq/faq-integrations.qmd
+++ b/site/faq/faq-integrations.qmd
@@ -14,7 +14,7 @@ listing:
     sort: false
     fields: [title, description]
     contents:
-    - ../developer/supported-models-and-frameworks.qmd
+    - ../developer/supported-records-and-frameworks.qmd
     - ../about/overview-llm-features.qmd
     - ../about/deployment/deployment-options.qmd
 categories: ["supported libraries", "supported languages", "integrations", "images", "large language models", "explainability", "deployment options", "validmind library"]
@@ -22,7 +22,7 @@ categories: ["supported libraries", "supported languages", "integrations", "imag
 
 ## Which languages, libraries, and environments do you support?
 
-- The {{< var validmind.developer >}}[^1] is designed to be platform-agnostic and compatible with most popular open-source programming languages and model development environments in Python and R,[^2] from XGBoost to more sophisticated libraries such as Pytorch and TensorFlow — and many more.
+- The {{< var validmind.developer >}}[^1] is designed to be platform-agnostic and compatible with most popular open-source programming languages and development environments in Python and R,[^2] from XGBoost to more sophisticated libraries such as PyTorch and TensorFlow — and many more.
 - We directly support Matplotlib[^3] and Plotly[^4] plotting libraries for visual representations, and you're able to return images from other libraries as bytes-like objects.[^5]
 
 ::: {.callout}
@@ -35,18 +35,18 @@ Support for commercial and closed-source programming languages such as SAS and M
 ## What test ingestion or modeling techniques are supported?
 
 - {{< var vm.product >}} supports ingesting test results from your training and evaluation pipeline, such as using batch prediction or online prediction mechanisms.[^6]
-- We are also offer standard documentation via the {{< var vm.developer >}} for additional modeling techniques.[^7] 
+- We also offer standard documentation via the {{< var vm.developer >}} for additional modeling techniques.[^7]
 
 {{< include _faq-images.qmd >}}
 
 ## What large language model (LLM) features are offered?
 
-{{< var vm.product >}} offers several specialized features that use large language models (LLMs) to streamline model risk management and ensure regulatory compliance:
+{{< var vm.product >}} offers several specialized features that use large language models (LLMs) to streamline risk management and ensure regulatory compliance:
  
 - **Test interpretation** — Interprets results from tests run within {{< var vm.product >}}.
-- **Qualitative checks** — Leverages metadata from the model inventory, test outcomes, and additional data provided to create qualitative sections within model documentation.
-- **Risk assessment** — Using data from test results, generates a tailored risk assessment for each section of model documentation.
-- **{{< var validmind.checker >}}**[^8] — Reviews documents such as model documentation or validation reports to ensure documents aligns with relevant regulatory requirements.
+- **Qualitative checks** — Leverages metadata from the inventory, test outcomes, and additional data provided to create qualitative sections within documentation.
+- **Risk assessment** — Using data from test results, generates a tailored risk assessment for each section of documentation.
+- **{{< var validmind.checker >}}**[^8] — Reviews documents such as documentation or validation reports to ensure they align with relevant regulatory requirements.
 
 {{< include _faq-explainability.qmd >}}
 
@@ -54,24 +54,6 @@ Support for commercial and closed-source programming languages such as SAS and M
 
 {{< include /about/deployment/_deployment-available-options.qmd >}}
 
-<!-- BELOW REMOVED AFTER ANDRES CONFIRMED WE DON'T SUPPORT DATA DICTIONARIES IN A WAY OUR USERS WOULD EXPECT - BC (Nov 27, 2024) -->
-
-<!-- ## Does {{< var vm.product >}} support data dictionaries?
-
-Yes, you can pass data dictionaries to {{< var vm.product >}} via the {{< var vm.developer >}}, such as in CSV format. -->
-
-<!-- BELOW REMOVED ON REQUEST AS PER SC-6528 -->
-
-<!-- ## Can you integrate with JIRA to connect with our Model Development pipeline?
-
-{{< var vm.product >}} is planning to provide integration with JIRA tickets via the JIRA Python API. You will be able to configure {{< var vm.product >}} to update the status of a particular JIRA ticket when a specific state or approval is triggered from the workflow (roadmap item – Q3’2023). -->
-
-<!-- ## Do you support integration with data lakes and ETL solutions?
-
-Support for connecting to data lakes and data processing or ETL pipelines is on our roadmap (Q3’2023+).
-
-We will be implementing connector interfaces allowing extraction of relationships between raw data sources and final post-processed datasets for preloaded session instances received from Spark and Snowflake. -->
-
 ## Learn more
 
 :::{#faq-integrations}
@@ -82,16 +64,16 @@ We will be implementing connector interfaces allowing extraction of relationship
 
 [^1]: [{{< var validmind.developer >}}](/developer/validmind-library.qmd)
 
-[^2]: [Supported models and frameworks](/developer/supported-models-and-frameworks.qmd)
+[^2]: [Supported records and frameworks](/developer/supported-records-and-frameworks.qmd)
 
 [^3]: [Matplotlib](https://matplotlib.org/)
 
 [^4]: [Plotly](https://plotly.com/)
 
-[^5]: [Do you support including images in model documents?](#images)
+[^5]: [Do you support including images in documents?](#images)
 
 [^6]: [Load dataset predictions](/notebooks/how_to/data_and_datasets/dataset_inputs/load_datasets_predictions.ipynb)
 
-[^7]: [Do you include explainability-related testing and documentation?](#explanability)
+[^7]: [Do you include explainability-related testing and documentation?](#explainability)
 
 [^8]: [Customize {{< var validmind.checker >}}](/guide/templates/customize-document-checker.qmd)
\ No newline at end of file
diff --git a/site/faq/faq-inventory.qmd b/site/faq/faq-inventory.qmd
index 1aa5bf9ccc..3cb987a699 100644
--- a/site/faq/faq-inventory.qmd
+++ b/site/faq/faq-inventory.qmd
@@ -2,7 +2,7 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Model inventory and activity"
+title: "Inventory and activity"
 date: last-modified
 aliases:
   - /guide/faq-inventory.html
@@ -17,47 +17,47 @@ listing:
     - ../guide/inventory/view-record-activity.qmd
     - ../guide/inventory/working-with-the-inventory.qmd
     - ../guide/inventory/managing-the-inventory.qmd
-categories: ["record activity", "model registration", "model inventory", "customization", "model stages", "model interdependencies", "auditing", "exports", "validmind platform"]
+categories: ["inventory", "inventory registration", "inventory customization", "inventory interdependencies", "activity", "auditing", "exports", "validmind platform"]
 ---
 
 {{< include _faq-activity.qmd >}}
 
-## How do I register models with {{< var vm.product >}}?
+## How do I register records with {{< var vm.product >}}?
 
-- Register models within the {{< var validmind.platform >}} via the model inventory as the first step towards streamlining your model documentation and validation workflow.
-- To add a model to the inventory, you fill out a customizable questionnaire capturing the required registration metadata.[^1]
+- Register records (such as models) within the {{< var validmind.platform >}} via the inventory as the first step towards streamlining your documentation and validation workflow.
+- To add a record to the inventory, you fill out a customizable questionnaire capturing the required registration metadata.[^1]
 
-By default, the [{{< fa code >}} Developer]{.bubble} role[^2] has sufficient permissions to register models.
+By default, the [{{< fa code >}} Developer]{.bubble} role[^2] has sufficient permissions to register records.
 
-## Are model registration questionnaires customizable?
+## Are registration questionnaires customizable?
 
-- Yes, along with default fields provided by {{< var vm.product >}} as part of your basic model information, you can add additional model information and make these custom fields required when creating models.[^3]
+- Yes, along with default fields provided by {{< var vm.product >}} as part of your basic record (model) information, you can add additional record information and make these custom fields required when creating records.[^3]
 - You can modify these custom fields as needed and on an ongoing basis.
 
-By default, the [{{< fa hand >}} Customer Admin]{.bubble} role has sufficient permissions to manage model inventory fields.
+By default, the [{{< fa hand >}} Customer Admin]{.bubble} role has sufficient permissions to manage inventory fields.
 
-## Can the {{< var vm.product >}} model inventory be customized?
+## Can the {{< var vm.product >}} inventory be customized?
 
-- Yes, information that is displayed on the model inventory is configurable on a per user basis. 
-- You can also search, filter, and sort models to narrow down results.  
-- Fields that appear on all models for all users can also be customized.
+- Yes, information that is displayed on the inventory is configurable on a per user basis. 
+- You can also search, filter, and sort records (such as models) to narrow down results.  
+- Fields that appear on all records for all users can also be customized.
  
- By default, the [{{< fa hand >}} Customer Admin]{.bubble} role has sufficient permissions to manage model inventory fields.
+ By default, the [{{< fa hand >}} Customer Admin]{.bubble} role has sufficient permissions to manage inventory fields.
 
-## Can I archive or delete models within {{< var vm.product >}}?
+## Can I archive or delete records within {{< var vm.product >}}?
 
-Yes, models can be archived within the {{< var validmind.platform >}} model inventory to keep your inventory accurate and up to date with your organization’s current resources.[^4]
+Yes, records (such as models) can be archived within the {{< var validmind.platform >}} inventory to keep your inventory accurate and up to date with your organization’s current resources.[^4]
 
-By default, the [{{< fa hand >}} Customer Admin]{.bubble} role has sufficient permissions to archive and delete models.
+By default, the [{{< fa hand >}} Customer Admin]{.bubble} role has sufficient permissions to archive and delete records.
 
-## Can I track model interdependencies within the model inventory?
+## Can I track interdependencies within the inventory?
 
-- Yes, the {{< var validmind.platform >}} allows you to connect two or more models together in your model inventory.[^5] 
-- You can note both upstream and downstream models.
+- Yes, the {{< var validmind.platform >}} allows you to connect two or more records (models) together in your inventory.[^5] 
+- You can note both upstream and downstream records.
 
-By default, the [{{< fa code >}} Developer]{.bubble} role has sufficient permissions to edit model interdependencies.
+By default, the [{{< fa code >}} Developer]{.bubble} role has sufficient permissions to edit record interdependencies.
 
-{{< include _faq-model-updates.qmd >}}
+{{< include _faq-record-updates.qmd >}}
 
 {{< include _faq-tracking.qmd >}}
 
@@ -69,12 +69,12 @@ By default, the [{{< fa code >}} Developer]{.bubble} role has sufficient permiss
 
 <!-- FOOTNOTES -->
 
-[^1]: [Register records in the inventory](/guide/inventory/working-with-the-inventory.qmd)
+[^1]: [Register records in the inventory](/guide/inventory/register-records-in-inventory.qmd)
 
 [^2]: [Manage permissions](/guide/configuration/manage-permissions.qmd)
 
 [^3]: [Manage inventory fields](/guide/inventory/manage-inventory-fields.qmd)
 
-[^4]: [Archive and delete models](/guide/inventory/archive-delete-records.qmd)
+[^4]: [Archive and delete records](/guide/inventory/archive-delete-records.qmd)
 
-[^5]: [Configure model interdependencies](/guide/inventory/configure-record-interdependencies.qmd)
\ No newline at end of file
+[^5]: [Configure record interdependencies](/guide/inventory/configure-record-interdependencies.qmd)
\ No newline at end of file
diff --git a/site/faq/faq-organizations.qmd b/site/faq/faq-organizations.qmd
index 4a6818d07f..4709d309a5 100644
--- a/site/faq/faq-organizations.qmd
+++ b/site/faq/faq-organizations.qmd
@@ -19,19 +19,19 @@ categories: ["access", "permissions", "organizations", "user registration", "val
 
 ## How do I get access to {{< var vm.product >}}?
 
-#### 1. Register with ValidMind
+#### 1. Register with {{< var vm.product >}}
 
-- First register with our cloud-hosted {{< var validmind.platform >}},[^1] which enables you to work with model documentation or configure ValidMind for your organization.
-- With an email address or a Google, GitHub, or Microsoft account, you can gain access to ValidMind either by signing up independently, or by accepting an invite from another member of your organization.
+- First register with our cloud-hosted {{< var validmind.platform >}},[^1] which enables you to work with documentation or configure {{< var vm.product >}} for your organization.
+- With an email address or a Google, GitHub, or Microsoft account, you can gain access to {{< var vm.product >}} either by signing up independently, or by accepting an invite from another member of your organization.
 
-#### 2. Log in to ValidMind
+#### 2. Log in to {{< var vm.product >}}
 
 - Once you've signed up or accepted an invite, log in to the {{< var validmind.platform >}}.[^2]
-- {{< var vm.product >}} supports logging in via both the public interent and private network endpoints.
+- {{< var vm.product >}} supports logging in via both the public internet and private network endpoints.
 
 ## What are organizations within {{< var vm.product >}}?
 
-Access to the {{< var validmind.platform >}} where your model inventory is hosted is associated with an organization,[^3] which encompasses all your users, groups, and business units. 
+Access to the {{< var validmind.platform >}} where your inventory is hosted is associated with an organization,[^3] which encompasses all your users, groups, and business units. 
 
 - As a user,[^4] you can belong to multiple organizations.
 - You will see the option to switch between organizations only if you belong to more than one organization.
@@ -46,8 +46,8 @@ By default, the [{{< fa hand >}} Customer Admin]{.bubble} role[^5] has sufficien
 
 ## How do user roles, user groups, and access permissions work? 
 
- - Users belong to groups which determine which models they can see, and have roles with attached permissions which define the level of access they have to features.
- - Groups are segments of users with the ability to view models associated with that group. Access to granular features in the {{< var vm.platform >}} within a group’s set of models is further defined by roles and permissions.
+ - Users belong to groups which determine which records (such as models) they can see, and have roles with attached permissions which define the level of access they have to features.
+ - Groups are segments of users with the ability to view records associated with that group. Access to granular features in the {{< var vm.platform >}} within a group’s set of records is further defined by roles and permissions.
  - Roles are a named set of permissions that determine your users’ access to features within the {{< var vm.platform >}} based on your organization’s structure. 
  - Permissions dictate user access controls within the {{< var vm.platform >}}, and are associated with specific roles.
 
diff --git a/site/faq/faq-privacy.qmd b/site/faq/faq-privacy.qmd
index 79644eb4e9..b2468c25e0 100644
--- a/site/faq/faq-privacy.qmd
+++ b/site/faq/faq-privacy.qmd
@@ -28,12 +28,12 @@ categories: ["data handling", "privacy", "confidentiality", "record activity", "
 
 Access to the {{< var validmind.platform >}} is facilitated through AWS PrivateLink, which provides private connectivity between {{< var vm.product >}} and your on-premises networks without exposing your traffic to the public internet.[^2]
 
-## What model assets are automatically imported into {{< var vm.product >}}?
+## What assets are automatically imported into {{< var vm.product >}}?
 
 {{< var vm.product >}} stores the following assets in documents via our {{< var validmind.api >}}:
 
-- Dataset and model metadata which allow generating documentation snippets programmatically (example: stored definition for "common logistic regression limitations" when a logistic regression model has been passed to the {{< var vm.product >}} test suite execution)
-- Quality and performance metrics collected from the dataset and model
+- Dataset and model object metadata (for any type of record) which allow generating documentation snippets programmatically (example: stored definition for "common logistic regression limitations" when a logistic regression model has been passed to the {{< var vm.product >}} test suite execution)
+- Quality and performance metrics collected from the dataset and record
 - Outputs from executed test suites
 - Images, plots, and visuals generated as part of extracting metrics and running tests
 
@@ -55,32 +55,7 @@ Furthermore, {{< var vm.product >}}'s data retention policy complies with the SO
 
 {{< include _faq-activity.qmd >}}
 
-{{< include _faq-model-updates.qmd >}}
-
-<!-- BELOW REMOVED AFTER ANDRES CONFIRMED WE DON'T SUPPORT SPARK DATAFRAMES IN A WAY OUR USERS WOULD EXPECT - BC (Nov 27, 2024) -->
-
-<!-- ## Can you accommodate Spark DataFrames?
-
-- Yes, the {{< var validmind.developer >}} can extract dataset quality metrics on Pandas DataFrame, NumPy arrays, or Spark DataFrame instances using standard metrics provided by popular open-source frameworks such as scikit-learn, statsmodels, and more.
-- Each test defines a mapping to the different supported dataset and/or model interfaces — when passing a Spark DataFrame, the {{< var vm.developer >}} will directly call native evaluation metrics provided by the SparkML API or custom ones built by the developer, such as via UDFs. -->
-
-<!-- BELOW REMOVED ON REQUEST AS PER SC-6528 -->
-
-<!-- ## How does {{< var vm.product >}} handle end-user computing and spreadsheet models?
-
-Customers can register spreadsheet models in the model inventory and centralize tracking of the associated documentation files with the inventory metadata (roadmap item – Q3’2023). However, {{< var vm.product >}} cannot automate documentation generation for spreadsheet models. -->
-
-<!-- ## Can the tool automatically document other non-standard ETL steps or performance metrics from notebooks?
-
-Support for more complex data processing pipelines is on our roadmap, currently scheduled for Q4'2023. We are implementing connector interfaces that will allow us to extract relationships between raw data sources and final post-processed datasets for Spark and Snowflake. -->
-
-<!-- ## Can we customize illustrations?
-
-{{< var vm.product >}} utilizes open-source libraries (such as Seaborn and Matplotlib) to generate plots and illustrations. We are working on implementing the ability for model developers to customize styling parameters for these libraries directly within the {{< var vm.developer >}}.
-
-This feature is currently scheduled for Q4 2023.
-
-Additionally, {{< var vm.product >}} is developing a feature that enables developers to create custom visualization widgets by writing JavaScript-based rendering code. -->
+{{< include _faq-record-updates.qmd >}}
 
 ## Learn more
 
diff --git a/site/faq/faq-reporting.qmd b/site/faq/faq-reporting.qmd
index 0b9abd046a..c672652c5f 100644
--- a/site/faq/faq-reporting.qmd
+++ b/site/faq/faq-reporting.qmd
@@ -22,7 +22,7 @@ categories: ["exports", "analytics", "reports", "ongoing monitoring", "validmind
 
 ## What analytic features are offered by {{< var vm.product >}}?
 
-- Out-of-the-box reports within the {{< var validmind.platform >}}[^1] are broken down by data on models and data on artifacts.
+- Out-of-the-box reports within the {{< var validmind.platform >}}[^1] are broken down by data on records (such as models) and data on artifacts.
 - For each of the bar charts, you can hover for numerical breakdowns or click on individual bars to get a more detailed view.[^2]
 - You're also able to add custom report pages and analytic widgets to supplement the out-of-the-box reports provided.[^3] 
 
diff --git a/site/faq/faq-testing.qmd b/site/faq/faq-testing.qmd
index eeea2514f0..6f82ab1694 100644
--- a/site/faq/faq-testing.qmd
+++ b/site/faq/faq-testing.qmd
@@ -15,30 +15,32 @@ listing:
     fields: [title, description]
     contents:
     - ../developer/how-to/testing-overview.qmd
-    - ../developer/test-descriptions.qmd
+    - title: "{{< var vm.product >}} test sandbox"
+      description: "Tests that are available as part of the {{< var validmind.developer >}}, grouped by type of validation or monitoring test."
+      path: ../developer/how-to/test-sandbox.qmd
     - ../guide/monitoring/ongoing-monitoring.qmd
-categories: ["testing", "model documentation", "customization", "custom data", "explainability", "ongoing monitoring", "validmind library"]
+categories: ["testing", "documentation", "customization", "custom data", "explainability", "ongoing monitoring", "validmind library"]
 ---
 
 ## How do the out-of-the-box tests developed by {{< var vm.product >}} work?
 
 All the default tests are developed using open-source Python and R libraries.
 
-The {{< var validmind.developer >}}[^1] test interface is a light wrapper that defines utility functions to agnostically interact with different dataset and model backends, and contains functions to collect and post results to the {{< var validmind.platform >}}[^2] using a generic results schema.
+The {{< var validmind.developer >}}[^1] test interface is a light wrapper that defines utility functions to agnostically interact with different dataset and record (model) backends, and contains functions to collect and post results to the {{< var validmind.platform >}}[^2] using a generic results schema.
 
-## When do I use tests and tests suites?
+## When do I use tests and test suites?
 
 While you have the flexibility to decide when to use which {{< var vm.product >}} tests, here are a few typical scenarios:[^3]
 
 - **Dataset testing** — To document and validate your dataset.
-- **Model testing** — To document and validate your model.
+- **Model testing** — To document and validate your record, such as a model.
 - **End-to-end testing** — To document a binary classification model and the relevant dataset end-to-end.
 
 ## Can we configure, customize, or add our own tests?
 
 Yes, {{< var vm.product >}} allows tests to be manipulated at several levels:
 
-- You can configure which tests are required to run programmatically depending on the model use case.[^4]
+- You can configure which tests are required to run programmatically depending on the record's use case.[^4]
 - You can change the thresholds and parameters for default tests already available in the {{< var vm.developer >}} — for instance, changing the threshold parameter for the class imbalance flag.[^5]
 - You can also connect your own custom tests with the {{< var validmind.developer >}}. These custom tests are configurable and are able to run programmatically, just like the rest of the {{< var vm.developer >}}.[^6]
 - Personalize tests further for your use case by using {{< var vm.product >}}'s `RawData` feature[^7] to customize the output of tests.
@@ -49,32 +51,32 @@ In addition to custom tests, you can also add use case and test-specific context
 
 ## How do I log tests as a developer?
 
-You use the {{< var validmind.developer >}} to run and log tests during model development, the results of which are then inserted your model documentation within the {{< var validmind.platform >}}.[^9] The {{< var vm.developer >}} also automatically generates draft test descriptions for your test results — generations that can be modified for your custom use cases.[^10]
+You use the {{< var validmind.developer >}} to run and log tests during development, the results of which are then inserted into your documentation within the {{< var validmind.platform >}}.[^9] The {{< var vm.developer >}} also automatically generates draft test descriptions for your test results — generations that can be modified for your custom use cases.[^10]
 
 To log tests as a developer with the {{< var validmind.developer >}}:
 
-- You must have the [{{< fa code >}} Developer]{.bubble} role[^11] or another role with sufficient permissions to create and own models, and to work with model documentation.
-- You must be the model owner or model developer, but not the model validator,[^12] for the model you want to log tests and update documentation for.
+- You must have the [{{< fa code >}} Developer]{.bubble} role[^11] or another role with sufficient permissions to create and own records (models), and to work with documentation.
+- You must be the record owner or record developer, but not the record validator,[^12] for the record you want to log tests and update documentation for.
 
 ::: {.callout}
 ## Want to learn how to use {{< var vm.product >}} as a developer?
 
-Check out our introductory series — [**{{< var vm.product >}} for model development**](/developer/validmind-library.qmd#for-model-development)
+Check out our introductory series — [**{{< var vm.product >}} for development**](/developer/validmind-library.qmd#development)
 :::
 
 ## How do I log tests as a validator?
 
-You use the {{< var validmind.developer >}} to run and log tests during model validation, the results of which are then inserted your validation report within the {{< var validmind.platform >}}.[^13] The {{< var vm.developer >}} also automatically generates draft test descriptions for your test results — generations that can be modified for your custom use cases.[^14]
+You use the {{< var validmind.developer >}} to run and log tests during validation, the results of which are then inserted into your validation report within the {{< var validmind.platform >}}.[^13] The {{< var vm.developer >}} also automatically generates draft test descriptions for your test results — generations that can be modified for your custom use cases.[^14]
 
 To log tests as a validator with the {{< var validmind.developer >}}:
 
-- You must have the [{{< fa circle-check >}} Validator]{.bubble} role[^15] or another role with sufficient permissions to access models for validation, to review model documentation, and to work with validation reports and model artifacts.
-- You must be the model validator, but not the model owner or model developer,[^16] for the model you want to log tests and update documentation for.
+- You must have the [{{< fa circle-check >}} Validator]{.bubble} role[^15] or another role with sufficient permissions to access records (models) for validation, to review documentation, and to work with validation reports and artifacts.
+- You must be the record validator, but not the record owner or record developer,[^16] for the record you want to log tests and update documentation for.
 
 ::: {.callout}
 ## Want to learn how to use {{< var vm.product >}} as a validator?
 
-Check out our introductory series — [**{{< var vm.product >}} for model validation**](/developer/validmind-library.qmd#for-model-validation)
+Check out our introductory series — [**{{< var vm.product >}} for validation**](/developer/validmind-library.qmd#validation)
 :::
 
 {{< include _faq-explainability.qmd >}}
@@ -115,7 +117,7 @@ Check out our introductory series — [**{{< var vm.product >}} for model valida
 
 [^12]: [Manage record stakeholder types](/guide/configuration/manage-record-stakeholder-types.qmd)
 
-[^13]: [Assess compliance](/guide/validation/assess-compliance.qmd#link-validator-evidence)
+[^13]: [Assess compliance](/guide/validation/assess-compliance.qmd#map-evidence)
 
 [^14]: [Can we configure, customize, or add our own tests?](#can-we-configure-customize-or-add-our-own-tests)
 
diff --git a/site/faq/faq-validation.qmd b/site/faq/faq-validation.qmd
index ee56299e2a..741abe5beb 100644
--- a/site/faq/faq-validation.qmd
+++ b/site/faq/faq-validation.qmd
@@ -2,10 +2,8 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Model validation and artifacts"
+title: "Validation and artifacts"
 date: last-modified
-aliases:
-  - /guide/faq-documentation.html
 listing:
   - id: faq-validation
     type: grid
@@ -17,7 +15,7 @@ listing:
     - ../guide/validation/manage-validation-guidelines.qmd
     - ../guide/validation/preparing-validation-reports.qmd
     - ../guide/validation/working-with-artifacts.qmd
-categories: ["model validation", "validation guidelines", "model artifacts", "findings", "model documentation", "templates", "compliance", "validmind platform"]
+categories: ["validation", "validation guidelines", "artifacts", "findings", "documentation", "templates", "compliance", "validmind platform"]
 ---
 
 ## Can I set up custom validation guidelines for use in templates?
@@ -29,9 +27,9 @@ Yes, {{< var vm.product >}} supports the implementation of custom validation gui
 
 By default, the [{{< fa hand >}} Customer Admin]{.bubble} role[^2] has sufficient permissions to manage validation guidelines. 
 
-## How does {{< var vm.product >}} help with assessing model compliance?
+## How does {{< var vm.product >}} help with assessing compliance?
 
-Use {{< var vm.product >}} to assess compliance of your models with guidelines based on analyzing evidence and artifacts (findings),[^3] providing an unbiased starting point that enables more efficient discussions between validators and developers.
+Use {{< var vm.product >}} to assess compliance of your records (such as models) with guidelines based on analyzing evidence and artifacts (findings),[^3] providing an unbiased starting point that enables more efficient discussions between validators and developers.
 
 Without leaving the {{< var validmind.platform >}}, you're able to:
 
@@ -39,19 +37,19 @@ Without leaving the {{< var validmind.platform >}}, you're able to:
 2. Link tracked artifacts to validation reports
 3. Provide granular compliance assessments for each section of your validation report
 
-By default, the [{{< fa circle-check >}} Validator]{.bubble} role has sufficient permissions to assess model compliance on validation reports.
+By default, the [{{< fa circle-check >}} Validator]{.bubble} role has sufficient permissions to assess compliance on validation reports.
 
-## What support does {{< var vm.product >}} offer for model artifacts?
+## What support does {{< var vm.product >}} offer for artifacts?
 
-- Within the {{< var validmind.platform >}}, you're able to log artifacts at the model or the documentation section level.[^4]
+- Within the {{< var validmind.platform >}}, you're able to log artifacts at the record (model) or the documentation section level.[^4]
 - On each artifact, you're able to outline proposed remediation plans, attach supporting documentation, track the artifact's status, attach the artifact to a risk area and/or documentation section, designate a due date, and assign a resolution owner. 
-- You can also access a complete list of filterable artifacts logged across all your models, or look at only artifacts linked to a specific model.[^5]
+- You can also access a complete list of filterable artifacts logged across all your records, or look at only artifacts linked to a specific record.[^5]
 
-By default, the [{{< fa circle-check >}} Validator]{.bubble} role has sufficient permissions to manage model artifacts.
+By default, the [{{< fa circle-check >}} Validator]{.bubble} role has sufficient permissions to manage artifacts.
 
 ## Can I create custom artifact types?
 
-Yes, you can create custom artifact types to track categories of observations beyond the default types (Validation Issue, Policy Exception, Model Limitation).[^6]
+Yes, you can create custom artifact types to track categories of observations beyond the default types (Validation Issue, Policy Exception, Limitation).[^6]
 
 Common examples include:
 
diff --git a/site/faq/faq-workflows.qmd b/site/faq/faq-workflows.qmd
index a11bf82fb3..5b9a1424c6 100644
--- a/site/faq/faq-workflows.qmd
+++ b/site/faq/faq-workflows.qmd
@@ -9,7 +9,7 @@ aliases:
 listing:
   - id: faq-workflows
     type: grid
-    grid-columns: 3
+    grid-columns: 2
     max-description-length: 250
     sort: false
     fields: [title, description]
@@ -18,12 +18,12 @@ listing:
     - ../guide/workflows/manage-record-stages.qmd
     - ../guide/inventory/manage-inventory-fields.qmd
     - ../guide/attestation/working-with-attestations.qmd
-categories: ["workflows", "model lifecycle", "lifecycle statuses", "attestations", "validmind platform", "validmind library"]
+categories: ["workflows", "lifecycle", "lifecycle statuses", "attestations", "validmind platform", "validmind library"]
 ---
 
 ## Can I customize workflows within {{< var vm.product >}}?
 
-- Yes, you can create custom workflows for the review and approval of models throughout their lifecycles with {{< var validmind.platform >}},[^1] enabling you to more easily oversee your organization's unique model risk management process. 
+- Yes, you can create custom workflows for the review and approval of records (such as models) throughout their lifecycles with the {{< var validmind.platform >}},[^1] enabling you to more easily oversee your organization's unique risk management process. 
 - For example, workflows can be configured to include any number of review stages involving different sets of stakeholders — at any point in the process.
 
 By default, the [{{< fa hand >}} Customer Admin]{.bubble} role[^2] has sufficient permissions to manage workflows.
@@ -35,19 +35,19 @@ By default, the [{{< fa hand >}} Customer Admin]{.bubble} role[^2] has sufficien
 
 By default, the [{{< fa hand >}} Customer Admin]{.bubble} role has sufficient permissions to manage lifecycle statuses.
 
-{{< include _faq-progress-model.qmd >}}
+{{< include _faq-progress-workflow.qmd >}}
 
 ## Can we work with disconnected workflows?
 
 Yes, {{< var vm.product >}} supports disconnected workflows natively at the data-collection level since the {{< var validmind.developer >}}[^3] creates individual test runs every time a new test iteration is executed. 
 
 - This allows for running parallel/disconnected tests that individually send results to the {{< var validmind.platform >}}.
-- Visualizing the disconnected workflow in terms of model testing and documentation will depend on requirements at the use-case level.
+- Visualizing the disconnected workflow in terms of testing and documentation will depend on requirements at the use-case level.
 
 ::: {.callout}
-## You can also leverage the {{< var validmind.developer >}} once you are ready to document a specific model for review and validation. 
+## You can also leverage the {{< var validmind.developer >}} once you are ready to document a specific record (model) for review and validation. 
 
-You do not need to use the {{< var validmind.platform >}} while you are in the exploration or R&D phase of model development.
+You do not need to use the {{< var validmind.platform >}} while you are in the exploration or R&D phase of development.
 :::
 
 {{< include _faq-attestations.qmd >}}
diff --git a/site/faq/faq.qmd b/site/faq/faq.qmd
index 74bf9a5488..50a718ba8e 100644
--- a/site/faq/faq.qmd
+++ b/site/faq/faq.qmd
@@ -18,11 +18,11 @@ listing:
     - path: faq-workflows.qmd
       title: "Workflows"
     - path: faq-inventory.qmd
-      title: "Model inventory and activity"
+      title: "Inventory and activity"
     - path: faq-documentation.qmd
-      title: "Model documents and templates"
+      title: "Documents and templates"
     - path: faq-validation.qmd
-      title: "Model validation and artifacts"
+      title: "Validation and artifacts"
     - path: faq-collaboration.qmd
       title: "Collaboration"
     - path: faq-reporting.qmd
diff --git a/site/get-started/_sidebar.yaml b/site/get-started/_sidebar.yaml
index 12e5b1ecb5..a92e0d79e7 100644
--- a/site/get-started/_sidebar.yaml
+++ b/site/get-started/_sidebar.yaml
@@ -8,9 +8,9 @@ website:
       title: "Get Started"
       contents:
         - text: "Quickstarts"
-        - text: "Model Development"
+        - text: "Development"
           file: get-started/developer/quickstart-developer.qmd
-        - text: "Model Validation"
+        - text: "Validation"
           file: get-started/validator/quickstart-validator.qmd
         - text: "Setup & Administration"
           file: get-started/administrator/quickstart-administrator.qmd
\ No newline at end of file
diff --git a/site/get-started/common-steps/_get-your-code-snippet.qmd b/site/get-started/common-steps/_get-your-code-snippet.qmd
index cdcd43ea5a..7c95e6c25d 100644
--- a/site/get-started/common-steps/_get-your-code-snippet.qmd
+++ b/site/get-started/common-steps/_get-your-code-snippet.qmd
@@ -2,9 +2,10 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-:::: {.content-visible unless-format="revealjs" when-meta="includes.developer"}
-Before we move on, let's also retrieve the unique *code snippet* for your model that enables you to connect your testing environment with the correct model in the {{< var validmind.platform >}}:
+Before we move on, let's also retrieve the unique *code snippet* for your model that enables you to connect your testing environment with the correct document in the {{< var validmind.platform >}}:
+
 
+:::: {.content-visible unless-format="revealjs" when-meta="includes.developer"}
 a. In the left sidebar that appears for your model, click **{{< fa rocket >}} Getting Started**.
 
 a. Select `Development` from the **[document]{.smallcaps}** drop-down menu.
@@ -17,8 +18,6 @@ a. Click **{{< fa regular copy >}} Copy snippet to clipboard**.
 
 
 :::: {.content-visible unless-format="revealjs" unless-meta="includes.developer"}
-Before we move on, let's also retrieve the unique *code snippet* for your model that enables you to connect your testing environment with the correct model in the {{< var validmind.platform >}}:
-
 a. In the left sidebar that appears for your model, click **{{< fa rocket >}} Getting Started**.
 
 a. Select `Validation` from the **[document]{.smallcaps}** drop-down menu.
diff --git a/site/get-started/common-steps/_register-your-first-model.qmd b/site/get-started/common-steps/_register-your-first-model.qmd
index 90b8e7000e..332c9ca023 100644
--- a/site/get-started/common-steps/_register-your-first-model.qmd
+++ b/site/get-started/common-steps/_register-your-first-model.qmd
@@ -5,16 +5,18 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 :::: {.content-visible unless-format="revealjs" when-meta="includes.developer"}
 a. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
-a. Click **{{< fa plus >}} Register New Model**.
+a. Under the **[record type]{.smallcaps}** drop-down, select `Model`.^[[Manage inventory record types](/guide/inventory/manage-inventory-record-types.qmd)]
 
-a. Enter in the **[model name]{.smallcaps}** and select any option for the following required fields:
+a. Click **{{< fa plus >}} Register Model**.
+
+a. Enter the **[model name]{.smallcaps}** and select any option for the following required fields:
 
    - **[business unit]{.smallcaps}**  — For example: `Finance`
    - **[prelimnary risk tier]{.smallcaps}** — For example: `1`
 
-a. Click **Next {{< fa angle-right >}}** to continue to assignment of model stakeholders.
+a. Click **Next {{< fa angle-right >}}** to continue to assignment of inventory record stakeholders.
 
-a. Select your own name under the **[model owner]{.smallcaps}** drop-down.
+a. Select your own name under the **[record owner]{.smallcaps}** drop-down.
 
 a. Click **Register Model** to add the model to your inventory.
 
@@ -22,13 +24,13 @@ a. Click **Register Model** to add the model to your inventory.
 
 ::: {.w-50-ns}
 
-![Registration modal with the options filled out for the model development quickstart](developer-new-model.png){fig-alt="A screenshot showing the registration modal with the options filled out for the model development quickstart" .screenshot group="developer-registration"}
+![Registration modal with the options filled out for the development quickstart](developer-new-model.png){fig-alt="A screenshot showing the registration modal with the options filled out for the development quickstart" .screenshot group="developer-registration"}
 
 :::
 
 ::: {.w-40-ns}
 
-![Model stakeholder selection step](/get-started/common-steps/select-model-owner.png){fig-alt="A screenshot showing the model stakeholder selection step" .screenshot group="developer-registration"}
+![Inventory record stakeholder selection step](/get-started/common-steps/select-model-owner.png){fig-alt="A screenshot showing the inventory record stakeholder selection step" .screenshot group="developer-registration"}
 
 :::
 
@@ -41,16 +43,18 @@ a. Click **Register Model** to add the model to your inventory.
 :::: {.content-visible unless-format="revealjs" unless-meta="includes.developer"}
 a. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
-a. Click **{{< fa plus >}} Register New Model**.
+a. Under the **[record type]{.smallcaps}** drop-down, select `Model`.^[[Manage inventory record types](/guide/inventory/manage-inventory-record-types.qmd)]
+
+a. Click **{{< fa plus >}} Register Model**.
 
-a. Enter in the **[model name]{.smallcaps}** and select any option for the following required fields:
+a. Enter the **[model name]{.smallcaps}** and select any option for the following required fields:
 
    - **[business unit]{.smallcaps}**  — For example: `Finance`
    - **[prelimnary risk tier]{.smallcaps}** — For example: `1`
 
-a. Click **Next {{< fa angle-right >}}** to continue to assignment of model stakeholders.
+a. Click **Next {{< fa angle-right >}}** to continue to assignment of inventory record stakeholders.
 
-a. Select your own name under the **[model owner]{.smallcaps}** drop-down — don't worry, we'll adjust these permissions next for validation.
+a. Select your own name under the **[record owner]{.smallcaps}** drop-down — don't worry, we'll adjust these permissions next for validation.
 
 a. Click **Register Model** to add the model to your inventory.
 
@@ -58,13 +62,13 @@ a. Click **Register Model** to add the model to your inventory.
 
 ::: {.w-50-ns}
 
-![Registration modal with the options filled out for the model validation quickstart](validator-new-model.png){fig-alt="A screenshot showing the registration modal with the options filled out for the model validation quickstart" .screenshot group="validator-registration"}
+![Registration modal with the options filled out for the validation quickstart](validator-new-model.png){fig-alt="A screenshot showing the registration modal with the options filled out for the validation quickstart" .screenshot group="validator-registration"}
 
 :::
 
 ::: {.w-40-ns}
 
-![Model stakeholder selection step](/get-started/common-steps/select-model-owner.png){fig-alt="A screenshot showing the model stakeholder selection step" .screenshot group="validator-registration"}
+![Inventory record stakeholder selection step](/get-started/common-steps/select-model-owner.png){fig-alt="A screenshot showing the inventory record stakeholder selection step" .screenshot group="validator-registration"}
 
 :::
 
@@ -74,4 +78,3 @@ a. Click **Register Model** to add the model to your inventory.
 
 
 
-
diff --git a/site/get-started/common-steps/_run-quickstart-notebook.qmd b/site/get-started/common-steps/_run-quickstart-notebook.qmd
index 4a44eb9f20..30d195ed57 100644
--- a/site/get-started/common-steps/_run-quickstart-notebook.qmd
+++ b/site/get-started/common-steps/_run-quickstart-notebook.qmd
@@ -4,21 +4,35 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 ### Run the quickstart notebook
 
+:::: {.content-visible unless-format="revealjs" when-meta="includes.developer"}
+::: {.callout title="Do you have your code snippet?"}
+
+To initialize the {{< var validmind.developer >}} which connects your environment to the correct model in the {{< var validmind.platform >}}, you'll need your unique code snippet!^[[Register your first record](#register-your-first-record): Click **3. Get your code snippet**]
+:::
+
+::::
+
+
+:::: {.content-visible unless-format="revealjs" unless-meta="includes.developer"}
 ::: {.callout title="Do you have your code snippet?"}
 
 To initialize the {{< var validmind.developer >}} which connects your environment to the correct model in the {{< var validmind.platform >}}, you'll need your unique code snippet!^[[Get your code snippet](#get-your-code-snippet)]
 :::
 
-1. Follow the instructions to run the first two code cells in the notebook,[^run-cells] which sets the stage by installing and initializing {{< var vm.product >}}.^[[Install and initialize the {{< var validmind.developer >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd)]
+
+::::
+
+1. Follow the instructions to run the first two code cells in the notebook,[^run-cells] which sets the stage by installing and initializing {{< var vm.product >}}.^[[Install and initialize the {{< var validmind.developer >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd)]
 
 1. Under the cell at bottom of the **Get your code snippet** section, confirm that you see a success message verifying that you've connected to the right model.
 
    This message verifies that the {{< var vm.developer >}} works as expected as is connected to the correct model and document type within the {{< var vm.platform >}}.
 
 
+
 <!-- FOOTNOTES -->
 
 [^run-cells]:
 
    - Hover over each cell and click the {{< fa circle-play >}} **icon**; OR
-   - Press `Shift + Enter` on Windows or `Cmd + Enter` if you are on a Mac
\ No newline at end of file
+   - Press `Shift + Enter` on Windows or `Cmd + Enter` if you are on a Mac
diff --git a/site/get-started/common-steps/_select-template.qmd b/site/get-started/common-steps/_select-template.qmd
index 86ca70945c..598a50ebde 100644
--- a/site/get-started/common-steps/_select-template.qmd
+++ b/site/get-started/common-steps/_select-template.qmd
@@ -12,6 +12,11 @@ c. Click **Use Template** to apply the template.
 
 ![Model documentation template selection](documentation-template-selection.png){fig-alt="A screenshot showing the model documentation template selection" .screenshot}
 
+::: {.callout}
+If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document.^[[Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents)]
+
+:::
+
 
 
 ::::
@@ -26,5 +31,11 @@ c. Click **Use Template** to apply the template.
 
 ![Validation report template selection](validation-template-selection.png){fig-alt="A screenshot showing the validation report template selection" .screenshot}
 
+::: {.callout}
+If you cannot locate your Validation document, make sure Validation type documents are enabled for model records and create a new document.^[[Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents)]
+
+:::
+
+
 
 ::::
diff --git a/site/get-started/developer/quickstart-developer.qmd b/site/get-started/developer/quickstart-developer.qmd
index a3f75af042..222b63f5a2 100644
--- a/site/get-started/developer/quickstart-developer.qmd
+++ b/site/get-started/developer/quickstart-developer.qmd
@@ -2,7 +2,7 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Quickstart — Model Development"
+title: "Quickstart — Development"
 subtitle: "15 minutes"
 date: last-modified
 listing:
@@ -26,17 +26,17 @@ includes:
    developer: true
 ---
 
-Register your first model, use the {{< var validmind.developer >}} to run tests and document a model, then review your generated model documentation within the {{< var validmind.platform >}}.
+Register your first record (model), use the {{< var validmind.developer >}} to run tests and document a model, then review your generated documentation within the {{< var validmind.platform >}}.
 
 {{< include /get-started/common-steps/_before-you-begin.qmd >}}
 
-## Register your first model
+## Register your first record
 
-The first step to using {{< var vm.product >}} to develop models is to register them in your model inventory:
+The first step to using {{< var vm.product >}} to develop records is to register them in your inventory. In this guide, we'll use a model-type record for our example:
 
 ::: {.panel-tabset}
 
-#### 1. Register a model
+#### 1. Register a sample model
 
 {{< include /get-started/common-steps/_register-your-first-model.qmd >}}
 
@@ -52,13 +52,13 @@ The first step to using {{< var vm.product >}} to develop models is to register
 
 ## Using the {{< var validmind.developer >}}
 
-Next, let's set up the {{< var validmind.developer >}} in your development environment of choice so we can use it to run and log tests, which helps automate the documentation of your models.
+Next, let's set up the {{< var validmind.developer >}} in your development environment of choice so we can use it to run and log tests, which helps automate the documentation of your records.
 
-Our companion notebook, **Quickstart for model documentation,**[^1] walks you through the steps of installing the {{< var vm.developer >}} in your environment, initializing the {{< var vm.developer >}} for use, and running a full suite of documentation tests that logs results to the {{< var validmind.platform >}}.
+Our companion notebook, **Quickstart for documentation,**[^1] walks you through the steps of installing the {{< var vm.developer >}} in your environment, initializing the {{< var vm.developer >}} for use, and running a full suite of documentation tests that logs results to the {{< var validmind.platform >}}.
 
 {{< include /get-started/common-steps/_access-quickstart-notebook.qmd >}}
 
-1. Open [Quickstart for model documentation]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/quickstart/quickstart_model_documentation.ipynb) and [run the quickstart notebook](#run-the-quickstart-notebook).
+1. Open [Quickstart for documentation]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/quickstart/quickstart_documentation.ipynb) and [run the quickstart notebook](#run-the-quickstart-notebook).
 
 #### Download the notebooks
 
@@ -66,11 +66,11 @@ Our companion notebook, **Quickstart for model documentation,**[^1] walks you th
 
 {{< include /get-started/common-steps/_download-notebooks.qmd >}}
 
-1. After the cloning process is complete, open `notebooks/quickstart/quickstart_model_documentation.ipynb` in your development environment and [run the quickstart notebook](#run-the-quickstart-notebook).
+1. After the cloning process is complete, open `notebooks/quickstart/quickstart_documentation.ipynb` in your development environment and [run the quickstart notebook](#run-the-quickstart-notebook).
 
 {{< include /get-started/common-steps/_download-code-samples.qmd >}}
 
-1. Open `notebooks/quickstart/quickstart_model_documentation.ipynb` in your development environment and [run the quickstart notebook](#run-the-quickstart-notebook).
+1. Open `notebooks/quickstart/quickstart_documentation.ipynb` in your development environment and [run the quickstart notebook](#run-the-quickstart-notebook).
 
 :::
 
@@ -88,7 +88,7 @@ Our companion notebook, **Quickstart for model documentation,**[^1] walks you th
 
 3. Continue running the rest of the notebook to automatically populate test results for your sample model to your documentation for that model in the {{< var vm.platform >}}.
 
-## Work with model documentation
+## Work with documentation
 
 After you successfully run the notebook, return to the {{< var validmind.platform >}}:
 
@@ -98,14 +98,14 @@ After you successfully run the notebook, return to the {{< var validmind.platfor
 
 3. In the left sidebar that appears for the model, click **Development** under {{< fa file >}} Documents:
 
-   - Your model's documentation is broken down into sections, defined by your document templates.[^3]
+   - Your documentation is broken down into sections, defined by your document templates.[^3]
    - Each section can be assigned a completion status,[^4] allowing you to track the progress of your documentation.
 
 4. Click on any section of the documentation to review the test results and drafts of test result summaries generated by the {{< var validmind.developer >}}.
 
    In any subsection, expand the **{{< var vm.product >}} Insights™** panel to view the Guidelines[^5] that tell you more about what these sections mean and help you with the task of documenting the model as a developer.
 
-5. Refine your model documentation by:
+5. Refine your documentation by:
 
    - Adding or editing content blocks[^6]
    - Adding additional test results after you've logged them[^7]
@@ -128,7 +128,7 @@ After you successfully run the notebook, return to the {{< var validmind.platfor
 
 ## What's next
 
-Now that you've grasped the basics of using {{< var vm.product >}} for model development, continue on your journey with our end-to-end training course for developers and browse through our resource hub for the {{< var validmind.developer >}}:
+Now that you've grasped the basics of using {{< var vm.product >}} for development, continue on your journey with our end-to-end training course for developers and browse through our resource hub for the {{< var validmind.developer >}}:
 
 :::{#whats-next}
 :::
@@ -136,7 +136,7 @@ Now that you've grasped the basics of using {{< var vm.product >}} for model dev
 
 <!-- FOOTNOTES -->
 
-[^1]: [Quickstart for model documentation](/notebooks/quickstart/quickstart_model_documentation.ipynb)
+[^1]: [Quickstart for documentation](/notebooks/quickstart/quickstart_documentation.ipynb)
 
 [^2]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
 
diff --git a/site/get-started/validator/quickstart-validator.qmd b/site/get-started/validator/quickstart-validator.qmd
index 8ca60db6f1..db62f00678 100644
--- a/site/get-started/validator/quickstart-validator.qmd
+++ b/site/get-started/validator/quickstart-validator.qmd
@@ -2,7 +2,7 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Quickstart — Model Validation"
+title: "Quickstart — Validation"
 subtitle: "20 minutes"
 date: last-modified
 listing:
@@ -17,15 +17,15 @@ listing:
     - ../../developer/validmind-library.qmd
 ---
 
-Use the {{< var validmind.developer >}} to run tests and validate a model, then attach your test results as evidence to your validation report in the {{< var validmind.platform >}}.
+Use the {{< var validmind.developer >}} to run tests and validate a record (model), then attach your test results as evidence to your validation report in the {{< var validmind.platform >}}.
 
 {{< include /get-started/common-steps/_before-you-begin.qmd >}}
 
 ## Register a model for validation
 
-Typically, you will be asked to validate a champion model that has already been independently registered in the model inventory and submitted to you.
+Typically, you will be asked to validate a champion that has already been independently registered in the inventory and submitted to you. In this guide, we'll use a model-type record for our example:
 
-#### 1. Register a model
+#### 1. Register a sample model
 
 For this quickstart, you'll register a dummy model first and assign yourself as the validator to familiarize you with the {{< var validmind.platform >}} interface:
 
@@ -33,13 +33,13 @@ For this quickstart, you'll register a dummy model first and assign yourself as
 
 #### 2. Assign validator credentials
 
-In order to log tests as a validator instead of as a developer, we'll need to adjust your **model stakeholder** permissions.
+In order to log tests as a validator instead of as a developer, we'll need to adjust your **inventory record stakeholder** permissions.
 
 On the model details page after you've registered your model:
 
 ::: {.panel-tabset}
 
-#### Remove yourself as model owner
+#### Remove yourself as owner
 
 a. Click on the **[owners]{.smallcaps}** tile, then click on the **x** next to your name.
 b. Click **Save** to apply your changes to that role.
@@ -57,7 +57,7 @@ b. Click **Save** to apply your changes to that role.
 :::
 
 ::: {.column-margin}
-![Model stakeholders with only the [validators]{.smallcaps} assigned](model-stakeholders.png){width=90% fig-alt="A screenshot showing the model stakeholders with only validators assigned" .screenshot}
+![Inventory record stakeholders with only the [validators]{.smallcaps} assigned](model-stakeholders.png){width=90% fig-alt="A screenshot showing the inventory record stakeholders with only validators assigned" .screenshot}
 :::
 
 #### 3. Select a report template
@@ -70,13 +70,13 @@ b. Click **Save** to apply your changes to that role.
 
 ## Using the {{< var validmind.developer >}}
 
-Next, let's set up the {{< var validmind.developer >}} in your validation environment of choice so we can use it to run and log tests, which helps automate the validation of your models.
+Next, let's set up the {{< var validmind.developer >}} in your validation environment of choice so we can use it to run and log tests, which helps automate the validation of your records.
 
-Our companion notebook, **Quickstart for model validation,**[^1] walks you through the steps of installing the {{< var vm.developer >}} in your environment, initializing the {{< var vm.developer >}} for use, and running data quality and model evaluation tests that log results to the {{< var validmind.platform >}}.
+Our companion notebook, **Quickstart for validation,**[^1] walks you through the steps of installing the {{< var vm.developer >}} in your environment, initializing the {{< var vm.developer >}} for use, and running data quality and model evaluation tests that log results to the {{< var validmind.platform >}}.
 
 {{< include /get-started/common-steps/_access-quickstart-notebook.qmd >}}
 
-1. Open [Quickstart for model validation]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/quickstart/quickstart_model_validation.ipynb) and [run the quickstart notebook](#run-the-quickstart-notebook).
+1. Open [Quickstart for validation]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/quickstart/quickstart_validation.ipynb) and [run the quickstart notebook](#run-the-quickstart-notebook).
 
 #### Download the notebooks
 
@@ -84,11 +84,11 @@ Our companion notebook, **Quickstart for model validation,**[^1] walks you throu
 
 {{< include /get-started/common-steps/_download-notebooks.qmd >}}
 
-1. After the cloning process is complete, open `notebooks/quickstart/quickstart_model_validation.ipynb` in your validation environment and [run the quickstart notebook](#run-the-quickstart-notebook)..
+1. After the cloning process is complete, open `notebooks/quickstart/quickstart_validation.ipynb` in your validation environment and [run the quickstart notebook](#run-the-quickstart-notebook).
 
 {{< include /get-started/common-steps/_download-code-samples.qmd >}}
 
-1. Open `notebooks/quickstart/quickstart_model_validation.ipynb` in your validation environment and [run the quickstart notebook](#run-the-quickstart-notebook).
+1. Open `notebooks/quickstart/quickstart_validation.ipynb` in your validation environment and [run the quickstart notebook](#run-the-quickstart-notebook).
 
 :::
 
@@ -116,9 +116,9 @@ After you successfully run the notebook, return to the {{< var validmind.platfor
 
 3. In the left sidebar that appears for the model, click **Validation** under {{< fa file >}} Documents:
 
-   - Your model's validation is broken down into sections, defined by your validation report templates.[^3]
+   - Your validation report is broken down into sections, defined by your report templates.[^3]
    - The report includes risk assessment summaries at the overall and per-section level, overviews of your compliance assessments provided within your validation report.[^4]
-   - Each sub-section allows you to attach test results as evidence,[^5] as well as log artifacts based on your evaluation of datasets or models.[^6]
+   - Each sub-section (or guideline) allows you to attach test results as evidence,[^5] as well as log artifacts based on your evaluation of datasets or records.[^6]
 
 :::: {.flex .flex-wrap .justify-around}
 
@@ -138,13 +138,13 @@ After you successfully run the notebook, return to the {{< var validmind.platfor
 
 #### Add evidence to your report
 
-Expand any section of the validation report to attach your test results and drafts of test result summaries generated by the {{< var validmind.developer >}} as evidence by clicking on **{{< fa link >}} Link Evidence to Report**.
+Expand any section of the validation report, then click **Evidence** on any guideline to expand the evidence panel, where you can attach your test results and drafts of test result summaries generated by the {{< var validmind.developer >}} as evidence.
 
 For example:
 
-1. Locate the 2.2.1. Data Quality section and click on **Class Imbalance Assessment**.
+1. Within your validation report, click on **Class Imbalance Assessment**.
 
-2. Under the Class Imbalance Assessment sub-section, locate Validator Evidence then click **{{< fa link >}} Link Evidence to Report**.
+2. Under the Class Imbalance Assessment guideline, click **{{< fa link >}} Link Evidence**, then select **Validator Evidence** as the [evidence type]{.smallcaps}.
 
 3. Select the Class Imbalance test results we logged: **ValidMind Data Validation Class Imbalance**
 
@@ -159,7 +159,7 @@ For example:
 
 ## What's next
 
-Now that you've grasped the basics of using {{< var vm.product >}} for model validation, continue on your journey with our end-to-end training course for validators and browse through our resource hub for the {{< var validmind.developer >}}:
+Now that you've grasped the basics of using {{< var vm.product >}} for validation, continue on your journey with our end-to-end training course for validators and browse through our resource hub for the {{< var validmind.developer >}}:
 
 :::{#whats-next}
 :::
@@ -167,15 +167,15 @@ Now that you've grasped the basics of using {{< var vm.product >}} for model val
 
 <!-- FOOTNOTES -->
 
-[^1]: [Quickstart for model validation](/notebooks/quickstart/quickstart_model_validation.ipynb)
+[^1]: [Quickstart for validation](/notebooks/quickstart/quickstart_validation.ipynb)
 
 [^2]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
 
 [^3]: [Working with document templates](/guide/templates/working-with-document-templates.qmd)
 
-[^4]: [Assess compliance](/guide/validation/assess-compliance.qmd#provide-compliance-assessments)
+[^4]: [Assess compliance](/guide/validation/assess-compliance.qmd#assign-compliance-assessments)
 
-[^5]: [Assess compliance](/guide/validation/assess-compliance.qmd#link-validator-evidence)
+[^5]: [Assess compliance](/guide/validation/assess-compliance.qmd#map-evidence)
 
 [^6]: [Add and manage artifacts](/guide/validation/add-manage-artifacts.qmd#add-artifacts-on-validation-reports)
 
diff --git a/site/guide/_sidebar.yaml b/site/guide/_sidebar.yaml
index bf5173df14..3d02a23c7e 100644
--- a/site/guide/_sidebar.yaml
+++ b/site/guide/_sidebar.yaml
@@ -71,7 +71,7 @@ website:
               contents:
                 - guide/workflows/manage-record-stages.qmd
                 - guide/workflows/configure-workflows.qmd
-                - guide/workflows/workflow-configuration-examples.qmd
+                # - guide/workflows/workflow-configuration-examples.qmd
             - file: guide/workflows/working-with-workflows.qmd
               contents:
                 - guide/workflows/manage-workflows.qmd
diff --git a/site/guide/configuration/_add-business-units.qmd b/site/guide/configuration/_add-business-units.qmd
index d9fe0f3a9e..ddc3be0ff2 100644
--- a/site/guide/configuration/_add-business-units.qmd
+++ b/site/guide/configuration/_add-business-units.qmd
@@ -7,7 +7,7 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 1. Click **{{< fa plus >}} Add Business Unit** under Business Units.
 
-1. Enter in your **[business unit name]{.smallcaps}**.
+1. Enter your **[business unit name]{.smallcaps}**.
 
 1. Click **Add Business Unit** to save your changes.
 
@@ -18,7 +18,7 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 :::: {.content-visible unless-format="revealjs" unless-meta="includes.quickstart"}
 a. Click **{{< fa plus >}} Add Business Unit** under Business Units.
 
-a. Enter in your **[business unit name]{.smallcaps}**.
+a. Enter your **[business unit name]{.smallcaps}**.
 
 a. Click **Add Business Unit** to save your changes.
 
@@ -35,7 +35,7 @@ a. Under {{< fa building >}} Organization, select **Organization**.
 
 a. Click **{{< fa plus >}} Add Business Unit** under Business Units.
 
-a. Enter in your **[business unit name]{.smallcaps}**.
+a. Enter your **[business unit name]{.smallcaps}**.
 
 a. Click **Add Business Unit** to save your changes.
 
diff --git a/site/guide/documentation/_add-test-results.qmd b/site/guide/documentation/_add-test-results.qmd
index c5d512bd15..bf9e22965e 100644
--- a/site/guide/documentation/_add-test-results.qmd
+++ b/site/guide/documentation/_add-test-results.qmd
@@ -36,11 +36,11 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 
 :::: {.content-hidden unless-format="revealjs"}
-With the test results logged, let's head to the record we connected to at the beginning of this notebook and insert our test results into the documentation:
+With the test results logged, let's head to the model we connected to at the beginning of this notebook and insert our test results into the documentation:
 
-1. From the **{{< fa cubes >}} Inventory** in the {{< var validmind.platform >}}, go to the record you connected to earlier.
+1. From the **{{< fa cubes >}} Inventory** in the {{< var validmind.platform >}}, go to the model you connected to earlier.
 
-1. In the left sidebar that appears for your record, click **Development** under {{< fa file >}} Documents.
+1. In the left sidebar that appears for your model, click **Development** under {{< fa file >}} Documents.
 
 1. Locate the Data Preparation section and click on **2.3 Correlations and Interactions** to expand that section.
 
diff --git a/site/guide/documentation/_check-documents.qmd b/site/guide/documentation/_check-documents.qmd
index 7594bd37bf..af38364c4d 100644
--- a/site/guide/documentation/_check-documents.qmd
+++ b/site/guide/documentation/_check-documents.qmd
@@ -89,9 +89,9 @@ To export the results of the {{< var vm.checker >}} to a `.pdf` (Portable Docume
 :::: {.content-visible when-format="revealjs" when-meta="includes.developer"}
 1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
-1. Select a record or find your record [by applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="_blank"}.
+1. Select a model or find your model [by applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="_blank"}.
 
-1. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select **Development**.
+1. In the left sidebar that appears for your model, click **{{< fa file >}} Documents** and select **Development**.
 
 1. Locate the {{< var vm.checker >}} box on the right and click **{{< fa check >}} Check Document**.
 
@@ -124,7 +124,7 @@ b. Review questions that require attention. Each question includes:
      - **Observation** — An analysis of how the documentation currently addresses the question
      - **Recommendation** — If suggested, guidance on how to revise the documentation to better address the question
 
-Use the feedback provided by the {{< var validmind.checker >}} to review the appropriate sections of your documentation and decide what revisions should be made. Or, if you have run the {{< var vm.checker >}} before and were just checking that all documentation issues have been addressed, submit your record for validation.
+Use the feedback provided by the {{< var validmind.checker >}} to review the appropriate sections of your documentation and decide what revisions should be made. Or, if you have run the {{< var vm.checker >}} before and were just checking that all documentation issues have been addressed, submit your model for validation.
 
 #### 3. (Optional) Export results
 
@@ -143,9 +143,9 @@ To export the results of the {{< var vm.checker >}} to a `.pdf` (Portable Docume
 :::: {.content-visible when-format="revealjs" unless-meta="includes.developer"}
 1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
-1. Select a record or find your record [by applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="_blank"}.
+1. Select a model or find your model [by applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="_blank"}.
 
-1. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select **Validation**.
+1. In the left sidebar that appears for your model, click **{{< fa file >}} Documents** and select **Validation**.
 
 1. Locate {{< fa file-circle-check >}} Check Document on the right and click to expand the menu, then click **{{< fa check >}} Check Document**.
 
diff --git a/site/guide/documentation/_locate-document-overview.qmd b/site/guide/documentation/_locate-document-overview.qmd
index 59a5a4513d..af25cd9fec 100644
--- a/site/guide/documentation/_locate-document-overview.qmd
+++ b/site/guide/documentation/_locate-document-overview.qmd
@@ -18,7 +18,7 @@ To locate your document overview for a record:
 :::: {.content-hidden unless-format="revealjs"}
 1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
-1. Select a record or [find your record by applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="blank"}.
+1. Select a record or [find your record by applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="_blank"}.
 
 1. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select **Development**.
 
diff --git a/site/guide/documentation/content-editing-toolbar.png b/site/guide/documentation/content-editing-toolbar.png
index 846109487e..9421913ad7 100644
Binary files a/site/guide/documentation/content-editing-toolbar.png and b/site/guide/documentation/content-editing-toolbar.png differ
diff --git a/site/guide/documentation/content_blocks/_generate-with-ai.qmd b/site/guide/documentation/content_blocks/_generate-with-ai.qmd
index 8df9c71777..f3ed00600d 100644
--- a/site/guide/documentation/content_blocks/_generate-with-ai.qmd
+++ b/site/guide/documentation/content_blocks/_generate-with-ai.qmd
@@ -3,9 +3,9 @@ Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 :::: {.content-visible unless-format="revealjs"}
-1. Click **[{{< fa diamond >}} (Generate Text with AI)]{.pink}** in the toolbar while editing a content block.
+1. Click **{{< fa ellipsis-vertical >}}** in the content editing toolbar and select **[{{< fa diamond >}} (Generate Text with AI)]{.pink}**.
 
-1. Enter in a custom prompt and click **Send**, or click **Generate Content** to compose a draft for review.
+1. Enter a custom prompt and click **Send**, or click **Generate Content** to compose a draft for review.
 
    <!-- PDF CONTEXT DOCUMENTS ARE BEHIND A FEATURE FLAG -->
 
@@ -31,9 +31,9 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 <!-- INLINE LINKS FOR REVEALJS TRAINING -->
 :::: {.content-hidden unless-format="revealjs"}
-1. Click **[{{< fa diamond >}} (Generate Text with AI)]{.pink}** in the toolbar while editing a content block.
+1. Click **{{< fa ellipsis-vertical >}}** in the content editing toolbar and select **[{{< fa diamond >}} (Generate Text with AI)]{.pink}**.
 
-1. Enter in a custom prompt and click **Send**, or click **Generate Content** to compose a draft for review.
+1. Enter a custom prompt and click **Send**, or click **Generate Content** to compose a draft for review.
 
    :::: {.content-visible when-format="revealjs" when-meta="includes.pdf-context"}
    You can also include [record attachments in `.pdf` format](/guide/inventory/edit-inventory-fields.qmd#manage-attachments){target="_blank"} as context documents:
diff --git a/site/guide/documentation/work-with-content-blocks.qmd b/site/guide/documentation/work-with-content-blocks.qmd
index cd1344e9b6..6ec599dbae 100644
--- a/site/guide/documentation/work-with-content-blocks.qmd
+++ b/site/guide/documentation/work-with-content-blocks.qmd
@@ -14,17 +14,17 @@ includes:
 
 Make edits to your documents by adding or removing content blocks directly in the online editor.
 
-## What are content blocks?
-
-Content blocks provide you with sections that are part of a template, and are used in documents.
-
-- You can think of these sections as an empty canvas that you fill in with text and test results.
-- Multiple sections are joined to create a longer document with a table of contents that has different heading and subheading levels, such as "1.," "1.1.," and so on.
-
 ::: {.callout title="Static PDF documents cannot be edited."}
 You can only work with content blocks in PDFs converted to editable documents,[^1] documents generated by the {{< var validmind.developer >}}, or documents created in the {{< var validmind.platform >}}.
 :::
 
+## What are content blocks?
+
+Content blocks are modular document template components, used to populate your documents:
+
+- Content blocks are empty canvases that you fill in with text and test results.
+- Content blocks are inserted into document templates that define the structure of your documents.[^2]
+
 #### Content block types
 
 Content blocks can be new, blank blocks, or prepopulated via your library of logged test or metric results and text block templates:
@@ -43,11 +43,12 @@ The content editing toolbar is a rich text editor that enables you to:
 
 - Undo or redo changes
 - Format your text, including adding hyperlinks and code blocks
-- Reference related record and artifact field values with variables[^2]
-- Insert LaTex formulas[^3]
+- Reference related record and artifact field values with variables[^3]
+- Insert LaTeX formulas[^4]
+- Reference other sections of the document[^5]
 - Attach images via upload or URL
 
-You can also use the toolbar to suggest changes, save named versions of content, and leave comments.[^4]
+You can also use the toolbar to suggest changes, save named versions of content, and leave comments.[^6]
 
 ::: {.callout title="Stuck on where to start?"}
 Use {{< var vm.product >}} to assist you with generating content via AI!^[[Generate content drafts with AI](#generate-content)]
@@ -58,9 +59,9 @@ Use {{< var vm.product >}} to assist you with generating content via AI!^[[Gener
 ## Prerequisites
 
 - [x] {{< var link.login >}}
-- [x] There are records registered in the inventory.[^5]
-- [x] Documents exist and are completed or are in progress for your record.[^6]
-- [x] You are a [{{< fa code >}} Developer]{.bubble} or [{{< fa circle-check >}} Validator]{.bubble}, or assigned another role with sufficient permissions to perform the tasks in this guide.[^7]
+- [x] There are records registered in the inventory.[^7]
+- [x] Documents exist and are completed or are in progress for your record.[^8]
+- [x] You are a [{{< fa code >}} Developer]{.bubble} or [{{< fa circle-check >}} Validator]{.bubble}, or assigned another role with sufficient permissions to perform the tasks in this guide.[^9]
 
 :::
 
@@ -79,26 +80,26 @@ Use {{< var vm.product >}} to assist you with generating content via AI!^[[Gener
 
    #### [from library]{.smallcaps}
    Text Block
-   : Inserts a text block from a template in your block library:[^8]
+   : Inserts a text block from a template in your block library:[^10]
    a. Select the reusable blocks you want to add.
    b. Click **Insert # Text Block(s) to Document**.
 
-   Test-Driven[^9]
+   Test-Driven[^11]
    : Adds a new section with logged test results.
 
-   Metric Over Time[^10]
+   Metric Over Time[^12]
    : Adds a new section with logged metric over time results.
 
    :::
 
-7. After adding the block to your document, click on the text to make changes or add comments.[^11]
+7. After adding the block to your document, click on the text to make changes or add comments.[^13]
 
 ### Reference field values
 
 While editing a simple text block within documents, you can reference values in the form of variables from:
 
 ::: {.callout}
-- To reference field values in the form of variables, your organization must not have tracked changes enabled by default.[^12]
+- To reference field values in the form of variables, your organization must not have tracked changes enabled by default.[^14]
 - Note that while you are able to select fields with empty values within available record or artifact type fields, no value will be displayed in the content block until the field is populated.
 
 :::
@@ -118,8 +119,8 @@ While editing a simple text block within documents, you can insert math equation
 While editing a simple text block within documents, you can have {{< var vm.product >}} assist you with generating content drafts.
 
 ::: {.callout title="How can I generate content drafts with AI?"}
-- To use the generate content drafts with AI feature, your organization must not have tracked changes enabled by default.[^13]
-- Generating content drafts works best after you've logged tests with the {{< var validmind.developer >}},[^14] as existing test descriptions and results provide more context for the {{< var vm.product >}} AI Content Builder to draw upon.
+- To use the generate content drafts with AI feature, your organization must not have tracked changes enabled by default.[^15]
+- Generating content drafts works best after you've logged tests with the {{< var validmind.developer >}},[^16] as existing test descriptions and results provide more context for the {{< var vm.product >}} AI Content Builder to draw upon.
 
 :::
 
@@ -128,7 +129,7 @@ To generate content drafts:
 
 {{< include content_blocks/_generate-with-ai.qmd >}}
 
-When generating content drafts with AI, accepted versions and edits are retained in your {{< fa wifi >}} Activity[^15] just like other updates to your documents.
+When generating content drafts with AI, accepted versions and edits are retained in your {{< fa wifi >}} Activity[^17] just like other updates to your documents.
 
 <br>
 
@@ -150,6 +151,34 @@ When you generate content, the content builder uses the following context:
 :::
 :::
 
+### Reference document sections
+
+While editing a simple text block within documents, you can directly reference other sections of the document and create hyperlinks to those sections:
+
+::: {.panel-tabset}
+
+#### From the content block editor
+
+1. In any simple text block, type `#` to retrieve the table of contents for the document you're editing.
+
+2. Select the title of the section you want to reference from the drop-down menu.
+
+3. After you click out of the content block editor, click on the hyperlink to verify that it navigates you to the correct section as expected.
+
+#### Using the content toolbar
+
+1. Click **{{< fa ellipsis-vertical >}}** in the content editing toolbar.
+
+2. Select **{{< fa link >}} Insert Reference**.
+
+3. Select the title of the section you want to reference from the drop-down menu.
+
+4. After you click out of the content block editor, click on the hyperlink to verify that it navigates you to the correct section as expected.
+
+:::
+
+Hyperlinks will also take you to the referenced section in PDF document exports.[^18]
+
 ## Remove content blocks
 
 ::: {.callout-important}
@@ -158,11 +187,11 @@ Test-driven or metric over time blocks can be re-added later on but **text block
 
 1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
-2. Select a record or find your record by applying a filter or searching for it.[^16]
+2. Select a record or find your record by applying a filter or searching for it.[^19]
 
-3. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select the **Latest** tab.[^17]
+3. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select the **Latest** tab.[^20]
 
-4. Click on the document file you want to remove a block from.[^18]
+4. Click on the document file you want to remove a block from.[^21]
 
 5. Click on a section header to expand that section and remove content.
 
@@ -177,36 +206,42 @@ Test-driven or metric over time blocks can be re-added later on but **text block
 
 [^1]: [Manage documents](/guide/templates/manage-documents.qmd#add-record-documents)
 
-[^2]: [Reference field values](#reference-field-values)
+[^2]: [Working with templates](/guide/templates/working-with-document-templates.qmd)
+
+[^3]: [Reference field values](#reference-field-values)
+
+[^4]: [Insert mathematical formulas](#insert-mathematical-formulas)
+
+[^5]: [Reference document sections](#reference-document-sections)
 
-[^3]: [Insert mathematical formulas](#insert-mathematical-formulas)
+[^6]: [Collaborate with others](collaborate-with-others.qmd)
 
-[^4]: [Collaborate with others](collaborate-with-others.qmd)
+[^7]: [Register records in the inventory](/guide/inventory/register-records-in-inventory.qmd)
 
-[^5]: [Register records in the inventory](/guide/inventory/register-records-in-inventory.qmd)
+[^8]: [Working with documents](/guide/templates/working-with-documents.qmd)
 
-[^6]: [Working with documents](/guide/templates/working-with-documents.qmd)
+[^9]: [Manage permissions](/guide/configuration/manage-permissions.qmd)
 
-[^7]: [Manage permissions](/guide/configuration/manage-permissions.qmd)
+[^10]: [Manage text block library](/guide/templates/manage-text-block-library.qmd)
 
-[^8]: [Manage text block library](/guide/templates/manage-text-block-library.qmd)
+[^11]: [Work with test results](/guide/documentation/work-with-test-results.qmd)
 
-[^9]: [Work with test results](/guide/documentation/work-with-test-results.qmd)
+[^12]: [Work with metrics over time](/guide/monitoring/work-with-metrics-over-time.qmd)
 
-[^10]: [Work with metrics over time](/guide/monitoring/work-with-metrics-over-time.qmd)
+[^13]: [Collaborate with others](/guide/documentation/collaborate-with-others.qmd)
 
-[^11]: [Collaborate with others](/guide/documentation/collaborate-with-others.qmd)
+[^14]: [Managing your organization](/guide/configuration/managing-your-organization.qmd#manage-document-defaults)
 
-[^12]: [Managing your organization](/guide/configuration/managing-your-organization.qmd#manage-document-defaults)
+[^15]: [Managing your organization](/guide/configuration/managing-your-organization.qmd#manage-document-defaults)
 
-[^13]: [Managing your organization](/guide/configuration/managing-your-organization.qmd#manage-document-defaults)
+[^16]: [Run tests and test suites](/developer/how-to/testing-overview.qmd)
 
-[^14]: [Run tests and test suites](/developer/how-to/testing-overview.qmd)
+[^17]: [View record activity](/guide/inventory/view-record-activity.qmd)
 
-[^15]: [View model activity](/guide/inventory/view-record-activity.qmd)
+[^18]: [Export documents](/guide/reporting/export-documents.qmd)
 
-[^16]: [Working with the model inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-models)
+[^19]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
 
-[^17]: [Work with document versions](/guide/documentation/work-with-document-versions.qmd)
+[^20]: [Work with document versions](/guide/documentation/work-with-document-versions.qmd)
 
-[^18]: [Working with documents](/guide/templates/working-with-documents.qmd)
\ No newline at end of file
+[^21]: [Working with documents](/guide/templates/working-with-documents.qmd)
\ No newline at end of file
diff --git a/site/guide/documentation/work-with-document-versions.qmd b/site/guide/documentation/work-with-document-versions.qmd
index 8c1ad1cdae..15ee59055d 100644
--- a/site/guide/documentation/work-with-document-versions.qmd
+++ b/site/guide/documentation/work-with-document-versions.qmd
@@ -33,7 +33,7 @@ Save read-only versions of your documents in the {{< var validmind.platform >}}
 
 5. On the document overview page, click **{{< fa bookmark >}} Save Version**.
 
-6. Enter in your **[notes]{.smallcaps}** for the version.
+6. Enter your **[notes]{.smallcaps}** for the version.
 
 7. Click **Save Version** to create a read-only version of that document that captures the contents in the current state.
 
diff --git a/site/guide/documentation/working-with-documentation.qmd b/site/guide/documentation/working-with-documentation.qmd
index 566f2e7f94..d5ada74553 100644
--- a/site/guide/documentation/working-with-documentation.qmd
+++ b/site/guide/documentation/working-with-documentation.qmd
@@ -55,26 +55,26 @@ This section describes how to work with Development type documents[^1] (for exam
 
 ## Key concepts
 
-<!-- TO EDIT THESE KEY CONCEPTS, SEE `about/glossary/_model-documentation.qmd` -->
+<!-- TO EDIT THESE KEY CONCEPTS, SEE `about/glossary/_documentation.qmd` -->
 
-{{< include /about/glossary/model_documentation/_doc-intro.qmd >}}
+{{< include /about/glossary/documentation/_doc-intro.qmd >}}
 
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-50-ns}
 
-{{< include /about/glossary/model_documentation/_conceptual-soundness.qmd >}}
+{{< include /about/glossary/documentation/_conceptual-soundness.qmd >}}
 
-{{< include /about/glossary/model_documentation/_data-preparation.qmd >}}
+{{< include /about/glossary/documentation/_data-preparation.qmd >}}
 
 
 :::
 
 ::: {.w-40-ns}
 
-{{< include /about/glossary/model_documentation/_model-development.qmd >}}
+{{< include /about/glossary/documentation/_model-development.qmd >}}
 
-{{< include /about/glossary/model_documentation/_monitoring-governance.qmd >}}
+{{< include /about/glossary/documentation/_monitoring-governance.qmd >}}
 
 :::
 
diff --git a/site/guide/integrations/configure-connections.qmd b/site/guide/integrations/configure-connections.qmd
index 831f96e5aa..2bca5f107e 100644
--- a/site/guide/integrations/configure-connections.qmd
+++ b/site/guide/integrations/configure-connections.qmd
@@ -165,7 +165,7 @@ Required configuration details:
 
 4. In the modal that opens, select one of the supported connections, such as MLflow or Jira.
 
-5. Enter in the:
+5. Enter the following:
 
    - **[integration name]{.smallcaps}** — How other admins can identify the connection.
    - **[description]{.smallcaps}** (optional) — The intended usage or additional details.
diff --git a/site/guide/integrations/integrations-examples/use-webhooks-with-workflows.qmd b/site/guide/integrations/integrations-examples/use-webhooks-with-workflows.qmd
index 22b7dd9a0d..ea216d903f 100644
--- a/site/guide/integrations/integrations-examples/use-webhooks-with-workflows.qmd
+++ b/site/guide/integrations/integrations-examples/use-webhooks-with-workflows.qmd
@@ -36,7 +36,7 @@ Start a {{< var vm.product >}} workflow from an external system by sending a POS
 4. Copy or select the webhook details:
 
    - **URL** — Click **{{< fa regular copy >}} Copy** for the unique POST webhook URL to use when configuring your external system.
-   - **[select target model for payload]{.smallcaps}** — Select the model that is associated with the webhook payload from the dropdown.
+   - **[select target {record-type} record for payload]{.smallcaps}** — Select the record that is associated with the webhook payload from the dropdown.
    - **Payload** — Click **{{< fa regular copy >}} Copy** for the JSON payload that external systems must send in their POST request, where the value for `target_cuid` is shown after you select a target:
    
      ```json
@@ -84,7 +84,7 @@ Trigger a waiting {{< var vm.product >}} workflow step to continue from an exter
 4. Copy or select the webhook details:
 
    - **URL** — Click **{{< fa regular copy >}} Copy** for the unique POST webhook URL to use when configuring your external system.
-   - **[select target model for payload]{.smallcaps}** — Select the model that is associated with the webhook payload from the dropdown.
+   - **[select target {record-type} record for payload]{.smallcaps}** — Select the record that is associated with the webhook payload from the dropdown.
    - **Payload** — Click **{{< fa regular copy >}} Copy** for the JSON payload that external systems must send in their POST request, where the value for `target_cuid` is shown after you select a target:
 
      ```json
diff --git a/site/guide/inventory/_add-edit-record-types.qmd b/site/guide/inventory/_add-edit-record-types.qmd
index ff0ca938fa..21416b69e7 100644
--- a/site/guide/inventory/_add-edit-record-types.qmd
+++ b/site/guide/inventory/_add-edit-record-types.qmd
@@ -46,7 +46,7 @@ b. Make your desired changes to your record type, then click **Update**.
 
 :::: {.content-hidden unless-format="revealjs"}
 
-- To add: Click **{{< fa plus >}} Add Inventory Record Type**, enter in the record type details, then click **Create**.
+- To add: Click **{{< fa plus >}} Add Inventory Record Type**, enter the record type details, then click **Create**.
 - To edit: Click  on an existing record type, update the record type details, then click **Update**.
 
 #### Record type details
diff --git a/site/guide/inventory/_field-types.qmd b/site/guide/inventory/_field-types.qmd
index df5e65c8f8..77fabc701e 100644
--- a/site/guide/inventory/_field-types.qmd
+++ b/site/guide/inventory/_field-types.qmd
@@ -72,26 +72,6 @@ Calculation
 {{< var vm.product >}} runs calculated field formulas on the Starlark formula engine. Formulas authored on earlier releases were written in Python and have been migrated to Starlark automatically. When creating or editing formulas, you now must use the Starlark syntax.
 :::
 
-##### Available helpers
-
-Reference these helpers in your formulas — they cover the date, number, and list operations the engine does not expose directly:
-
-| Helper | Returns | Description |
-|---|---|---|
-| `today()` | `"YYYY-MM-DD"` | Current date as an ISO string. |
-| `safe_parse_date(value, default=None)` | `"YYYY-MM-DD"` or `default` | Parses ISO dates/datetimes or millisecond/second epoch timestamps. |
-| `to_iso(value)` | `"YYYY-MM-DD"` or `None` | Alias for `safe_parse_date` with no default. |
-| `add_days(date, n)` | `"YYYY-MM-DD"` or `None` | Adds `n` days to an ISO date. |
-| `add_months(date, n)` | `"YYYY-MM-DD"` or `None` | Adds `n` months to an ISO date. |
-| `days_between(a, b)` | `int` or `None` | Days between two ISO dates (`a` − `b`). |
-| `days_since(date)` | `int` or `None` | Days from `date` to today. |
-| `months_between(a, b)` | `int` or `None` | Full-month difference between two ISO dates. |
-| `get_year(date)` / `get_month(date)` / `get_day(date)` | `int` or `None` | Components of an ISO date. |
-| `safe_int(value, default=0)` | `int` | Tolerates strings and missing values. |
-| `safe_float(value, default=0.0)` | `float` | Tolerates strings and missing values. |
-| `list_count(list, value)` | `int` | Number of times `value` appears in `list`. |
-| `zfill(value, width)` | `string` | Zero-pads `value` to `width` characters. |
-
 :::: {.content-visible when-format="html" when-meta="includes.inventory"}
 1. Select from the drop-down of **[available record fields]{.smallcaps}** to allow your formula access to the field's values.^[Fields are grouped by field type.]
 2. Replace the demonstration formula with your own in the code box provided.^[Reference fields with dictionary-style access — `params["fieldKey"]` — and use the available helpers for date and number work.]
@@ -126,9 +106,9 @@ def formula(params):
 
 :::: {.content-visible when-format="html" when-meta="includes.artifacts"}
 1. Select from the drop-down of **[available artifact fields]{.smallcaps}** and **[record fields available via]{.smallcaps} `params["model"]`** to allow your formula access to the field's values.^[Fields are grouped by field type.]
-2. Replace the demonstration formula with your own in the code box provided.^[Reference fields with dictionary-style access — `params["fieldKey"]` and `params["model"]["fieldKey"]` for parent inventory record data — and use the available helpers for date and number work.
-4. Click **Test Calculation {{< fa angle-down >}}** to open the testing area.
-5. Enter in sample values in the testing area then click **{{< fa play >}} Test Calculation** to validate your formula.
+2. Replace the demonstration formula with your own in the code box provided.^[Reference fields with dictionary-style access — `params["fieldKey"]` and `params["model"]["fieldKey"]` for parent inventory record data — and use the available helpers for date and number work.]
+3. Click **Test Calculation {{< fa angle-down >}}** to open the testing area.
+4. Enter sample values in the testing area then click **{{< fa play >}} Test Calculation** to validate your formula.
 <br><br>
 
 ::: {.callout-button .pl4 .nt4}
@@ -195,6 +175,70 @@ def formula(params):
 
 ::::
 
+
+
+::: {.panel-tabset}
+
+#### Params dictionary
+
+In addition to custom field keys you add from the **available fields** drop-down, formulas can read built-in keys on the `params` dictionary:
+
+<!-- VISIBLE ONLY ON PAGES THAT HAVE A CUSTOM METADATA TAG:
+
+```includes:
+    inventory: true
+``` -->
+
+:::: {.content-visible when-format="html" when-meta="includes.inventory"}
+| Param | Applies to | Availability | Description |
+|---|---|---|---|
+| `params["<fieldKey>"]` | Inventory records & artifacts | Add the field from the **available fields** drop-down | Current value of another custom field on the same record or artifact. |
+| `params["model_stage"]` | Inventory records | Add **Model Stage** from the **available fields** drop-down | Current model stage name as a string (for example, `"Production"`). Returns an empty string when no stage is assigned. Compare directly: `params["model_stage"] == "Production"`. |
+| `params["stakeholders"]` | Inventory records | Add a stakeholder role from the **available fields** drop-down (for example, **Stakeholders — Owners**) | Assigned users by stakeholder role. Default role keys are `owners`, `developers`, and `validators`. Custom stakeholder types use `custom_stakeholder_<cuid>`. Each entry includes `name`, `email`, and `title`. |
+| `params["integrations"]` | Inventory records & artifacts | Reference `params["integrations"]` in the formula source | Linked external integration data keyed by service (for example, `params["integrations"]["mlflow"]`). Empty when integrations are not configured or not referenced. |
+
+::::
+
+<!-- VISIBLE ONLY ON PAGES THAT **DO NOT** HAVE A CUSTOM METADATA TAG:
+
+```includes:
+    inventory: true
+``` -->
+
+:::: {.content-visible when-format="html" unless-meta="includes.inventory"}
+| Param | Applies to | Availability | Description |
+|---|---|---|---|
+| `params["<fieldKey>"]` | Inventory records & artifacts | Add the field from the **available fields** drop-down | Current value of another custom field on the same record or artifact. |
+| `params["integrations"]` | Inventory records & artifacts | Reference `params["integrations"]` in the formula source | Linked external integration data keyed by service (for example, `params["integrations"]["mlflow"]`). Empty when integrations are not configured or not referenced. |
+| `params["finding_type"]` | Artifacts | Always available on artifact formulas | Artifact type metadata with `["tag"]` (technical identifier) and `["name"]` (display name). |
+| `params["model"]` | Artifacts | Always available when the artifact is linked to an inventory record | Parent inventory record custom field values (for example, `params["model"]["criticality_level"]`). |
+
+::::
+
+
+#### Available helpers
+
+Reference these helpers in your formulas — they cover the date, number, and list operations the engine does not expose directly:
+
+| Helper | Returns | Description |
+|---|---|---|
+| `today()` | `"YYYY-MM-DD"` | Current date as an ISO string. |
+| `safe_parse_date(value, default=None)` | `"YYYY-MM-DD"` or `default` | Parses ISO dates/datetimes or millisecond/second epoch timestamps. |
+| `to_iso(value)` | `"YYYY-MM-DD"` or `None` | Alias for `safe_parse_date` with no default. |
+| `add_days(date, n)` | `"YYYY-MM-DD"` or `None` | Adds `n` days to an ISO date. |
+| `add_months(date, n)` | `"YYYY-MM-DD"` or `None` | Adds `n` months to an ISO date. |
+| `days_between(a, b)` | `int` or `None` | Days between two ISO dates (`a` − `b`). |
+| `days_since(date)` | `int` or `None` | Days from `date` to today. |
+| `months_between(a, b)` | `int` or `None` | Full-month difference between two ISO dates. |
+| `get_year(date)` / `get_month(date)` / `get_day(date)` | `int` or `None` | Components of an ISO date. |
+| `safe_int(value, default=0)` | `int` | Tolerates strings and missing values. |
+| `safe_float(value, default=0.0)` | `float` | Tolerates strings and missing values. |
+| `list_count(list, value)` | `int` | Number of times `value` appears in `list`. |
+| `zfill(value, width)` | `string` | Zero-pads `value` to `width` characters. |
+
+:::
+
+
 Checkbox
 : A `true`/`false` value set by a toggle.
 
@@ -266,7 +310,7 @@ Calculation
     1. Select from the drop-down of **[available record fields]{.smallcaps}**, or **[available artifact fields]{.smallcaps}** and **[record fields available via]{.smallcaps} `params["model"]`** (artifact fields) to allow your formula access to the field's values.
     2. Replace the demonstration formula with your own in the code box provided.
     4. Click **Test Calculation {{< fa angle-down >}}** to open the testing area.
-    5. Enter in sample values in the testing area then click **{{< fa play >}} Test Calculation** to validate your formula.
+    5. Enter sample values in the testing area then click **{{< fa play >}} Test Calculation** to validate your formula.
 
 Checkbox
 : A `true`/`false` value set by a toggle.
diff --git a/site/guide/inventory/_remove-layout-view.qmd b/site/guide/inventory/_remove-layout-view.qmd
deleted file mode 100644
index 8401ffa09e..0000000000
--- a/site/guide/inventory/_remove-layout-view.qmd
+++ /dev/null
@@ -1,44 +0,0 @@
-<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-Refer to the LICENSE file in the root of this repository for details.
-SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
-
-<!-- COPYRIGHT TEXT MESSES WITH AUTOMATIC RENUMBERING IN INCLUDES -->
-
-<!-- VISIBLE ONLY ON PAGES THAT HAVE A CUSTOM METADATA TAG:
-
-```includes:
-    inventory: true
-``` -->
-
-:::: {.content-visible when-format="html" when-meta="includes.inventory"}
-2. Select the **[record type]{.smallcaps}** you want to remove a view for from the drop-down menu.
-
-3. Click **{{< fa bookmark >}} Select View**.
-
-4. Hover over the view you want to modify.
-
-5. When the **{{< fa ellipsis-vertical >}}** appears, click on it to edit the name or description or to delete the view:
-
-    - To edit a view, select **{{< fa pencil >}} Edit View**. Make your edits then click **Save Changes** to apply your adjustments.
-    - To remove a view, select [**{{< fa trash-can >}} Remove View**]{.red}. Click **Yes, Delete View** to confirm permanent deletion of that view.
-
-::::
-
-<!-- VISIBLE ONLY ON PAGES THAT **DO NOT** HAVE A CUSTOM METADATA TAG:
-
-```includes:
-    inventory: true
-``` -->
-
-:::: {.content-visible when-format="html" unless-meta="includes.inventory"}
-3. Click **{{< fa bookmark >}} Select View**.
-
-4. Hover over the view you want to modify.
-
-5. When the **{{< fa ellipsis-vertical >}}** appears, click on it to edit the name or description or to delete the view:
-
-    - To edit a view, select **{{< fa pencil >}} Edit View**. Make your edits then click **Save Changes** to apply your adjustments.
-    - To remove a view, select [**{{< fa trash-can >}} Remove View**]{.red}. Click **Yes, Delete View** to confirm permanent deletion of that view.
-
-::::
-
diff --git a/site/guide/inventory/_rename-field-keys.qmd b/site/guide/inventory/_rename-field-keys.qmd
index 487373b087..c72fd1ca25 100644
--- a/site/guide/inventory/_rename-field-keys.qmd
+++ b/site/guide/inventory/_rename-field-keys.qmd
@@ -6,7 +6,7 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 1. When the **{{< fa ellipsis-vertical >}}** appears, click on it and select **{{< fa pen-to-square >}} Rename Key**.
 
-1. Enter in the [new key]{.smallcaps} and click **Check Availability**.
+1. Enter the [new key]{.smallcaps} and click **Check Availability**.
 
 1. If the key is not already in use, you'll be presented with a list of dependencies to review.
 
diff --git a/site/guide/inventory/_save-layout-view.qmd b/site/guide/inventory/_save-layout-view.qmd
deleted file mode 100644
index ea195d16d1..0000000000
--- a/site/guide/inventory/_save-layout-view.qmd
+++ /dev/null
@@ -1,21 +0,0 @@
-<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-Refer to the LICENSE file in the root of this repository for details.
-SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
-
-<!-- COPYRIGHT TEXT MESSES WITH AUTOMATIC RENUMBERING IN INCLUDES -->
-
-2. Click **{{< fa bookmark >}} Save View** to save your first view.
-
-    To add subsequent saved views, click **{{< fa bookmark >}} Select View**.
-
-3. Select **{{< fa bookmark >}} Save New View**.
-
-4. On the Add New View modal that appears, enter the:
-
-    - **[view name]{.smallcaps}**
-    - **[description]{.smallcaps}** (optional)
-
-5. Click **Add New View** to create your saved view.
-
-
-
diff --git a/site/guide/inventory/customize-inventory-layout.qmd b/site/guide/inventory/customize-inventory-layout.qmd
index d5e4eed899..250efa80e5 100644
--- a/site/guide/inventory/customize-inventory-layout.qmd
+++ b/site/guide/inventory/customize-inventory-layout.qmd
@@ -62,38 +62,15 @@ Once customized, you can save views for later application for each type of recor
 
 ### Manage custom inventory views
 
-:::{.callout title="Saved views are unique to you and do not display for other users in your organization."}
-
-While customizations to table views apply across all record types, saving a view only applies to that record type.
-
-:::
-
-::: {.panel-tabset}
-
-#### Save inventory views
-
-
-
-
 You can save custom table configurations as a view to reapply at any time:
 
-1. Customize a table view for the **[record type]{.smallcaps}** you want to save a view for.[^7]
+#### Manage personal inventory views
 
-    You can also apply filters or sorting before saving your view to include them in the view.[^8]
+{{< include /guide/shared/manage-views/_personal-views.qmd >}}
 
-{{< include _save-layout-view.qmd >}}
+#### Manage organization inventory views
 
-#### Edit or remove saved inventory views
-
-::: {.callout-important}
-Deletion of saved views is permanent.
-:::
-
-1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
-
-{{< include _remove-layout-view.qmd >}}
-
-:::
+{{< include /guide/shared/manage-views/_organization-views.qmd >}}
 
 
 <!-- FOOTNOTES -->
@@ -102,14 +79,10 @@ Deletion of saved views is permanent.
 
 [^2]: [Customize table view](#customize-table-view)
 
-[^3]: [Working with the inventory](working-with-the-inventory.qmd)
+[^3]: [Working with the inventory](working-with-the-inventory.qmd#search-filter-and-sort-records)
 
 [^4]: [Swap between views](#swap-between-views)
 
 [^5]: [Manage inventory fields](manage-inventory-fields.qmd)
 
 [^6]: [Manage custom inventory views](#manage-custom-inventory-views)
-
-[^7]: [Customize table view](#customize-table-view)
-
-[^8]: [Working with the inventory](working-with-the-inventory.qmd)
\ No newline at end of file
diff --git a/site/guide/inventory/edit-inventory-fields.qmd b/site/guide/inventory/edit-inventory-fields.qmd
index f9885de76f..5e1b16274e 100644
--- a/site/guide/inventory/edit-inventory-fields.qmd
+++ b/site/guide/inventory/edit-inventory-fields.qmd
@@ -30,13 +30,40 @@ Edit individual detail fields on a record to ensure that record details are accu
 
 2. Under the [record type]{.smallcaps} drop-down, select the type of record you want to edit fields for.[^4]
 
-2. Select a record or find your record by applying a filter or searching for it.[^5]
+3. You can edit fields on individual records, or edit fields on records in bulk for a specific record type:
 
-3. On the record details page, click on an inventory field to make your changes.[^6]
+::: {.panel-tabset}
+
+#### Edit fields on individual records
+
+a. Select a record or find your record by applying a filter or searching for it.[^5]
+
+b. On the record details page, click on an inventory field to make your changes.[^6]
+
+c. Click **Save** to apply your changes.
+
+#### Edit fields in bulk for a specific record type
+
+a. First, make sure you're in table view for the record type you want to edit fields for.[^7]
+
+b. Select the records you want to edit fields for by:
 
-4. Click **Save** to apply your changes.
+    - Clicking {{< fa square >}} in the header column to select all records shown on that page.
+    - Clicking {{< fa square >}} next to a specific record.
 
-Changes you make to inventory fields are automatically logged to that record’s activity.[^7]
+    To view more records for selection, scroll down to the bottom of the table view and click **Next {{< fa arrow-right >}}**.
+
+c. At the bottom of the page, review the count of records selected to verify that the correct number of records are selected for editing, then click **{{< fa pencil >}} Edit**.
+
+d. Make your changes to the inventory fields for the selected records.
+
+e. Click **Continue {#}**, where `{#}` is the number of fields to be edited.
+
+f. Review the changes to be applied to the inventory fields for the selected records to verify that the changes are correct, then click **Save {#} Changes**.
+
+:::
+
+Changes you make to inventory fields are automatically logged to that record’s activity.[^8]
 
 <br>
 
@@ -52,7 +79,7 @@ Changes you make to inventory fields are automatically logged to that record’s
 
 ### Add or remove stakeholders
 
-1. On the record's detail page, click on the inventory record stakeholder type[^8] you'd like to add users to.
+1. On the record's detail page, click on the inventory record stakeholder type[^9] you'd like to add users to.
 
 2. Select your desired users from the drop-down menu.
 
@@ -70,15 +97,15 @@ Changes you make to inventory fields are automatically logged to that record’s
 
 :::: {.content-visible when-format="html" when-meta="includes.pdf-context"}
 ::: {.callout title="Uploaded files must be less than 50 MB each in size."}
-- To work with attachments on records, first add an attachment inventory field.[^9]
-- Select attachments in `.pdf` format as context documents when generating text blocks with AI within your documents.[^10]
+- To work with attachments on records, first add an attachment inventory field.[^10]
+- Select attachments in `.pdf` format as context documents when generating text blocks with AI within your documents.[^11]
 :::
 
 ::::
 
 :::: {.content-visible when-format="html" unless-meta="includes.pdf-context"}
 ::: {.callout title="Uploaded files must be less than 50 MB each in size."}
-To work with attachments on records, first add an attachment inventory field.[^9]
+To work with attachments on records, first add an attachment inventory field.[^10]
 :::
 
 :::: 
@@ -121,14 +148,16 @@ To work with attachments on records, first add an attachment inventory field.[^9
 
     :::
 
-[^7]: [View record activity](view-record-activity.qmd)
+[^7]: [Customize inventory layout](/guide/inventory/customize-inventory-layout.qmd#swap-between-views)
+
+[^8]: [View record activity](view-record-activity.qmd)
 
-[^8]: [Manage record stakeholder types](/guide/configuration/manage-record-stakeholder-types.qmd)
+[^9]: [Manage record stakeholder types](/guide/configuration/manage-record-stakeholder-types.qmd)
 
-[^9]: [Manage inventory fields](manage-inventory-fields.qmd#inventory-field-types)
+[^10]: [Manage inventory fields](manage-inventory-fields.qmd#inventory-field-types)
 
 :::: {.content-visible when-format="html" when-meta="includes.pdf-context"}
-[^10]: [Work with content blocks](/guide/documentation/work-with-content-blocks.qmd#generate-content)
+[^11]: [Work with content blocks](/guide/documentation/work-with-content-blocks.qmd#generate-content)
 
 ::::
 
diff --git a/site/guide/inventory/manage-inventory-fields.qmd b/site/guide/inventory/manage-inventory-fields.qmd
index e9541ad0da..b810431c5c 100644
--- a/site/guide/inventory/manage-inventory-fields.qmd
+++ b/site/guide/inventory/manage-inventory-fields.qmd
@@ -101,7 +101,7 @@ To group inventory fields, first create an inventory field group:
 
 2. Under {{< fa cube >}} Inventory, select **Inventory Record Fields**.
 
-3. Click **{{< fa folder-plus >}} Add Group** and enter in a **[name]{.smallcaps}** and a optional **[description]{.smallcaps}** for the group.
+3. Click **{{< fa folder-plus >}} Add Group** and enter a **[name]{.smallcaps}** and an optional **[description]{.smallcaps}** for the group.
 
 4. Click **Create Group** to add the new group.
 
diff --git a/site/guide/monitoring/enable-monitoring.qmd b/site/guide/monitoring/enable-monitoring.qmd
index 4445972aeb..0b835bec0c 100644
--- a/site/guide/monitoring/enable-monitoring.qmd
+++ b/site/guide/monitoring/enable-monitoring.qmd
@@ -26,7 +26,7 @@ To start uploading ongoing monitoring results for a model to {{< var vm.product
 
 ### 1. Get monitoring code snippet
 
-{{< include /developer/model-documentation/_code-snippet.qmd >}}
+{{< include /developer/quickstart/_code-snippet.qmd >}}
 
 To enable ongoing monitoring for a model, add `monitoring=True` to your code snippet:
 
@@ -93,7 +93,7 @@ b. Confirm that `monitoring=True` is present in the `vm.init` method, similar to
 
    You'll still need to include your document key and the monitoring flag.
 
-   [Store model credentials in `.env` files](/developer/model-documentation/store-credentials-in-env-file.qmd){.button .button-green}
+   [Store model credentials in `.env` files](/developer/quickstart/store-credentials-in-env-file.qmd){.button .button-green}
 
    :::
 
@@ -144,7 +144,7 @@ After you have enabled ongoing monitoring and run your code to generate some out
 
 [^4]: Selecting a **[document]{.smallcaps}** to connect to requires {{< var validmind.developer >}} version >=2.12.0.
 
-[^5]: [Install and initialize the {{< var validmind.developer >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd)
+[^5]: [Install and initialize the {{< var validmind.developer >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd)
 
 [^6]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
 
diff --git a/site/guide/monitoring/ongoing-monitoring.qmd b/site/guide/monitoring/ongoing-monitoring.qmd
index 6bd12dd7d2..e4cb438f01 100644
--- a/site/guide/monitoring/ongoing-monitoring.qmd
+++ b/site/guide/monitoring/ongoing-monitoring.qmd
@@ -27,9 +27,12 @@ listing:
       - ../../notebooks/use_cases/ongoing_monitoring/application_scorecard_ongoing_monitoring.ipynb
       # - ../../notebooks/use_cases/credit_risk/application_scorecard_full_suite.ipynb
   - id: ongoing-monitoring-tests
-    contents: "../../tests/ongoing_monitoring/*.md"
+    contents: 
+    - title: "{{< var vm.product >}} Test Sandbox"
+      description: "Tests that are available as part of the {{< var validmind.developer >}}, grouped by type of validation or monitoring test."
+      path: ../../developer/how-to/test-sandbox.qmd
     type: grid
-    grid-columns: 3
+    grid-columns: 2
     max-description-length: 250
     page-size: 150
     fields: [title, description]  
@@ -37,7 +40,7 @@ listing:
 
 Monitoring of model performance in model risk management involves regularly assessing a model's accuracy, stability, and robustness to ensure it remains reliable after deployment. 
 
-Monitoring is a critical component of model risk management, as emphasized in regulations such as SR 11-7, SS1/23, and E-24,[^1] and includes:
+Monitoring is a critical component of model risk management, as emphasized in regulations such as SR 26-2, SS1/23, and E-23,[^1] and includes:
 
 - Tracking key performance indicators, detecting model drift, recalibrating as needed, and validating assumptions. 
 - Backtesting to verify predictive power, maintaining transparent reporting and governance, and ensuring ongoing compliance with regulatory standards. 
@@ -151,7 +154,7 @@ To try out monitoring, check out the code sample for ongoing monitoring of model
 
 <!-- FOOTNOTES -->
 
-[^1]: [Regulatory requirements](/about/overview-model-risk-management.qmd#regulatory-requirements)
+[^1]: [Regulatory requirements](/about/use-cases/model-risk-management.qmd#regulatory-frameworks)
 
 [^2]: [Working with documentation](/guide/documentation/working-with-documentation.qmd)
 
diff --git a/site/guide/reporting/_create-a-visualization.qmd b/site/guide/reporting/_create-a-visualization.qmd
index 2735588020..a485657a72 100644
--- a/site/guide/reporting/_create-a-visualization.qmd
+++ b/site/guide/reporting/_create-a-visualization.qmd
@@ -13,7 +13,7 @@ a. Click **{{< fa pencil >}} Edit Dashboard**.
 
 a. Select **{{< fa plus >}} Add Widget** then **{{< fa plus >}} Add Visualization**.
 
-a. On the Add Visualization panel, enter in your **[title]{.smallcaps}**.
+a. On the Add Visualization panel, enter your **[title]{.smallcaps}**.
 
 a. Select a **[visualization type]{.smallcaps}**:
 
@@ -37,7 +37,7 @@ a. When you are done configuring your dataset, click **Add Visualization** to in
 :::: {.content-hidden unless-format="revealjs"}
 a. Select **{{< fa plus >}} Add Widget** then **{{< fa plus >}} Add Visualization**.
 
-a. On the Add Visualization panel, enter in your **[title]{.smallcaps}**.
+a. On the Add Visualization panel, enter your **[title]{.smallcaps}**.
 
 a. Select a **[visualization type]{.smallcaps}**:
 
diff --git a/site/guide/reporting/_create-an-analytics-page.qmd b/site/guide/reporting/_create-an-analytics-page.qmd
index 039b26e78d..5a5ee949ac 100644
--- a/site/guide/reporting/_create-an-analytics-page.qmd
+++ b/site/guide/reporting/_create-an-analytics-page.qmd
@@ -6,7 +6,7 @@ a. In the left sidebar, click **{{< fa square-poll-vertical >}} Analytics**.
 
 a. Click **{{< fa plus >}} Add Page**.
 
-a. On the Add New Page module, enter in the:
+a. On the Add New Page module, enter the following:
 
     - **[page name]{.smallcaps}**
     - **[description]{.smallcaps}** (optional)
diff --git a/site/guide/shared/_work-with-filters.qmd b/site/guide/shared/_work-with-filters.qmd
index f98eda71a2..893c54118f 100644
--- a/site/guide/shared/_work-with-filters.qmd
+++ b/site/guide/shared/_work-with-filters.qmd
@@ -44,7 +44,7 @@ Value editor
 :::: {.content-visible when-format="html" when-meta="includes.inventory"}
 - **[record information]{.smallcaps}** — One of the inventory record fields always created by {{< var vm.product >}}, such as the Business Unit.
 - **[stakeholders]{.smallcaps}** — Record Owner, Record Developer, or Record Validator, or custom stakeholders if applicable.
-- **[record fields]{.smallcaps}** — One of the organization-specific inventory record fields you added for your own use.
+- **[record fields]{.smallcaps}** — One of the organization-specific inventory record fields you added for your own use, by field group.
 
 ::::
 
@@ -55,11 +55,22 @@ Value editor
 
 ::::
 
-:::: {.content-visible when-format="html" when-meta="includes.workflows"}
+:::: {.content-visible when-format="html" when-meta="includes.workflow.setup"}
 - **[workflow fields]{.smallcaps}** — Workflow properties, such as the workflow status, trigger, workflow target (type of workflow), or target type (subcategory of workflow target).
 
 ::::
 
+:::: {.content-visible when-format="html" when-meta="includes.workflow.view"}
+::: {.pl4 .pr3}
+Inventory
+
+- **[record information]{.smallcaps}** — One of the inventory record fields always created by {{< var vm.product >}}, such as the Business Unit.
+- **[stakeholders]{.smallcaps}** — Record Owner, Record Developer, or Record Validator, or custom stakeholders if applicable.
+- **[record fields]{.smallcaps}** — One of the organization-specific inventory record fields you added for your own use, by field group.
+:::
+
+::::
+
 :::: {.content-visible when-format="html" when-meta="includes.all"}
 :::: {.columns}
 
@@ -68,7 +79,7 @@ Value editor
 
 - **[record information]{.smallcaps}** — One of the inventory record fields always created by {{< var vm.product >}}, such as the Business Unit.
 - **[stakeholders]{.smallcaps}** — Record Owner, Record Developer, or Record Validator, or custom stakeholders if applicable.
-- **[record fields]{.smallcaps}** — One of the organization-specific inventory record fields you added for your own use.
+- **[record fields]{.smallcaps}** — One of the organization-specific inventory record fields you added for your own use, by field group.
 :::
 
 ::: {.column width="50%" .pl4 .pr3}
@@ -83,15 +94,28 @@ Value editor
 
 ::::
 
-::: {.column width="100%" .pl4 .pr3}
-[Workflow Filters]{.small-text}
+:::: {.columns}
 
-- **[workflow fields]{.smallcaps}** — Workflow properties, such as the workflow status, trigger, workflow target (type of workflow), or target type (subcategory of workflow target).
+::: {.column width="50%" .pl4 .pr2}
+[Workflow View Filters]{.small-text}
 
+Inventory
+
+- **[record information]{.smallcaps}** — One of the inventory record fields always created by {{< var vm.product >}}, such as the Business Unit.
+- **[stakeholders]{.smallcaps}** — Record Owner, Record Developer, or Record Validator, or custom stakeholders if applicable.
+- **[record fields]{.smallcaps}** — One of the organization-specific inventory record fields you added for your own use, by field group.
+:::
+
+::: {.column width="50%" .pl4 .pr3}
+[Workflow Setup Filters]{.small-text}
+
+- **[workflow fields]{.smallcaps}** — Workflow properties, such as the workflow status, trigger, workflow target (type of workflow), or target type (subcategory of workflow target).
 :::
 
 ::::
 
+::::
+
 
 3. From the operator dropdown, select one of:<br>[Available operators update based on the field selector]{.small-text}
 
diff --git a/site/guide/shared/manage-views/_organization-views.qmd b/site/guide/shared/manage-views/_organization-views.qmd
new file mode 100644
index 0000000000..1c866adb5a
--- /dev/null
+++ b/site/guide/shared/manage-views/_organization-views.qmd
@@ -0,0 +1,74 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+::: {.callout}
+To publish a saved personal view to your organization, you must have permissions to manage shared workflow timeline views.^[[Manage permissions](/guide/configuration/manage-permissions.qmd)]
+:::
+
+::: {.panel-tabset}
+
+### Share views with your organization
+
+:::: {.content-visible when-format="html" when-meta="includes.workflow.view"}
+1. Save a personal workflow timeline view.^[[Manage personal timeline views](/guide/workflows/working-with-workflows.qmd#manage-personal-timeline-views)]
+
+::::
+
+:::: {.content-visible when-format="html" when-meta="includes.inventory"}
+1. Save a personal inventory view.^[[Manage personal inventory views](/guide/inventory/customize-inventory-layout.qmd#manage-personal-inventory-views)]
+
+::::
+
+:::: {.content-visible when-format="html" when-meta="includes.artifacts"}
+1. Save a personal artifact view.^[[Manage personal artifact views](/guide/validation/customize-artifact-layouts.qmd#manage-personal-artifact-views)]
+
+::::
+
+2. Select **My Views (#)**.
+
+3. Click on the name of your saved view, or **{{< fa bookmark >}} Select View** if you are not currently displaying a saved view.
+
+4. Hover over the name of the view you want to share with your organization.
+
+5. When the **{{< fa ellipsis-vertical >}}** appears, click on it and select **{{< fa upload >}} Publish to Organization**.
+
+6. (Optional) Edit the [view name]{.smallcaps} and [description]{.smallcaps} for your shared view.
+
+7. Click **{{< fa upload >}} Publish View** to share your view with your organization.
+
+### Unshare or remove saved organization views
+
+#### Unshare saved organization views
+
+To unshare a saved organization view:
+
+1. Click on the name of your saved view, or **{{< fa bookmark >}} Select View** if you are not currently displaying a saved view.
+
+2. Select **Organization (#)**.
+
+3. Hover over the view you want to remove from shared organization access.
+
+4. When the **{{< fa ellipsis-vertical >}}** appears, click on it and select **{{< fa download >}} Unpublish**.
+
+5. Click **Yes, Unpublish View** to confirm removal of the view from shared organization access.
+
+#### Remove saved organization views
+
+To remove a saved organization view:
+
+::: {.callout-important}
+Deletion of saved views is permanent.
+:::
+
+1. Click on the name of your saved view, or **{{< fa bookmark >}} Select View** if you are not currently displaying a saved view.
+
+2. Select **Organization (#)**.
+
+3. Hover over the view you want to remove from your organization.
+
+4. When the **{{< fa ellipsis-vertical >}}** appears, click on it and select **{{< fa trash-can >}} Remove View**.
+
+5. Click **Yes, Remove View** to confirm permanent deletion of that view.
+
+:::
\ No newline at end of file
diff --git a/site/guide/shared/manage-views/_personal-views.qmd b/site/guide/shared/manage-views/_personal-views.qmd
new file mode 100644
index 0000000000..3d81b810e4
--- /dev/null
+++ b/site/guide/shared/manage-views/_personal-views.qmd
@@ -0,0 +1,96 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+::: {.panel-tabset}
+
+### Save personal views
+
+:::: {.content-visible when-format="html" when-meta="includes.workflow.view"}
+1. Apply a search or filters to the workflow timeline.^[[View all workflow executions](/guide/workflows/working-with-workflows.qmd#view-all-workflow-executions)]
+
+::::
+
+:::: {.content-visible when-format="html" when-meta="includes.inventory"}
+1. Customize a table view for the **[record type]{.smallcaps}** you want to save a view for.^[[Customize table view](/guide/inventory/customize-inventory-layout.qmd#customize-table-view)]
+
+    You can also apply filters or sorting before saving your view to include them in the view.^[[Working with the inventory](/guide/inventory/working-with-the-inventory.qmd)]
+
+::::
+
+:::: {.content-visible when-format="html" when-meta="includes.artifacts"}
+1. First, customize an artifact layout.^[[Customize artifact layouts by type](/guide/validation/customize-artifact-layouts.qmd#customize-artifact-layouts-by-type)]
+
+   You can also apply filters or sorting before saving your view to include them in the view.^[[View and filter artifacts](/guide/validation/view-filter-artifacts.qmd#filter-and-sort-artifacts)]
+
+::::
+
+2. Click on the name of your saved view, or **{{< fa bookmark >}} Select View** if you are not currently displaying a saved view.
+
+3. Select **My Views (#)** and click on **{{< fa bookmark >}} Save New View** to create your saved view.
+
+4. Enter the **[view name]{.smallcaps}** and **[description]{.smallcaps}** for your saved view.
+
+5. Click **Add New View** to save your view.
+
+:::: {.content-visible when-format="html" when-meta="includes.workflow.view"}
+Once you've created a saved personal view, you can share it with others in your organization.^[[Manage organization workflow timeline views](/guide/workflows/working-with-workflows.qmd#manage-organization-timeline-views)]
+
+::::
+
+:::: {.content-visible when-format="html" when-meta="includes.inventory"}
+Once you've created a saved personal view, you can share it with others in your organization.^[[Manage organization inventory views](/guide/inventory/customize-inventory-layout.qmd#manage-organization-inventory-views)]
+
+::::
+
+:::: {.content-visible when-format="html" when-meta="includes.artifacts"}
+Once you've created a saved personal view, you can share it with others in your organization.^[[Manage organization artifact views](/guide/validation/customize-artifact-layouts.qmd#manage-organization-artifact-views)]
+
+::::
+
+
+### Edit or remove saved personal views
+
+::: {.callout-important}
+Deletion of saved views is permanent.
+:::
+
+:::: {.content-visible when-format="html" unless-meta="includes.artifacts"}
+
+1. Click on the name of your saved view, or **{{< fa bookmark >}} Select View** if you are not currently displaying a saved view.
+
+2. Select **My Views (#)**.
+
+3. Hover over the name of the view you want to edit or remove.
+
+4. When the **{{< fa ellipsis-vertical >}}** appears, click on it and select:
+
+    - **{{< fa pencil >}} Edit View** to edit the [view name]{.smallcaps} and [description]{.smallcaps}. Click **Save Changes** to apply your edits.
+    - [**{{< fa trash-can >}} Remove View**]{.red} to delete the view. Click **Yes, Delete View** to confirm permanent deletion of that view.
+
+::::
+
+
+:::: {.content-visible when-format="html" when-meta="includes.artifacts"}
+#### Edit or remove validation issue views
+
+To modify a saved validation issues view:
+
+1. In the left sidebar, click **{{< fa triangle-exclamation >}} Validation Issues** for a list of validation issues across all records.
+
+{{< include /guide/validation/_remove-artifact-view.qmd >}}
+
+#### Edit or remove all other artifact type views
+
+To modify a saved view for all other artifact types:
+
+1. In the left sidebar, click **{{< fa border-all >}} Artifacts** for lists of other artifact types across all records, then select an artifact type^[[Manage artifact types](/guide/validation/manage-artifact-types.qmd)] for a list of that artifact type:
+
+      - Policy Exception
+      - Limitation
+
+{{< include /guide/validation/_remove-artifact-view.qmd >}}
+
+::::
+
+:::
\ No newline at end of file
diff --git a/site/guide/templates/_add-assessment-questions.qmd b/site/guide/templates/_add-assessment-questions.qmd
index 8838206a42..87d2b971c6 100644
--- a/site/guide/templates/_add-assessment-questions.qmd
+++ b/site/guide/templates/_add-assessment-questions.qmd
@@ -9,7 +9,7 @@ Manually add assessment questions, or generate questions from a PDF upload for D
 
 a. Click **{{< fa plus >}} Add Question** to create a new question.
 
-a. Enter in the **[questions]{.smallcaps}**:
+a. Enter the **[questions]{.smallcaps}**:
 
     - Each line without a break (enter) is considered one complete question.^[Empty lines will be ignored.]
     - To add a separate question, press enter to start a new line.
@@ -44,7 +44,7 @@ Select the assessment you want to add questions to by clicking on it:
 
 1. Click **{{< fa plus >}} Add Question** to create a new question.
 
-1. Enter in the **[questions]{.smallcaps}**:
+1. Enter the **[questions]{.smallcaps}**:
 
     - Each line without a break (enter) is considered one complete question. Empty lines will be ignored.
     - To add a separate question, press enter to start a new line.
diff --git a/site/guide/templates/_customize-document-templates.qmd b/site/guide/templates/_customize-document-templates.qmd
index e94cd2314e..1f37129c2e 100644
--- a/site/guide/templates/_customize-document-templates.qmd
+++ b/site/guide/templates/_customize-document-templates.qmd
@@ -96,7 +96,7 @@ Customize {{< var vm.product >}}'s templates for documents to fit your specific
 
 1.  Under {{< fa file >}} Documents, select **Templates**.
 
-1. Select one of the tabs for the [type of template you want to edit](/guide/templates/manage-document-types.qmd){target="blank"}.
+1. Select one of the tabs for the [type of template you want to edit](/guide/templates/manage-document-types.qmd){target="_blank"}.
 
 1. Click the template to edit and on the template details page, select **{{< fa pencil >}} Edit Outline**. 
 
diff --git a/site/guide/templates/_duplicate-template.qmd b/site/guide/templates/_duplicate-template.qmd
index 41aa0abacc..f2f3c0420f 100644
--- a/site/guide/templates/_duplicate-template.qmd
+++ b/site/guide/templates/_duplicate-template.qmd
@@ -34,7 +34,7 @@ To duplicate an existing template and start with version one of that new templat
 
 1.  Under {{< fa file >}} Documents, select **Templates**.
 
-1. Select one of the tabs for the [type of template you want to duplicate](/guide/templates/working-with-documents.qmd){target="blank"}.
+1. Select one of the tabs for the [type of template you want to duplicate](/guide/templates/working-with-documents.qmd){target="_blank"}.
 
 1. Click on the template to duplicate and on the template details page, select **{{< fa copy >}} Duplicate Template**. 
 
diff --git a/site/guide/templates/_template-schema-generated.qmd b/site/guide/templates/_template-schema-generated.qmd
index 62b8a5efb4..3256ea27cc 100644
--- a/site/guide/templates/_template-schema-generated.qmd
+++ b/site/guide/templates/_template-schema-generated.qmd
@@ -1137,7 +1137,7 @@ Source: backend/src/backend/templates/documentation/model_documentation/mdd_temp
     </div>
 
     <footer>
-        <p class="generated-by-footer">Generated using <a href="https://github.com/coveooss/json-schema-for-humans">json-schema-for-humans</a> on 2026-04-28 at 19:22:39 -0700</p>
+        <p class="generated-by-footer">Generated using <a href="https://github.com/coveooss/json-schema-for-humans">json-schema-for-humans</a> on 2026-05-22 at 13:46:20 -0700</p>
     </footer></div></body>
 </html>
 ```
diff --git a/site/guide/templates/_view-document-templates.qmd b/site/guide/templates/_view-document-templates.qmd
index f374270c08..a2bc6d93ea 100644
--- a/site/guide/templates/_view-document-templates.qmd
+++ b/site/guide/templates/_view-document-templates.qmd
@@ -65,7 +65,7 @@ To review the existing templates available to your organization:
 
 1.  Under {{< fa file >}} Documents, select **Templates**.
 
-1. Select one of the tabs for [the document type with the templates you want to view](/guide/templates/working-with-documents.qmd){target="blank"}.
+1. Select one of the tabs for [the document type with the templates you want to view](/guide/templates/working-with-documents.qmd){target="_blank"}.
 
 1. Select one of the available templates to view detailed information about the template.
 
diff --git a/site/guide/templates/_what-is-document-checker.qmd b/site/guide/templates/_what-is-document-checker.qmd
index bb20d68bee..34206792f1 100644
--- a/site/guide/templates/_what-is-document-checker.qmd
+++ b/site/guide/templates/_what-is-document-checker.qmd
@@ -46,7 +46,7 @@ As a compliance tool, the {{< var validmind.checker >}} is most useful when your
 
 By default, {{< var vm.product >}} supports the following regulations:
 
-- Federal Reserve Supervisory Letter SR 11-7 (United States)
+- Federal Reserve Supervisory Letter SR 26-2 (United States)
 - Bank of England Prudential Regulation Authority (PRA) Supervisory Statement SS1/23 (United Kingdom)
 - Office of the Superintendent of Financial Institutions (OSFI) Guideline E-23 (Canada)
 - European Union Artificial Intelligence Act (Regulation (EU) 2024/1689, EU AI Act)
diff --git a/site/guide/templates/customize-document-checker.qmd b/site/guide/templates/customize-document-checker.qmd
index 2ff9e2bccc..535c206cf0 100644
--- a/site/guide/templates/customize-document-checker.qmd
+++ b/site/guide/templates/customize-document-checker.qmd
@@ -139,7 +139,7 @@ d. Once cloned, add or edit the assessment questions.[^3]
 ### Edit assessment questions
 
 ::: {.callout title="How do I locate a specific question?"}
-Click **{{<fa magnifying-glass >}} Search** to enter in your keywords, then press **Search** to narrow down results.
+Click **{{< fa magnifying-glass >}} Search** to enter your keywords, then press **Search** to narrow down results.
 :::
 
 a. Hover over the question you want to edit.
diff --git a/site/guide/templates/manage-document-types.qmd b/site/guide/templates/manage-document-types.qmd
index d8def7e441..dfc5752195 100644
--- a/site/guide/templates/manage-document-types.qmd
+++ b/site/guide/templates/manage-document-types.qmd
@@ -34,7 +34,7 @@ These stock document types cannot be deleted, only edited:
 
 3. Click **{{< fa plus >}} Add Document Type**.
 
-4. Enter in the document type details:
+4. Enter the document type details:
 
     - Provide a **[name]{.smallcaps}** and an optional **[description]{.smallcaps}**.
     - Toggle whether this document type should be automatically created **[when record is registered]{.smallcaps}**.
diff --git a/site/guide/templates/manage-documents.qmd b/site/guide/templates/manage-documents.qmd
index 001220bb4a..d06e02b407 100644
--- a/site/guide/templates/manage-documents.qmd
+++ b/site/guide/templates/manage-documents.qmd
@@ -31,7 +31,7 @@ Add or delete documents available on individual records in your inventory.
 
 4. Click **{{< fa plus >}} Create Document**.
 
-5. Enter in the document details:
+5. Enter the document details:
 
     - **[document title]{.smallcaps}** — Title of your document.[^7]
     - **[document type]{.smallcaps}**[^8] — The type of your document.
diff --git a/site/guide/validation/_add-artifacts-on-documentation.qmd b/site/guide/validation/_add-artifacts-on-documentation.qmd
index 6018aa579d..ecd4c4fe44 100644
--- a/site/guide/validation/_add-artifacts-on-documentation.qmd
+++ b/site/guide/validation/_add-artifacts-on-documentation.qmd
@@ -23,32 +23,26 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 1. On the modal that opens, provide information for your artifact.
 
-1. When you are done, click **Save** to submit the artifact.
+1. When you are done, click **Add {Artifact Type}**, where `{Artifact Type}` is the artifact type you are adding, to submit the artifact.
 
    Once created, you can then add supporting documentation to your artifact.^[[Manage attachments on artifacts](/guide/validation/add-manage-artifacts.qmd#manage-attachments)]
 
 ::::
 
 :::: {.content-hidden unless-format="revealjs"}
-1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
-
-1. Select a record or [find your record by applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="_blank"}.
-
-1. In the left sidebar that appears for your record, click **Development** under {{< fa file >}} Documents.
+a. In the left sidebar that appears for your record, click **Development** under {{< fa file >}} Documents.
 
-    <!-- Either log an artifact on this overview page, or via a specific documentation section. Both methods will allow you to associate an artifact with a documentation section.  -->
-
-1. On your record's documentation page, click **{{< fa plus >}} Add Artifact**.
+b. On your record's documentation page, click **{{< fa plus >}} Add Artifact**.
 
-1. Select the [artifact type](/guide/validation/manage-artifact-types.qmd){target="_blank"} you want to add:
+c. Select the [artifact type](/guide/validation/manage-artifact-types.qmd){target="_blank"} you want to add:
 
    - Validation Issue
    - Policy Exception
    - Limitation
 
-1. On the modal that opens, provide information for your artifact.
+d. On the modal that opens, provide information for your artifact.
 
-1. When you are done, click **Save** to submit the artifact. 
+e. When you are done, click **Add {Artifact Type}**, where `{Artifact Type}` is the artifact type you are adding, to submit the artifact.
 
    Once created, you can then [add supporting documentation to your artifact](/guide/validation/add-manage-artifacts.qmd#manage-attachments){target="_blank"}.
 
diff --git a/site/guide/validation/_add-edit-artifact-statuses.qmd b/site/guide/validation/_add-edit-artifact-statuses.qmd
index 79fb4e0dd4..25797b00e9 100644
--- a/site/guide/validation/_add-edit-artifact-statuses.qmd
+++ b/site/guide/validation/_add-edit-artifact-statuses.qmd
@@ -8,7 +8,7 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 a. Click **{{< fa plus >}} Add Status**.
 
-b. Enter in a **[status name]{.smallcaps}** and assign a **[color]{.smallcaps}** to your artifact status.
+b. Enter a **[status name]{.smallcaps}** and assign a **[color]{.smallcaps}** to your artifact status.
 
 c. When you are done, click **Add Status** to create your new status.
 
@@ -36,7 +36,7 @@ Artifact statuses cannot be deleted if in use on an artifact. Ensure that the st
 
 a. Click **{{< fa plus >}} Add Status**.
 
-b. Enter in a **[status name]{.smallcaps}** and assign a **[color]{.smallcaps}** to your artifact status.
+b. Enter a **[status name]{.smallcaps}** and assign a **[color]{.smallcaps}** to your artifact status.
 
 c. When you are done, click **Add Status** to create your new status.
 
diff --git a/site/guide/validation/_add-edit-artifact-types.qmd b/site/guide/validation/_add-edit-artifact-types.qmd
index 7f52899cd1..de814dd5b1 100644
--- a/site/guide/validation/_add-edit-artifact-types.qmd
+++ b/site/guide/validation/_add-edit-artifact-types.qmd
@@ -11,13 +11,13 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 3. Click **{{< fa plus >}} Add Artifact Type**.
 
-4. Enter in a [name]{.smallcaps} and an optional [description]{.smallcaps} for your artifact type.
+4. Enter a [name]{.smallcaps} and an optional [description]{.smallcaps} for your artifact type.
 
 5. Click **Create** to create your new artifact type.
 
 6. Click on your newly created artifact type to edit its details and permissions.
 
-7. Enter in the artifact type's details:
+7. Enter the artifact type's details:
 
     - **[fields]{.smallcaps}** — Select the default artifact fields that should appear on this type of artifact and click **Save Fields** to apply your changes.[^add-fields-callout]
     - **[record fields display]{.smallcaps}**[^add-record-fields-config] — Select which upstream record fields^[[Edit inventory fields](/guide/inventory/edit-inventory-fields.qmd)] to display as read-only under the Inventory Record Information section on artifacts of this type and click **Save Record Fields Configuration** to apply your changes.
@@ -95,7 +95,7 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 a. Click **{{< fa plus >}} Add Artifact Type**.
 
-b. Enter in a [name]{.smallcaps} and an optional [description]{.smallcaps} for your artifact type.
+b. Enter a [name]{.smallcaps} and an optional [description]{.smallcaps} for your artifact type.
 
 c. Click **Create** to create your new artifact type.
 
diff --git a/site/guide/validation/_assess-evidence-for-compliance.qmd b/site/guide/validation/_assess-evidence-for-compliance.qmd
new file mode 100644
index 0000000000..c6c25d79a2
--- /dev/null
+++ b/site/guide/validation/_assess-evidence-for-compliance.qmd
@@ -0,0 +1,188 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+:::: {.content-visible unless-format="revealjs"}
+## Assess evidence for compliance
+
+:::: {.column-margin}
+![Assess Evidence panel](/guide/validation/assess-evidence-panel.png){fig-alt="Assess Evidence panel showing option to identify potential risks and compliance gaps based on linked evidence." .screenshot}
+::::
+
+Assess Evidence uses AI to analyze the linked evidence and generate a structured compliance assessment, identifying potential risks and compliance gaps.
+
+1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
+
+2. Select a record or find your record by applying a filter or searching for it.^[[Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)]
+
+3. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select the **Latest** tab.^[[Work with document versions](/guide/documentation/work-with-document-versions.qmd)]
+
+4. Click on a Validation type file.^[[Preparing validation reports](/guide/validation/preparing-validation-reports.qmd#validation-overview)]
+
+5. You can assess evidence for compliance at three levels:
+
+::: {.panel-tabset}
+
+#### For the entire report
+
+Click **{{< fa wand-magic-sparkles >}} Assess Evidence** in the right sidebar to expand the evidence assessment panel for the entire report.
+
+#### For an entire section
+
+Sections include subsections with guidelines, and a risk assessment summary at the top of the page.
+
+a. Click on a section of the validation report to expand that section.
+b. Click **{{< fa wand-magic-sparkles >}} Assess Evidence** at the top of the page to open the evidence assessment panel for that section.
+
+#### For individual guidelines
+
+Guidelines are organized into subsections under a parent section.
+
+a. Click on a section of the validation report to expand that section.
+b. In any subsection, click **{{< fa wand-magic-sparkles >}} Assess Evidence** to open the evidence assessment panel for that guideline.
+
+:::
+
+6. Click **Assess Evidence** to run an analysis on the linked evidence and generate an Evidence Assessment containing:
+
+   - **Guideline Assessment** — A compliance conclusion indicating whether the guideline requirements are fully met, partially met, or not met, with an explanation of the evidence quality.
+   - **Validation Observations** — Specific findings about gaps or issues in the evidence, with each observation covering a single concern and suggesting actions for developers.
+   - **Evidence Review** — A detailed analysis of what the evidence demonstrates, including references to specific test outputs, documentation, and any limitations.
+
+   If this is your first time running Assess Evidence, review the information presented to you explaining the assessment process, then click **Assess Evidence** to run the assessment.^[To hide the additional information on the assessment modal for future runs, select the **Don't show this again** checkbox.]
+
+When evidence assessment is complete, the [#]{.bubble} of assessment items to review is displayed. Review the assessment items and approve or reject the suggestions as needed.
+
+### Review and approve evidence assessments
+
+After running Assess Evidence, you can review and approve assessments at three levels:
+
+::: {.panel-tabset}
+
+#### For the entire report
+
+If you have run evidence assessment for the entire report, you can review and approve suggestions at the entire report level.
+
+The **{{< fa wand-magic-sparkles >}} Assess Evidence** panel in the right sidebar for your validation report shows how many items need review across the entire report — click to expand the panel if it is collapsed:
+
+   - Select **[{{< fa check >}} Approve All]{.green}** to link all suggested assessments across all guidelines, or **[{{< fa xmark >}} Reject All]{.red}** to dismiss all suggestions.
+      - Click into any section of the report with approved assessments to confirm that any approved assessments appear in the Evidence Assessment panel for guidelines as expected.
+   - To re-run the assessment, click **{{< fa sync >}} Reassess Evidence**.
+
+#### For an entire section
+
+Sections include subsections with guidelines, and a risk assessment summary at the top of the page. If you have run evidence assessment for an entire section, you can review and approve suggestions at the section level:
+
+a. Click on a section of the validation report to expand that section.
+
+b. Click **{{< fa wand-magic-sparkles >}} Assess Evidence** at the top of the page to open the evidence assessment panel for that section:
+
+   - Select **[{{< fa check >}} Approve All]{.green}** to link all suggested assessments for guidelines in that section, or **[{{< fa xmark >}} Reject All]{.red}** to dismiss all section suggestions.
+      - Confirm that any approved assessments appear in the Evidence Assessment panels for the guidelines in that section as expected.
+   - To re-run the assessment, click **{{< fa sync >}} Reassess Evidence**.
+
+#### For individual guidelines
+
+Guidelines are organized into subsections under a parent section. If you have run evidence assessment for an individual guideline, you can review and approve suggestions at the guideline level:
+
+a. Click on a section of the validation report to expand that section.
+
+b. In any subsection, click **Evidence Assessment** to expand the evidence assessment panel for that guideline:
+
+   - Click **[{{< fa check >}} Approve]{.green}** to approve the assessment.
+   - Click **[{{< fa xmark >}} Reject]{.red}** to dismiss the assessment.
+   - To re-run the assessment, click **{{< fa wand-magic-sparkles >}} Reassess Evidence**.
+
+:::
+
+::::
+
+
+:::: {.content-hidden unless-format="revealjs"}
+Assess Evidence uses AI to analyze the linked evidence and generate a structured compliance assessment, identifying potential risks and compliance gaps.
+
+1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
+
+2. Select a record or find your record by [applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="_blank"}.
+
+3. In the left sidebar that appears for your record, click **Validation** under **{{< fa file >}} Documents**.
+
+4. You can assess evidence for compliance at three levels:
+
+::: {.panel-tabset}
+
+#### For the entire report
+
+Click **{{< fa wand-magic-sparkles >}} Assess Evidence** in the right sidebar to expand the evidence assessment panel for the entire report.
+
+#### For an entire section
+
+Sections include subsections with guidelines, and a risk assessment summary at the top of the page.
+
+a. Click on a section of the validation report to expand that section.
+b. Click **{{< fa wand-magic-sparkles >}} Assess Evidence** at the top of the page to open the evidence assessment panel for that section.
+
+#### For individual guidelines
+
+Guidelines are organized into subsections under a parent section.
+
+a. Click on a section of the validation report to expand that section.
+b. In any subsection, click **{{< fa wand-magic-sparkles >}} Assess Evidence** to open the evidence assessment panel for that guideline.
+
+:::
+
+5. Click **Assess Evidence** to run an analysis on the linked evidence and generate an Evidence Assessment containing:
+
+   - **Guideline Assessment** — A compliance conclusion indicating whether the guideline requirements are fully met, partially met, or not met, with an explanation of the evidence quality.
+   - **Validation Observations** — Specific findings about gaps or issues in the evidence, with each observation covering a single concern and suggesting actions for developers.
+   - **Evidence Review** — A detailed analysis of what the evidence demonstrates, including references to specific test outputs, documentation, and any limitations.
+
+   If this is your first time running Assess Evidence, review the information presented to you explaining the assessment process, then click **Assess Evidence** to run the assessment.
+
+When evidence assessment is complete, the [#]{.bubble} of assessment items to review is displayed. Review the assessment items and approve or reject the suggestions as needed.
+
+#### Review and approve evidence assessments
+
+After running Assess Evidence, you can review and approve assessments at three levels:
+
+::: {.panel-tabset}
+
+#### For the entire report
+
+If you have run evidence assessment for the entire report, you can review and approve suggestions at the entire report level.
+
+The **{{< fa wand-magic-sparkles >}} Assess Evidence** panel in the right sidebar for your validation report shows how many items need review across the entire report — click to expand the panel if it is collapsed:
+
+   - Select **[{{< fa check >}} Approve All]{.green}** to link all suggested assessments across all guidelines, or **[{{< fa xmark >}} Reject All]{.red}** to dismiss all suggestions.
+      - Click into any section of the report with approved assessments to confirm that any approved assessments appear in the Evidence Assessment panel for guidelines as expected.
+   - To re-run the assessment, click **{{< fa sync >}} Reassess Evidence**.
+
+#### For an entire section
+
+Sections include subsections with guidelines, and a risk assessment summary at the top of the page. If you have run evidence assessment for an entire section, you can review and approve suggestions at the section level:
+
+a. Click on a section of the validation report to expand that section.
+
+b. Click **{{< fa wand-magic-sparkles >}} Assess Evidence** at the top of the page to open the evidence assessment panel for that section:
+
+   - Select **[{{< fa check >}} Approve All]{.green}** to link all suggested assessments for guidelines in that section, or **[{{< fa xmark >}} Reject All]{.red}** to dismiss all section suggestions.
+      - Confirm that any approved assessments appear in the Evidence Assessment panels for the guidelines in that section as expected.
+   - To re-run the assessment, click **{{< fa sync >}} Reassess Evidence**.
+
+#### For individual guidelines
+
+Guidelines are organized into subsections under a parent section. If you have run evidence assessment for an individual guideline, you can review and approve suggestions at the guideline level:
+
+a. Click on a section of the validation report to expand that section.
+
+b. In any subsection, click **Evidence Assessment** to expand the evidence assessment panel for that guideline:
+
+   - Click **[{{< fa check >}} Approve]{.green}** to approve the assessment.
+   - Click **[{{< fa xmark >}} Reject]{.red}** to dismiss the assessment.
+   - To re-run the assessment, click **{{< fa wand-magic-sparkles >}} Reassess Evidence**.
+
+:::
+
+::::
+
+
diff --git a/site/guide/validation/_provide-compliance-assessments.qmd b/site/guide/validation/_assign-compliance-assessments.qmd
similarity index 52%
rename from site/guide/validation/_provide-compliance-assessments.qmd
rename to site/guide/validation/_assign-compliance-assessments.qmd
index ad5456259d..f4a5c61660 100644
--- a/site/guide/validation/_provide-compliance-assessments.qmd
+++ b/site/guide/validation/_assign-compliance-assessments.qmd
@@ -2,6 +2,8 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
+After you have mapped and assessed available evidence, and generated or attached relevant artifacts, assign compliance assessments to each subsection of your validation report:
+
 :::: {.content-visible unless-format="revealjs"}
 ::: {.callout title="Assessment options available for selection depend on configuration for individual validation report templates."}
 Your organization can customize these options to match its own assessment framework, or choose to remove them from templates entirely.^[[Configure assessment options](/guide/validation/configure-assessment-options.qmd)]
@@ -15,32 +17,29 @@ Your organization can customize these options to match its own assessment framew
 
 1. Click on a Validation type file.^[[Preparing validation reports](/guide/validation/preparing-validation-reports.qmd#validation-overview)]
 
-   Expand any subsection of the validation report you would like to work with.
-
-1. In any section of the documentation where the **[assessment]{.smallcaps}** dropdown menu is available, select one of the available assessment options.
+   Expand any subsection of the validation report you have attached evidence and artifacts for.
 
-   Confirm that the compliance summary shown for each subsection provides an accurate overview for current qualitative and quantitative risk assessments.
+1. Under Guideline, click **Select a value for this guideline** to choose one of the available Assessment options.
 
-1. Click under **Risk Assessment Notes** to add your risk assessment notes for that section using the content editing toolbar.^[[Work with content blocks](/guide/documentation/work-with-content-blocks.qmd#content-editing-toolbar)]
+   At the top of the page for that subsection, confirm that the compliance summary shown provides an accurate overview of the current qualitative and quantitative risk assessments.
 
 ::::
 
 :::: {.content-hidden unless-format="revealjs"}
-1. In the same Class Imbalance Assessment sub-section above the Risk Assessment Notes, locate the Guideline with the **[assessment]{.smallcaps}** drop-down.
+1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
-1. Select one of the available assessment options.
+2. Select a record or find your record [by applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="_blank"}.
 
-1. Confirm that the compliance summary shown for each subsection under 2. Validation provides an accurate overview for current qualitative and quantitative risk assessments:
+3. In the left sidebar that appears for your record, click **Validation** under **{{< fa file >}} Documents**.
 
-   <!-- THIS SCREENSHOT NEEDS TO BE UPDATED -->
-   ![Risk assessment compliance summary](/guide/validation/assess-compliance-summary.png){fig-alt="A screenshot of the risk assessment compliance summary" .screenshot group="compliance"}
+   Expand any subsection of the validation report you have attached evidence and artifacts for.
 
-:::: {.pa3 .mt3 .f5 .embed}
-**Assessment options available for selection depend on configuration for individual validation report templates.**
+4. Under Guideline, click **Select a value for this guideline** to choose one of the available Assessment options.
 
-Your organization can customize these options to match its own assessment framework, or choose to remove them from templates entirely.
+   At the top of the page for that subsection, confirm that the compliance summary shown provides an accurate overview of the current qualitative and quantitative risk assessments:
 
-:::
+   <!-- THIS SCREENSHOT NEEDS TO BE UPDATED -->
+   ![Risk assessment compliance summary](/guide/validation/assess-compliance-summary.png){fig-alt="A screenshot of the risk assessment compliance summary" .screenshot group="compliance"}
 
 
 ::::
diff --git a/site/guide/validation/_autogenerate-validation-issues.qmd b/site/guide/validation/_autogenerate-validation-issues.qmd
index 013d19ecf3..805bd861a0 100644
--- a/site/guide/validation/_autogenerate-validation-issues.qmd
+++ b/site/guide/validation/_autogenerate-validation-issues.qmd
@@ -2,39 +2,111 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-After you complete your risk assessment notes for a validation guideline, you can use AI to automatically suggest validation issues based on the gaps identified in your assessment.
+<!-- VISIBLE IN USER GUIDES ONLY -->
+
+::::: {.content-visible unless-format="revealjs"}
+
+::: {.callout-important title="AI suggestions require review!"}
+Always review AI-generated validation issues before approving them. The suggestions are based on patterns in your risk assessment notes and may need adjustment to accurately reflect your findings.
 
-::: {.callout title="This feature requires AI features to be enabled for your organization."}
-Contact your administrator if you don't see the **Suggest Validation Issues** option.
 :::
 
-1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
+Use AI to automatically suggest validation issues based on the gaps identified in your assessment:^[This feature requires AI capabilities to be enabled for your organization — contact an administrator if you cannot access the **{{< fa wand-magic-sparkles >}} Suggest Validation Issues** interface.]
 
-1. Select a record or find your record by applying a filter or searching for it.^[[Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)]
+a. In the Artifacts section under your evidence, click **{{< fa wand-magic-sparkles >}} Suggest Validation Issues**.
 
-1. In the left sidebar, click **Validation** to open the validation report.
+b. Click **Suggest Validation Issues** to have {{< var vm.product >}} analyze your risk assessment notes along with the guideline context and identify any gaps that warrant validation issues.
 
-1. Expand any subsection of the validation report and complete your **Risk Assessment Notes** for a guideline.
+c. Review the suggested validation issues. Each suggestion includes:
 
-1. Click **{{< fa wand-magic-sparkles >}} Suggest Validation Issues** next to the guideline you assessed.
+   - A proposed title and description outlining the issue
+   - A preliminary severity level based on the identified gap
+   - A proposed remediation plan
 
-   The AI analyzes your risk assessment notes along with the guideline context to identify any gaps that warrant validation issues.
+   Click **See more {{< fa chevron-down >}}** on each suggested issue to expand for more details.
 
-1. Review the suggested validation issues:
+d. Approve, reject, or regenerate the suggested validation issues:
 
-   Each suggestion includes:
+   ::: {.panel-tabset}
 
-   - A proposed title describing the issue
-   - A severity level based on the identified gap
-   - Recommended remediation actions
+   #### Approve/reject individual issues
 
-1. For each suggested issue, choose one of the following actions:
+   Under each individual issue:
 
    - Click **{{< fa check >}} Approve** to create the validation issue and link it to your report.
-   - Click **{{< fa xmark >}} Dismiss** to reject the suggestion if it doesn't apply.
+   - Click **{{< fa xmark >}} Reject** to reject the suggestion if it doesn't apply.
 
-1. After approving a validation issue, you can further customize it by clicking on the issue to edit fields such as owner, due date, and status.^[[Add and manage artifacts](/guide/validation/add-manage-artifacts.qmd)]
+   #### Approve/reject all issues
 
-::: {.callout-important title="AI suggestions require review"}
-Always review AI-generated validation issues before approving them. The suggestions are based on patterns in your risk assessment notes and may need adjustment to accurately reflect your findings.
+   Click **{{< fa wand-magic-sparkles >}} Suggest Validation Issues [#]{.bubble}** and select:
+
+   - **{{< fa check >}} Approve All** to approve all suggested issues at once.
+   - **{{< fa xmark >}} Reject All** to reject all suggested issues at once.
+
+   #### Regenerate new suggestions
+
+   Click **{{< fa wand-magic-sparkles >}} Suggest Validation Issues [#]{.bubble}** and select **{{< fa sync >}} Regenerate Issues**.
+
+   :::
+
+:::: {.content-visible when-format="html" when-meta="includes.compliance"}
+e. After approving a validation issue, you can further customize it by clicking on the issue to edit fields such as owner, due date, and status.^[[Add and manage artifacts](/guide/validation/add-manage-artifacts.qmd)]
+
+::::
+
+:::: {.content-visible when-format="html" unless-meta="includes.compliance"}
+e. After approving a validation issue, you can further customize it by clicking on the issue to edit fields such as owner, due date, and status.
+
+::::
+
+
+:::::
+
+<!-- VISIBLE IN TRAINING SLIDES ONLY -->
+
+::::: {.content-hidden unless-format="revealjs"}
+
+:::: {.mb2 .mr4 .pa3 .f5 .embed}
+- **Always review AI-generated validation issues before approving them.** The suggestions are based on patterns in your risk assessment notes and may need adjustment to accurately reflect your findings.
+- This feature requires AI capabilities to be enabled for your organization. Contact an administrator if you cannot access the **{{< fa wand-magic-sparkles >}} Suggest Validation Issues** interface.
 :::
+
+You can of course log artifacts manually on your validation report, but you can also use AI to automatically suggest validation issues based on the gaps identified in your assessment:
+
+a. In the left sidebar that appears for your record, click **Validation** under {{< fa file >}} Documents.
+
+b. In the Artifacts section under your evidence, click **{{< fa wand-magic-sparkles >}} Suggest Validation Issues**.
+
+c. Click **Suggest Validation Issues** to have {{< var vm.product >}} analyze your risk assessment notes along with the guideline context and identify any gaps that warrant validation issues.
+
+d. Review the suggested validation issues. Each suggestion includes:
+
+   - A proposed title and description outlining the issue
+   - A preliminary severity level based on the identified gap
+   - A proposed remediation plan
+
+   Click **See more {{< fa chevron-down >}}** on each suggested issue to expand for more details.
+
+e. Approve, reject, or regenerate the suggested validation issues:
+
+   #### Approve/reject individual issues
+
+   Under each individual issue:
+
+   - Click **{{< fa check >}} Approve** to create the validation issue and link it to your report.
+   - Click **{{< fa xmark >}} Reject** to reject the suggestion if it doesn't apply.
+
+   #### Approve/reject all issues
+
+   Click **{{< fa wand-magic-sparkles >}} Suggest Validation Issues [#]{.bubble}** and select:
+
+   - **{{< fa check >}} Approve All** to approve all suggested issues at once.
+   - **{{< fa xmark >}} Reject All** to reject all suggested issues at once.
+
+   #### Regenerate new suggestions
+
+   Click **{{< fa wand-magic-sparkles >}} Suggest Validation Issues [#]{.bubble}** and select **{{< fa sync >}} Regenerate Issues**.
+
+f. After approving a validation issue, you can further customize it by clicking on the issue to edit fields such as owner, due date, and status.
+
+:::::
diff --git a/site/guide/validation/_how-does-mapping-assessment-work.qmd b/site/guide/validation/_how-does-mapping-assessment-work.qmd
new file mode 100644
index 0000000000..51d68dd44b
--- /dev/null
+++ b/site/guide/validation/_how-does-mapping-assessment-work.qmd
@@ -0,0 +1,47 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+
+:::: {.content-visible unless-format="revealjs"}
+## How does automatic evidence mapping and assessment work?
+
+Validation reports require you to link supporting evidence to each guideline and write compliance assessments, a process that can be time-consuming when done manually across dozens of guidelines.
+
+Map Evidence
+: Scans all available evidence from developers and validators, then suggests which items are relevant to each guideline. Instead of searching through evidence blocks yourself, you review AI-suggested matches and approve the ones that apply. Each suggestion includes a relevance score and explanation so you can make informed decisions.
+
+Assess Evidence
+: Analyzes the linked evidence for a guideline and drafts a structured compliance assessment. The generated assessment includes a compliance conclusion, specific observations about gaps or issues, and a technical review of what the evidence demonstrates. You review and approve the draft, and then make edits if needed — saving time while maintaining control over the final content.
+
+Both features are designed to accelerate validation without replacing your judgment. You always review and approve suggestions before they become part of the report.
+
+::::
+
+<!-- VISIBLE IN TRAINING SLIDES ONLY -->
+
+:::: {.content-hidden unless-format="revealjs"}
+#### How does automatic evidence mapping and assessment work?
+
+Validation reports require you to link supporting evidence to each guideline and write compliance assessments, a process that can be time-consuming when done manually across dozens of guidelines.
+
+::: {.panel-tabset}
+
+#### Map Evidence
+Scans all available evidence from developers and validators, then suggests which items are relevant to each guideline. Instead of searching through evidence blocks yourself, you review AI-suggested matches and approve the ones that apply. Each suggestion includes a relevance score and explanation so you can make informed decisions.
+
+#### Assess Evidence
+Analyzes the linked evidence for a guideline and drafts a structured compliance assessment. The generated assessment includes a compliance conclusion, specific observations about gaps or issues, and a technical review of what the evidence demonstrates. You review and approve the draft, and then make edits if needed — saving time while maintaining control over the final content.
+
+:::
+
+:::: {.mt4 .f4 .pa2 .embed}
+Both features are designed to accelerate validation without replacing your judgment. You always review and approve suggestions before they become part of the report.
+
+:::
+
+
+::::
+
+
+
diff --git a/site/guide/validation/_link-artifacts-to-reports.qmd b/site/guide/validation/_link-artifacts-to-reports.qmd
index d4df471212..5020d2b7b7 100644
--- a/site/guide/validation/_link-artifacts-to-reports.qmd
+++ b/site/guide/validation/_link-artifacts-to-reports.qmd
@@ -3,58 +3,58 @@ Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 :::: {.content-visible unless-format="revealjs"}
-1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
+a. Under your evidence, click **Artifacts** to expand the artifacts panel.
 
-1. Select a record or find your record by applying a filter or searching for it.^[[Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)]
-
-1. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select the **Latest** tab.^[[Work with document versions](/guide/documentation/work-with-document-versions.qmd)]
-
-1. Click on a Validation type file.^[[Preparing validation reports](/guide/validation/preparing-validation-reports.qmd#validation-overview)]
-
-1. Expand any subsection of the validation report you would like to work with.
-
-1. In any section of the report where the button is available, click **{{< fa link >}} Link Artifact to Report** and select the artifact type^[[Manage artifact types](/guide/validation/manage-artifact-types.qmd)] you want to add:
+b. Click **{{< fa link >}} Link Artifact** and select the artifact type^[[Manage artifact types](/guide/validation/manage-artifact-types.qmd)] you want to add:
 
    - Validation Issue
    - Policy Exception
    - Limitation
 
-1. On the **Link Artifact to Report** modal that opens, select from the list of available artifacts, or click **{{< fa plus >}} Update Linked Artifacts**.^[[Add and manage artifacts](/guide/validation/add-manage-artifacts.qmd#add-artifacts-on-validation-reports)]
+c. On the Link Artifact to Report modal that opens:
 
-1. Click **Update Linked Artifacts**.
+   - Select from the list of available artifacts.
+   - To create a new artifact, click **{{< fa plus >}} Add {Artifact Type}**, where `{Artifact Type}` is the artifact type you want to add,[^create-artifact] then select the new artifact from the list.
 
-   Confirm that newly linked artifact shown under Artifacts is accurate.
+d. Click **Update Linked Artifacts**.
+
+   Confirm that the newly linked artifacts shown under Artifacts are accurate.
 
 ::::
 
+<!-- ADDITIONAL FOOTNOTES: -->
 
-:::: {.content-hidden unless-format="revealjs"}
-1. From the **{{< fa cubes >}} Inventory** in the ValidMind Platform, go to the record you connected to earlier.
+[^create-artifact]:
 
-1. In the left sidebar that appears for your record, click **Validation** under {{< fa file >}} Documents.
+   1. Click **{{< fa plus >}} Add {Artifact Type}**, where `{Artifact Type}` is the type of artifact you want to create.
+   2. Enter the details for your artifact.
+   3. Click **Add {Artifact Type}** to submit the artifact.
+
+:::: {.content-hidden unless-format="revealjs"}
+1. From the **{{< fa cubes >}} Inventory** in the {{< var validmind.platform >}}, go to the model you connected to earlier.
 
-1. Locate the Data Preparation section and click on **2.2.2. Model Performance** to expand that section.
+1. In the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
 
-1. Under the Model Performance Metrics section, locate Artifacts then click **Link Artifact to Report**.
+1. Click **2.2.2. Model Performance** to expand that section.
 
-1. Select **Validation Issue** as the [type of artifact](/guide/validation/manage-artifact-types.qmd){target="_blank"}.
+1. Under the Model Performance Metrics guideline, click to expand the **Artifacts** panel.
 
-1. Click **{{< fa plus >}} Add Validation Issue** to add a validation issue type artifact.
+1. Click **{{< fa link >}} Link Artifact** and select **Validation Issue** as the [type of artifact](/guide/validation/manage-artifact-types.qmd){target="_blank"}.
 
-1. Enter in the details for your validation issue, for example:
+1. Click **{{< fa plus >}} Add Validation Issue** and enter the details for your validation issue, for example:
 
     - **[title]{.smallcaps}** — Champion Logistic Regression Model Fails Minimum Accuracy Threshold
     - **[risk area]{.smallcaps}** — Model Performance
     - **[documentation section]{.smallcaps}** — 3.2. Model Evaluation
     - **[description]{.smallcaps}** — The logistic regression champion model was subjected to a Minimum Accuracy test to determine whether its predictive accuracy meets the predefined performance threshold of 0.7. The model achieved an accuracy score of 0.6136, which falls below the required minimum. As a result, the test produced a Fail outcome.
 
-1. Click **Save**.
+1. Click **Add Validation Issue** to submit the validation issue.
 
 1. Select the validation issue you just added to link to your validation report.
 
 1. Click **Update Linked Artifacts** to insert your validation issue.
 
-1. Confirm that validation issue you inserted has been correctly inserted into section **2.2.2. Model Performance**  of the report.
+1. Confirm that the validation issue you added has been correctly inserted into section **2.2.2. Model Performance** of the report.
 
 1. Click on the validation issue to expand the issue, where you can adjust details such as severity, owner, due date, status, etc. as well as include proposed remediation plans or supporting documentation as attachments.
 
diff --git a/site/guide/validation/_link-validator-evidence.qmd b/site/guide/validation/_link-validator-evidence.qmd
deleted file mode 100644
index fb243d9ae4..0000000000
--- a/site/guide/validation/_link-validator-evidence.qmd
+++ /dev/null
@@ -1,68 +0,0 @@
-<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-Refer to the LICENSE file in the root of this repository for details.
-SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
-
-:::: {.content-visible unless-format="revealjs"}
-::: {.callout}
-To link validator evidence to a report, you must first log tests as a validator with the {{< var validmind.developer >}}.^[[{{< var validmind.developer >}}](/developer/validmind-library.qmd)]
-:::
-
-1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
-
-1. Select a record or find your record by applying a filter or searching for it.^[[Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)]
-
-1. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select the **Latest** tab.^[[Work with document versions](/guide/documentation/work-with-document-versions.qmd)]
-
-1. Click on a Validation type file.^[[Preparing validation reports](/guide/validation/preparing-validation-reports.qmd#validation-overview)]
-
-   You can now expand any subsection of the validation report you would like to work with.
-
-1. In any section of the report where the button is available, click **{{< fa link >}} Link Evidence to Report**. 
-
-1. On the **Link Validator Evidence to Validation Document** page that opens, select the evidence that is related to your assessment. 
-   
-   If you are not sure if something is relevant, you can expand the section by clicking **{{< fa chevron-down >}}** for more details.
-
-1. Click **Update Linked Evidence**.
-
-   - Confirm that the newly linked-to evidence shown under Developer Evidence is accurate.
-   - Evidence that needs your attention gets flagged with [{{< fa triangle-exclamation >}} Requires Attention]{.bubble .yellow-bg}. These sections get flagged automatically whenever a test result is above or below a certain threshold.
-
-::::
-
-
-:::: {.content-hidden unless-format="revealjs"}
-With some test results logged, let's head to the record we connected to at the beginning of this notebook and insert our test results into the validation report as evidence.
-
-While the example below focuses on a specific test result, you can follow the same general procedure for your other results:
-
-::: {.panel-tabset}
-
-### 1. Link data quality test results
-a. From the **{{< fa cubes >}} Inventory** in the {{< var validmind.platform >}}, go to the record you connected to earlier.
-
-a. In the left sidebar that appears for your record, click **Validation** under {{< fa file >}} Documents.
-
-a. Locate the Data Preparation section and click on **2.2.1. Data Quality** to expand that section.
-
-a. Under the Class Imbalance Assessment section, locate Validator Evidence then click **Link Evidence to Report**.
-
-a. Select the Class Imbalance test results we logged: **ValidMind Data Validation Class Imbalance** 
-
-    ![The ClassImbalance tests selected](/notebooks/tutorials/model_validation/selecting-class-imbalance-results.png){fig-alt="Screenshot showing the ClassImbalance tests selected" .screenshot}
-
-a. Click **Update Linked Evidence** to add the test results to the validation report.
-
-    Confirm that the results for the Class Imbalance test you inserted has been correctly inserted into section **2.2.1. Data Quality** of the report.
-
-### 2. Review Class Imbalance test results
-
-- Once linked as evidence to section **2.2.1. Data Quality** note that the ValidMind Data Validation Class Imbalance test results are flagged as **Requires Attention** — as they include comparative results from our initial raw dataset.
-- Click **See evidence details** to review the LLM-generated description that summarizes the test results, that confirm that our final preprocessed dataset actually passes our test:
-
-  ![ClassImbalance test generated description in the text editor](/notebooks/tutorials/model_validation/class-imbalance-results-detail.png){fig-alt="Screenshot showing the ClassImbalance test generated description in the text editor" .screenshot}
-
-:::
-
-
-::::
\ No newline at end of file
diff --git a/site/guide/validation/_map-evidence-to-guidelines.qmd b/site/guide/validation/_map-evidence-to-guidelines.qmd
new file mode 100644
index 0000000000..659b50b5d1
--- /dev/null
+++ b/site/guide/validation/_map-evidence-to-guidelines.qmd
@@ -0,0 +1,234 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+:::: {.content-visible unless-format="revealjs"}
+## Map evidence to guidelines
+
+:::: {.column-margin}
+![Map Evidence panel](map-evidence-panel.png){fig-alt="Map Evidence panel showing evidence type toggles for Developer Evidence and Validator Evidence, and a Relevance Threshold slider set to 0.7." .screenshot}
+::::
+
+Map Evidence uses AI to suggest relevant evidence for each validation guideline, helping you find and link supporting documentation from both developers and validators.
+
+1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
+
+2. Select a record or find your record by applying a filter or searching for it.^[[Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)]
+
+3. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select the **Latest** tab.^[[Work with document versions](/guide/documentation/work-with-document-versions.qmd)]
+
+4. Click on a Validation type file.^[[Preparing validation reports](/guide/validation/preparing-validation-reports.qmd#validation-overview)]
+
+5. You can map evidence at three levels:
+
+::: {.panel-tabset}
+
+#### For the entire report
+
+Click **{{< fa wand-magic-sparkles >}} Map Evidence** in the right sidebar to expand the mapping panel for the entire report.
+
+#### For an entire section
+
+Sections include subsections with guidelines, and a risk assessment summary at the top of the page.
+
+a. Click on a section of the validation report to expand that section.
+b. Click **{{< fa wand-magic-sparkles >}} Map Evidence** at the top of the page to open the mapping panel for that section.
+
+#### For individual guidelines
+
+Guidelines are organized into subsections under a parent section.
+
+a. Click on a section of the validation report to expand that section.
+b. In any subsection, click **{{< fa wand-magic-sparkles >}} Map Evidence** to open the mapping panel for that guideline.
+
+:::
+
+6. Configure the mapping options:
+
+   - Use the **[evidence type]{.smallcaps}** toggles to include evidence from the selected types:
+      - **Developer Evidence** — Include evidence logged on the Development document associated with the record.^[[Manage document types](/guide/templates/manage-document-types.qmd)]
+      - **Validator Evidence** — Include evidence logged on the current validation report.
+   - Adjust the **[relevance threshold]{.smallcaps}** slider — lower values return more results while higher values show only the most relevant matches.
+
+7. Click **Map Evidence** to start the mapping.
+
+   If this is your first time running Map Evidence, review the information presented to you explaining the mapping process, then click **Map Evidence** to run the mapping.^[To hide the modal with additional mapping information on future runs, select the **Don't show this again** checkbox.]
+
+When mapping is complete, the [#]{.bubble} of evidence items to review is displayed. Review the evidence items and approve or reject the suggestions as needed.
+
+### Review and approve mapped evidence
+
+After running Map Evidence, you can review and approve suggestions at four levels:
+
+::: {.panel-tabset}
+
+#### For the entire report
+
+If you have run mapping for the entire report, you can review and approve suggestions at the entire report level.
+
+The **{{< fa wand-magic-sparkles >}} Map Evidence** panel in the right sidebar for your validation report shows how many items need review across the entire report — click to expand the panel if it is collapsed:
+
+   - Select **[{{< fa check >}} Approve All]{.green}** to link all suggested evidence across all guidelines, or **[{{< fa xmark >}} Reject All]{.red}** to dismiss all suggestions.
+      - Click into any section of the report with approved mapped evidence to confirm that any approved evidence appears in the Evidence panel for guidelines as expected.
+   - To re-run mapping with different settings, click **{{< fa sync >}} Remap Evidence**.
+      - (Optional) Adjust the relevance threshold or change which evidence types to include, then generate new suggestions.
+
+#### For an entire section
+
+Sections include subsections with guidelines, and a risk assessment summary at the top of the page. If you have run mapping for an entire section, you can review and approve suggestions at the section level:
+
+a. Click on a section of the validation report to expand that section.
+
+b. Click **{{< fa wand-magic-sparkles >}} Map Evidence** at the top of the page to open the mapping panel for that section:
+
+   - Select **[{{< fa check >}} Approve All]{.green}** to link all suggested evidence for guidelines in that section, or **[{{< fa xmark >}} Reject All]{.red}** to dismiss all section suggestions.
+      - Confirm that any approved evidence appears in the Evidence panels for the guidelines in that section as expected.
+   - To re-run mapping with different settings, click **{{< fa sync >}} Remap Evidence**.
+      - (Optional) Adjust the relevance threshold or change which evidence types to include, then generate new suggestions.
+
+#### For individual guidelines
+
+Guidelines are organized into subsections under a parent section. If you have run mapping for an individual guideline, you can review and approve suggestions at the guideline level:
+
+a. Click on a section of the validation report to expand that section.
+
+b. In any subsection, click **{{< fa wand-magic-sparkles >}} Map Evidence** to open the mapping panel for that guideline:
+
+   - Select **[{{< fa check >}} Approve All]{.green}** to link all suggested evidence for that guideline, or **[{{< fa xmark >}} Reject All]{.red}** to dismiss all guideline suggestions.
+      - Confirm that any approved evidence appears in the Evidence panel for that guideline as expected.
+   - To re-run mapping with different settings, click **{{< fa sync >}} Remap Evidence**.
+      - (Optional) Adjust the relevance threshold or change which evidence types to include, then generate new suggestions.
+
+#### For individual suggestions
+
+If you have run mapping at any level, you can review and approve suggestions individually:
+
+a. Click on a section of the validation report to expand that section.
+
+b. In any subsection, click **Evidence** to expand the evidence panel for that guideline.
+
+c. Review individual evidence suggestions on the **Developer Evidence** or **Validator Evidence** tabs:
+
+   - Each item shows the evidence block name and a relevance score.
+   - Click **See Relevance Analysis** to view why the evidence was suggested.
+   - Click **[{{< fa check >}} Approve]{.green}** to link an individual item to the guideline.
+   - Click **[{{< fa xmark >}} Reject]{.red}** to dismiss an individual suggestion.
+
+d. Confirm that any approved evidence appears in the Evidence panel for that guideline as expected.
+
+:::
+
+::::
+
+
+
+:::: {.content-hidden unless-format="revealjs"}
+Map Evidence uses AI to suggest relevant evidence for each validation guideline, helping you find and link supporting documentation from both developers and validators.
+
+1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
+
+2. Select a record or find your record by [applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="_blank"}.
+
+3. In the left sidebar that appears for your record, click **Validation** under **{{< fa file >}} Documents**.
+
+4. You can map evidence at three levels:
+
+::: {.panel-tabset}
+
+#### For the entire report
+
+Click **{{< fa wand-magic-sparkles >}} Map Evidence** in the right sidebar to expand the mapping panel for the entire report.
+
+#### For an entire section
+
+Sections include subsections with guidelines, and a risk assessment summary at the top of the page.
+
+a. Click on a section of the validation report to expand that section.
+b. Click **{{< fa wand-magic-sparkles >}} Map Evidence** at the top of the page to open the mapping panel for that section.
+
+#### For individual guidelines
+
+Guidelines are organized into subsections under a parent section.
+
+a. Click on a section of the validation report to expand that section.
+b. In any subsection, click **{{< fa wand-magic-sparkles >}} Map Evidence** to open the mapping panel for that guideline.
+
+:::
+
+5. Configure the mapping options:
+
+   - Use the **[evidence type]{.smallcaps}** toggles to include evidence from the selected types:
+      - **Developer Evidence** — Include evidence logged on the [Development document associated with the record](/guide/templates/manage-document-types.qmd){target="_blank"}.
+      - **Validator Evidence** — Include evidence logged on the current validation report.
+   - Adjust the **[relevance threshold]{.smallcaps}** slider — lower values return more results while higher values show only the most relevant matches.
+
+6. Click **Map Evidence** to start the mapping.
+
+   If this is your first time running Map Evidence, review the information presented to you explaining the mapping process, then click **Map Evidence** to run the mapping.
+
+When mapping is complete, the [#]{.bubble} of evidence items to review is displayed. Review the evidence items and approve or reject the suggestions as needed.
+
+#### Review and approve mapped evidence
+
+After running Map Evidence, you can review and approve suggestions at four levels:
+
+::: {.panel-tabset}
+
+#### For the entire report
+
+If you have run mapping for the entire report, you can review and approve suggestions at the entire report level.
+
+The **{{< fa wand-magic-sparkles >}} Map Evidence** panel in the right sidebar for your validation report shows how many items need review across the entire report — click to expand the panel if it is collapsed:
+
+   - Select **[{{< fa check >}} Approve All]{.green}** to link all suggested evidence across all guidelines, or **[{{< fa xmark >}} Reject All]{.red}** to dismiss all suggestions.
+      - Click into any section of the report with approved mapped evidence to confirm that any approved evidence appears in the Evidence panel for guidelines as expected.
+   - To re-run mapping with different settings, click **{{< fa sync >}} Remap Evidence**.
+      - (Optional) Adjust the relevance threshold or change which evidence types to include, then generate new suggestions.
+
+#### For an entire section
+
+Sections include subsections with guidelines, and a risk assessment summary at the top of the page. If you have run mapping for an entire section, you can review and approve suggestions at the section level:
+
+a. Click on a section of the validation report to expand that section.
+
+b. Click **{{< fa wand-magic-sparkles >}} Map Evidence** at the top of the page to open the mapping panel for that section:
+
+   - Select **[{{< fa check >}} Approve All]{.green}** to link all suggested evidence for guidelines in that section, or **[{{< fa xmark >}} Reject All]{.red}** to dismiss all section suggestions.
+      - Confirm that any approved evidence appears in the Evidence panels for the guidelines in that section as expected.
+   - To re-run mapping with different settings, click **{{< fa sync >}} Remap Evidence**.
+      - (Optional) Adjust the relevance threshold or change which evidence types to include, then generate new suggestions.
+
+#### For individual guidelines
+
+Guidelines are organized into subsections under a parent section. If you have run mapping for an individual guideline, you can review and approve suggestions at the guideline level:
+
+a. Click on a section of the validation report to expand that section.
+
+b. In any subsection, click **{{< fa wand-magic-sparkles >}} Map Evidence** to open the mapping panel for that guideline:
+
+   - Select **[{{< fa check >}} Approve All]{.green}** to link all suggested evidence for that guideline, or **[{{< fa xmark >}} Reject All]{.red}** to dismiss all guideline suggestions.
+      - Confirm that any approved evidence appears in the Evidence panel for that guideline as expected.
+   - To re-run mapping with different settings, click **{{< fa sync >}} Remap Evidence**.
+      - (Optional) Adjust the relevance threshold or change which evidence types to include, then generate new suggestions.
+
+#### For individual suggestions
+
+If you have run mapping at any level, you can review and approve suggestions individually:
+
+a. Click on a section of the validation report to expand that section.
+
+b. In any subsection, click **Evidence** to expand the evidence panel for that guideline.
+
+c. Review individual evidence suggestions on the **Developer Evidence** or **Validator Evidence** tabs:
+
+   - Each item shows the evidence block name and a relevance score.
+   - Click **See Relevance Analysis** to view why the evidence was suggested.
+   - Click **[{{< fa check >}} Approve]{.green}** to link an individual item to the guideline.
+   - Click **[{{< fa xmark >}} Reject]{.red}** to dismiss an individual suggestion.
+
+d. Confirm that any approved evidence appears in the Evidence panel for that guideline as expected.
+
+:::
+
+::::
+
diff --git a/site/guide/validation/_remove-artifact-view.qmd b/site/guide/validation/_remove-artifact-view.qmd
new file mode 100644
index 0000000000..6fa4ae1767
--- /dev/null
+++ b/site/guide/validation/_remove-artifact-view.qmd
@@ -0,0 +1,14 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+2. Click on the name of your saved view, or **{{< fa bookmark >}} Select View** if you are not currently displaying a saved view.
+
+3. Select **My Views (#)**.
+
+4. Hover over the name of the view you want to edit or remove.
+
+5. When the **{{< fa ellipsis-vertical >}}** appears, click on it and select:
+
+    - **{{< fa pencil >}} Edit View** to edit the [view name]{.smallcaps} and [description]{.smallcaps}. Click **Save Changes** to apply your edits.
+    - [**{{< fa trash-can >}} Remove View**]{.red} to delete the view. Click **Yes, Delete View** to confirm permanent deletion of that view.
\ No newline at end of file
diff --git a/site/guide/validation/add-manage-artifacts.qmd b/site/guide/validation/add-manage-artifacts.qmd
index 0e7a43aac7..13e709f57b 100644
--- a/site/guide/validation/add-manage-artifacts.qmd
+++ b/site/guide/validation/add-manage-artifacts.qmd
@@ -1,4 +1,4 @@
-   ---
+---
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
@@ -32,7 +32,7 @@ Add artifacts at the record or documentation section level, update your artifact
 
 ## Add artifacts on validation reports
 
-When linking artifacts to validation reports,[^5] you can add artifacts as you assess a record's compliance:
+While assessing a record's compliance,[^5] you can add artifacts as you complete your validation report:
 
 1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
@@ -42,23 +42,27 @@ When linking artifacts to validation reports,[^5] you can add artifacts as you a
 
 4. Click on a Validation type file.[^8]
 
-5. In any section of the report where the button is available, click **{{< fa link >}} Link Artifact to Report** and select the artifact type[^9] you want to add:
+   Expand any subsection of the validation report that you have attached evidence to, then autogenerate validation issues or manually link artifacts to your report:
+
+::: {.panel-tabset}
+
+### Autogenerate validation issues
 
-   - Validation Issue
-   - Policy Exception
-   - Limitation
+{{< include _autogenerate-validation-issues.qmd >}}
 
-6. On the Link Artifact to Report modal that opens, click **{{< fa plus >}} Add {Artifact Type}**.
+### Manually add artifacts
+
+{{< include _link-artifacts-to-reports.qmd >}}
+
+:::
 
-7. On the modal that opens, provide information for your artifact.
 
-8. When you are done, click **Add {Artifact Type}** to submit the artifact.
 
 ## Update artifacts
 
 As artifacts get resolved or require other changes during the validation process, you can update them:
 
-1. Locate the artifact you want to update.[^10]
+1. Locate the artifact you want to update.[^9]
 
 2. Click on a field to make changes.
 
@@ -101,16 +105,16 @@ Uploaded files must be less than 50 MB each in size.
 ## Delete artifacts
 
 ::: {.callout-important title="Artifact deletion is permanent."}
-- While artifact deletion will be logged under your {{< fa wifi >}} Activity,[^11] deleted artifacts cannot be retrieved.
-- Deleting an artifact will also remove it from any validation reports[^12] it was previously attached to.
+- While artifact deletion will be logged under your {{< fa wifi >}} Activity,[^10] deleted artifacts cannot be retrieved.
+- Deleting an artifact will also remove it from any validation reports[^11] it was previously attached to.
 
 :::
 
 If you logged an artifact in error or otherwise no longer need to track that artifact, you can delete it:
 
-1. Locate the artifact you want to delete.[^13]
+1. Locate the artifact you want to delete.[^12]
 
-2. On the artifact's detail page, click **{{< fa trash-can>}} Delete {Artifact Type}**[^14] in the right sidebar.
+2. On the artifact's detail page, click **{{< fa trash-can>}} Delete {Artifact Type}**[^13] in the right sidebar.
 
 3. Click **Yes, Delete {Artifact Type}** to confirm permanent deletion of that artifact.
 
@@ -125,7 +129,7 @@ If you logged an artifact in error or otherwise no longer need to track that art
 
 [^4]: [Manage permissions](/guide/configuration/manage-permissions.qmd)
 
-[^5]: [Link artifacts to reports](/guide/validation/assess-compliance.qmd#link-artifacts-to-reports)
+[^5]: [Assess compliance](/guide/validation/assess-compliance.qmd#link-artifacts-to-reports)
 
 [^6]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
 
@@ -133,14 +137,12 @@ If you logged an artifact in error or otherwise no longer need to track that art
 
 [^8]: [Preparing validation reports](/guide/validation/preparing-validation-reports.qmd#validation-overview)
 
-[^9]: [Manage artifact types](manage-artifact-types.qmd)
-
-[^10]: [View and filter artifacts](view-filter-artifacts.qmd)
+[^9]: [View and filter artifacts](view-filter-artifacts.qmd)
 
-[^11]: [View record activity](/guide/inventory/view-record-activity.qmd)
+[^10]: [View record activity](/guide/inventory/view-record-activity.qmd)
 
-[^12]: [Link artifacts to reports](/guide/validation/assess-compliance.qmd#link-artifacts-to-reports)
+[^11]: [Link artifacts to reports](/guide/validation/assess-compliance.qmd#link-artifacts-to-reports)
 
-[^13]: [View and filter artifacts](view-filter-artifacts.qmd)
+[^12]: [View and filter artifacts](view-filter-artifacts.qmd)
 
-[^14]: [Manage artifact types](manage-artifact-types.qmd)
\ No newline at end of file
+[^13]: [Manage artifact types](manage-artifact-types.qmd)
\ No newline at end of file
diff --git a/site/guide/validation/assess-compliance.qmd b/site/guide/validation/assess-compliance.qmd
index e87cb793d1..b882ad7b74 100644
--- a/site/guide/validation/assess-compliance.qmd
+++ b/site/guide/validation/assess-compliance.qmd
@@ -7,6 +7,8 @@ date: last-modified
 aliases:
   - /guide/assess-compliance.html
   - /guide/model-validation/assess-compliance.html
+includes:
+  compliance: true
 ---
 
 Use the {{< var validmind.platform >}} to assess compliance of your records with guidelines based on analyzing evidence and artifacts.
@@ -15,8 +17,7 @@ Compliance assessments provide an unbiased starting point that enables more effi
 
 1. [Link evidence to reports](#link-evidence-to-reports)
 2. [Link artifacts to reports](#link-artifacts-to-reports)
-3. [Autogenerate validation issues](#autogenerate-validation-issues)
-4. [Provide compliance assessments](#provide-compliance-assessments)
+3. [Assign compliance assessments](#assign-compliance-assessments)
 
 ::: {.callout title="Compliance assessments cannot be performed within static PDF documents."}
 You can only assess compliance within PDFs converted to editable documents,[^1] validation reports generated by the {{< var validmind.developer >}}, or validation reports created in the {{< var validmind.platform >}}.
@@ -41,9 +42,7 @@ Use {{< var vm.product >}}'s AI-assisted tools to automate mapping and assessing
 
 :::
 
-### Link developer evidence
-
-To link evidence logged by developers^[[{{< var validmind.developer >}}](/developer/validmind-library.qmd)] to your validation report:
+Include sections from other documents and logged test results as evidence in your validation report, then assess the linked evidence for compliance:
 
 1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
@@ -55,33 +54,98 @@ To link evidence logged by developers^[[{{< var validmind.developer >}}](/develo
 
    Expand any subsection of the validation report you would like to work with.
 
-5. In any section of the report where the button is available, click **{{< fa link >}} Link Developer Evidence**.
+5. Link evidence to reports in two steps:
+   a. [Map evidence](#map-evidence)
+   b. [Assess evidence](#assess-evidence)
+
+### a. Map evidence
+<span id="map-evidence"></span>
+
+1. In any section of the report where linking evidence is available, click **Evidence** to expand the evidence panel.
+
+2. Click **{{< fa link >}} Link Evidence** and select the [evidence type]{.smallcaps}:
+
+   ::: {.panel-tabset}
+
+   #### Developer Evidence
+
+   Select evidence logged on Development, Monitoring, or custom document types attached to the record:
+
+   i. Select **Developer Evidence** as the [evidence type]{.smallcaps}.
+   ii. In the left sidebar, click on the document you want to include evidence from.
+   iii. In the right panel, check off the content blocks and/or test results you want to include as evidence:[^10]
+      - Expand a section by clicking **{{< fa chevron-down >}}** to review any sub-sections.
+      - If you are not sure if a block is relevant, click on a block to preview the contents.
+      - To include all blocks in a section, check off the section header.
+   iv. When you are ready to insert the evidence, click **Update Linked Evidence**.
+
+   #### Validator Evidence
+
+   Select evidence logged on the same Validation report:[^11]
 
-6. On the **Link Developer Evidence to Validation Document** page that opens, select the evidence that is related to your assessment.
+   i. Select **Validator Evidence** as the [evidence type]{.smallcaps}.
+   ii. Check off the test results you want to include as evidence.
+      If you are not sure if a test result is relevant, click on a test result to preview the contents.
+   iii. When you are ready to insert the evidence, click **Update Linked Evidence**.
 
-   - Available evidence is associated with the relevant documentation section.
-   - If you are not sure if something is relevant, you can expand the section by clicking **{{< fa chevron-down >}}** for more details.
+   :::
 
-7. Click **Update Linked Evidence**.
+3. Confirm that the newly linked evidence appears in the Evidence panel:
 
-   - Confirm that the newly linked-to evidence shown under Developer Evidence is accurate and is connected to the correct documentation section.
+   ::: {.panel-tabset}
+
+   #### Developer Evidence
+
+   - Verify that the evidence shown under the **Developer Evidence** tab is accurate and is connected to the correct section of the correct document.
+   - Evidence that needs your attention gets flagged with [{{< fa triangle-exclamation >}} Requires Attention]{.bubble .yellow-bg}. These sections get flagged automatically whenever a test result is above or below a certain threshold.
+
+   #### Validator Evidence
+
+   - Verify that the evidence shown under the **Validator Evidence** tab is accurate and is connected to the correct test result.
    - Evidence that needs your attention gets flagged with [{{< fa triangle-exclamation >}} Requires Attention]{.bubble .yellow-bg}. These sections get flagged automatically whenever a test result is above or below a certain threshold.
 
-### Link validator evidence
+   :::
 
-{{< include _link-validator-evidence.qmd >}}
+### b. Assess evidence
+<span id="assess-evidence"></span>
+
+Once you have linked evidence to a section of your report, assess the linked evidence for compliance:[^12]
+
+1. In any section of the report where evidence has been linked, click **Evidence Assessment** to expand the evidence assessment panel.
+
+2. Click **Add your assessment** to use the content editing toolbar[^13] to enter your assessment notes.
+
+3. (Optional) When you are finished editing your assessment notes, hover over the content block and click **{{< fa unlock >}} Lock Assessment** to prevent additional changes.
 
 ## Link artifacts to reports
 
-{{< include _link-artifacts-to-reports.qmd >}}
+After you have mapped and assessed available evidence, link artifacts to reports to provide additional context and support your assessment:
 
-## Autogenerate validation issues
+1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
+
+2. Select a record or find your record by applying a filter or searching for it.[^14]
+
+3. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select the **Latest** tab.[^15]
+
+4. Click on a Validation type file.[^16]
+
+   Expand any subsection of the validation report that you have attached evidence to, then autogenerate validation issues or manually link artifacts to your report:
+
+::: {.panel-tabset}
+
+### Autogenerate validation issues
 
 {{< include _autogenerate-validation-issues.qmd >}}
 
-## Provide compliance assessments
+### Manually link artifacts
+
+{{< include _link-artifacts-to-reports.qmd >}}
+
+:::
+
+## Assign compliance assessments
 
-{{< include _provide-compliance-assessments.qmd >}}
+{{< include _assign-compliance-assessments.qmd >}}
 
 
 <!-- FOOTNOTES -->
@@ -103,3 +167,18 @@ To link evidence logged by developers^[[{{< var validmind.developer >}}](/develo
 [^8]: [Work with document versions](/guide/documentation/work-with-document-versions.qmd)
 
 [^9]: [Preparing validation reports](/guide/validation/preparing-validation-reports.qmd#validation-overview)
+
+[^10]: Only sections with populated content blocks and/or test results are available for selection as evidence — empty sections will have their checkboxes disabled and grayed out.
+
+[^11]: To link validator evidence to a report, you must first log tests on your report with the {{< var validmind.developer >}}: **[{{< var validmind.developer >}}](/developer/validmind-library.qmd)**
+
+[^12]: [a. Map evidence](#map-evidence)
+
+[^13]: [Work with content blocks](/guide/documentation/work-with-content-blocks.qmd#content-editing-toolbar)
+
+[^14]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
+
+[^15]: [Work with document versions](/guide/documentation/work-with-document-versions.qmd)
+
+[^16]: [Preparing validation reports](/guide/validation/preparing-validation-reports.qmd#validation-overview)
+
diff --git a/site/guide/validation/customize-artifact-layouts.qmd b/site/guide/validation/customize-artifact-layouts.qmd
index 47ac87c566..150fc3e61f 100644
--- a/site/guide/validation/customize-artifact-layouts.qmd
+++ b/site/guide/validation/customize-artifact-layouts.qmd
@@ -7,6 +7,8 @@ date: last-modified
 aliases:
   - customize-model-findings-layouts.qmd
   - /guide/model-validation/customize-artifact-layouts.html
+includes:
+   artifacts: true
 ---
 
 Configure the information that displays by default on the list of all tracked artifacts for each artifact type.
@@ -66,49 +68,15 @@ Once customized, you can save a view for later application.[^7]
 
 ## Manage custom artifact views
 
-:::{.callout}
-Saved views are unique to you and do not display for other users in your organization.
-:::
-
-
-### Save artifact views
-
 You can save custom artifact configurations as a view to reapply at any time for each artifact type:
 
-1. First, customize an artifact layout.[^6]
-
-   You can also apply filters or sorting before saving your view to include them in the view.[^8]
-
-{{< include /guide/inventory/_save-layout-view.qmd >}}
-
-### Edit or remove saved artifact views
-
-::: {.callout-important}
-Deletion of saved views is permanent.
-:::
-
-::: {.panel-tabset}
-
-#### Edit or remove validation issue views
-
-To modify a saved validation issues view:
-
-1. In the left sidebar, click **{{< fa triangle-exclamation >}} Validation Issues** for a list of validation issues across all records.
-
-{{< include /guide/inventory/_remove-layout-view.qmd >}}
-
-#### Edit or remove all other artifact type views
+#### Manage personal artifact views
 
-To modify a saved view for all other artifact types:
+{{< include /guide/shared/manage-views/_personal-views.qmd >}}
 
-1. In the left sidebar, click **{{< fa border-all >}} Artifacts** for lists of other artifact types across all records, then select an artifact type[^9] for a list of that artifact type:
+#### Manage organization artifact views
 
-      - Policy Exception
-      - Limitation
-
-{{< include /guide/inventory/_remove-layout-view.qmd >}}
-
-:::
+{{< include /guide/shared/manage-views/_organization-views.qmd >}}
 
 
 <!-- FOOTNOTES -->
@@ -125,8 +93,4 @@ To modify a saved view for all other artifact types:
 
 [^6]: [Manage artifact fields](manage-artifact-fields.qmd)
 
-[^7]: [Manage custom artifact views](#manage-custom-artifact-views)
-
-[^8]: [Filter and sort artifacts](view-filter-artifacts.qmd#filter-and-sort-artifacts)
-
-[^9]: [Manage artifact types](/guide/validation/manage-artifact-types.qmd)
+[^7]: [Manage custom artifact views](#manage-custom-artifact-views)
\ No newline at end of file
diff --git a/site/guide/validation/manage-artifact-fields.qmd b/site/guide/validation/manage-artifact-fields.qmd
index dd9f290c76..8d20312dd7 100644
--- a/site/guide/validation/manage-artifact-fields.qmd
+++ b/site/guide/validation/manage-artifact-fields.qmd
@@ -99,7 +99,7 @@ To group artifact fields, first create an artifact field group:
 
 2. Under {{< fa expand >}} Artifacts,  select **Artifact Fields**.
 
-3. Click **{{< fa plus >}} Add Group** and enter in a **[name]{.smallcaps}** and a **[description]{.smallcaps}** for the group.
+3. Click **{{< fa plus >}} Add Group** and enter a **[name]{.smallcaps}** and a **[description]{.smallcaps}** for the group.
 
 4. Click **Create Group** to add the new group.
 
diff --git a/site/guide/validation/map-and-assess-evidence.qmd b/site/guide/validation/map-and-assess-evidence.qmd
index 964b05fc7e..9eb1abdd90 100644
--- a/site/guide/validation/map-and-assess-evidence.qmd
+++ b/site/guide/validation/map-and-assess-evidence.qmd
@@ -19,166 +19,18 @@ Use {{< var vm.product >}}'s AI-assisted tools to streamline your validation wor
 
 :::
 
-## How do evidence mapping and assessment work?
+{{< include _how-does-mapping-assessment-work.qmd >}}
 
-Validation reports require you to link supporting evidence to each guideline and write compliance assessments, a process that can be time-consuming when done manually across dozens of guidelines.
+::: {.callout}
+## Currently, automatic mapping and assessment retrieve only Developer Evidence from the default Development document on the record, or Validator Evidence logged on the Validation report you are mapping evidence for.[^4]
 
-Map Evidence
-: Scans all available evidence from developers and validators, then suggests which items are relevant to each guideline. Instead of searching through evidence blocks yourself, you review AI-suggested matches and approve the ones that apply. Each suggestion includes a relevance score and explanation so you can make informed decisions.
-
-Assess Evidence
-: Analyzes the linked evidence for a guideline and drafts a structured compliance assessment. The generated assessment includes a compliance conclusion, specific observations about gaps or issues, and a technical review of what the evidence demonstrates. You review and approve the draft, and then make edits if needed — saving time while maintaining control over the final content.
-
-Both features are designed to accelerate validation without replacing your judgment. You always review and approve suggestions before they become part of the report.
-
-## Map evidence to guidelines
-
-:::: {.column-margin}
-![Map Evidence panel](map-evidence-panel.png){fig-alt="Map Evidence panel showing evidence type toggles for Developer Evidence and Validator Evidence, and a Relevance Threshold slider set to 0.7." .screenshot}
-::::
-
-Map Evidence uses AI to suggest relevant evidence for each validation guideline, helping you find and link supporting documentation from both developers and validators.
-
-1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
-
-2. Select a record or find your record by applying a filter or searching for it.[^4]
-
-3. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select the **Latest** tab.[^5]
-
-4. Click on a Validation type file.[^6]
-
-5. Navigate to a section and expand the **Evidence** panel.
-
-6. Click **{{< fa wand-magic-sparkles >}} Map Evidence**.
-
-7. Configure the mapping options:
-   - Toggle **Developer Evidence** to include evidence logged via the {{< var validmind.developer >}}.
-   - Toggle **Validator Evidence** to include evidence uploaded or created by validators.
-   - Adjust the **Relevance Threshold** slider — lower values return more results while higher values show only the most relevant matches.
-
-8. Click **Map Evidence** to run the AI mapping.
-
-   The panel displays how many evidence items are available to review for each guideline in the section.
-
-### Review and approve mapped evidence
-
-After running Map Evidence, you can review and approve suggestions at three levels:
-
-::: {.panel-tabset}
-
-#### For the entire report
-
-1. Open the validation report and look at the right sidebar.
-
-2. The **Map Evidence** panel shows how many items need review across the entire report.
-
-3. Use **Approve All** to link all suggested evidence across all guidelines, or **Reject All** to dismiss all suggestions.
-
-4. To re-run mapping with different settings, click **Remap Evidence**. This lets you adjust the relevance threshold or change which evidence types to include, then generate new suggestions.
-
-#### For an entire section
-
-1. Navigate to a specific section in the validation report.
-
-2. In the section header, click **{{< fa wand-magic-sparkles >}} Map Evidence** to open the mapping panel.
-
-3. Use **Approve All** to link all suggested evidence for guidelines in that section, or **Reject All** to dismiss all section suggestions.
-
-4. To re-run mapping with different settings, click **Remap Evidence**.
-
-#### For individual guidelines
-
-1. Navigate to a specific section in the validation report.
-
-2. Expand the **Evidence** panel for a guideline.
-
-3. Click **{{< fa wand-magic-sparkles >}} Map Evidence** to open the mapping panel for that guideline.
-
-4. Review individual evidence suggestions:
-
-   - Each item shows the evidence block name and a relevance score.
-   - Click **See Relevance Analysis** to view why the evidence was suggested.
-   - Click **Approve** to link an individual item to the guideline.
-   - Click **Reject** to dismiss an individual suggestion.
-
-5. Or use **Approve All** / **Reject All** to handle all suggestions for that guideline at once.
-
-Approved evidence appears in the Evidence panel for that guideline, organized by evidence type (Developer Evidence or Validator Evidence).
+To manually add and assess evidence from other document types, refer to [Assess compliance](/guide/validation/assess-compliance.qmd).
 
 :::
 
-## Assess evidence for compliance
-
-:::: {.column-margin}
-![Assess Evidence panel](assess-evidence-panel.png){fig-alt="Assess Evidence panel showing option to identify potential risks and compliance gaps based on linked evidence." .screenshot}
-::::
-
-Assess Evidence analyzes the linked evidence and generates a structured compliance assessment, identifying potential risks and compliance gaps.
-
-1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
-
-2. Select a record or find your record by applying a filter or searching for it.[^7]
-
-3. In the left sidebar that appears for your record, click **{{< fa file >}} Documents** and select the **Latest** tab.[^8]
-
-4. Click on a Validation type file.[^9]
-
-5. Navigate to a section that has linked evidence.
-
-6. Expand the **Evidence** panel.
-
-7. Click **{{< fa wand-magic-sparkles >}} Assess Evidence**.
-
-8. The AI analyzes the linked evidence and generates an **Evidence Assessment** containing:
-
-   - **Guideline Assessment** — A compliance conclusion indicating whether the guideline requirements are fully met, partially met, or not met, with an explanation of the evidence quality.
-
-   - **Validation Observations** — Specific findings about gaps or issues in the evidence, with each observation covering a single concern and suggesting actions for developers.
-
-   - **Evidence Review** — A detailed analysis of what the evidence demonstrates, including references to specific test outputs, documentation, and any limitations.
-
-   The panel displays how many assessments are available to review.
-
-### Review and approve evidence assessments
-
-After running Assess Evidence, you can review and approve assessments at three levels:
-
-::: {.panel-tabset}
-
-#### For the entire report
-
-1. Open the validation report and look at the right sidebar.
-
-2. The **Assess Evidence** panel shows how many assessments need review across the entire report.
-
-3. Use **Approve All** to accept all generated assessments, or **Reject All** to dismiss all assessments.
-
-#### For an entire section
-
-1. Navigate to a specific section in the validation report.
-
-2. In the section header, click **{{< fa wand-magic-sparkles >}} Assess Evidence** to open the assessment panel.
-
-3. Use **Approve All** to accept all generated assessments for that section, or **Reject All** to dismiss them.
-
-4. To regenerate assessments with updated evidence, click **Re-assess Evidence**.
-
-#### For individual guidelines
-
-1. Navigate to a specific section in the validation report.
-
-2. Expand the **Evidence Assessment** panel for a guideline. Assessments pending review show a [Review]{.bubble} status.
-
-3. Review the generated assessment content.
-
-4. Click **Approve** to accept the assessment, or **Reject** to dismiss it.
-
-5. After approving, you can edit the assessment content as needed — changes are auto-saved.
-
-6. To regenerate an assessment, click **{{< fa wand-magic-sparkles >}} Reassess Evidence** to run the AI analysis again with any updated evidence.
-
-:::
+{{< include _map-evidence-to-guidelines.qmd >}}
 
+{{< include _assess-evidence-for-compliance.qmd >}}
 
 <!-- FOOTNOTES -->
 
@@ -188,14 +40,4 @@ After running Assess Evidence, you can review and approve assessments at three l
 
 [^3]: [Manage permissions](/guide/configuration/manage-permissions.qmd)
 
-[^4]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
-
-[^5]: [Work with document versions](/guide/documentation/work-with-document-versions.qmd)
-
-[^6]: [Preparing validation reports](preparing-validation-reports.qmd#validation-overview)
-
-[^7]: [Working with the inventory](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records)
-
-[^8]: [Work with document versions](/guide/documentation/work-with-document-versions.qmd)
-
-[^9]: [Preparing validation reports](preparing-validation-reports.qmd#validation-overview)
\ No newline at end of file
+[^4]: [Manage document types](/guide/templates/manage-document-types.qmd)
diff --git a/site/guide/workflows/_add-new-workflows.qmd b/site/guide/workflows/_add-new-workflows.qmd
index 5f51e45f9a..50f82770a1 100644
--- a/site/guide/workflows/_add-new-workflows.qmd
+++ b/site/guide/workflows/_add-new-workflows.qmd
@@ -20,7 +20,7 @@ d. Select the [workflow target]{.smallcaps} type to add:
 
 #### Add record workflows
 
-i. Enter in a **[title]{.smallcaps}** and a **[description]{.smallcaps}** the workflow.
+i. Enter a **[title]{.smallcaps}** and a **[description]{.smallcaps}** for the workflow.
 
 ii. Select the **[record type]{.smallcaps}**^[[Manage record types](/guide/inventory/manage-inventory-record-types.qmd)] this workflow applies to.
 
@@ -37,14 +37,14 @@ v. Click **Save Draft** to save your blank workflow, and then [configure your wo
 
 #### Add artifact workflows
 
-i. Enter in a **[title]{.smallcaps}** and a **[description]{.smallcaps}** the workflow.
+i. Enter a **[title]{.smallcaps}** and a **[description]{.smallcaps}** for the workflow.
 
 ii. Select the **[artifact type]{.smallcaps}**^[[Manage artifact types](/guide/validation/manage-artifact-types.qmd)] this workflow applies to.
 
 iii. Under **[workflow start]{.smallcaps}**, select when the workflow should be initiated:
 
 - **Manually** — Start this workflow manually.^[[Initiate workflows](/guide/workflows/manage-workflows.qmd#initiate-workflows)]
-- **On Artifact Registration** — Start this workflow when a artifact is logged on a record.[^on-artifact-registration]
+- **On Artifact Registration** — Start this workflow when an artifact is logged on a record.[^on-artifact-registration]
 - **Via Webhook** — Start this workflow when a webhook event is received.
 
 iv. Select the **[artifact type]{.smallcaps}**^[[Manage artifact types](/guide/validation/manage-artifact-types.qmd)] this workflow applies to.
@@ -97,7 +97,7 @@ d. Select the [workflow target]{.smallcaps} type to add:
 
 #### Add record workflows
 
-i.  Enter in a **[title]{.smallcaps}** and a **[description]{.smallcaps}** the workflow.
+i. Enter a **[title]{.smallcaps}** and a **[description]{.smallcaps}** for the workflow.
 
 ii. Select the [**[record type]{.smallcaps}**](/guide/inventory/manage-inventory-record-types.qmd){target="_blank"} this workflow applies to.
 
@@ -114,14 +114,14 @@ v. Click **Save Draft** to save your blank workflow, and then configure your wor
 
 #### Add artifact workflows
 
-i. Enter in a **[title]{.smallcaps}** and a **[description]{.smallcaps}** the workflow.
+i. Enter a **[title]{.smallcaps}** and a **[description]{.smallcaps}** for the workflow.
 
 ii. Select the [**[artifact type]{.smallcaps}**](/guide/validation/manage-artifact-types.qmd){target="_blank"} this workflow applies to.
 
 iii. Under **[workflow start]{.smallcaps}**, select when the workflow should be initiated:
 
 - **Manually** — Start this workflow manually.
-- **On Artifact Registration** — Start this workflow when a artifact is logged on a record.
+- **On Artifact Registration** — Start this workflow when an artifact is logged on a record.
 
 iv. Select the **[artifact type]{.smallcaps}**
 
diff --git a/site/guide/workflows/_conditional-requirements.qmd b/site/guide/workflows/_conditional-requirements.qmd
index cfac7565aa..73e8597962 100644
--- a/site/guide/workflows/_conditional-requirements.qmd
+++ b/site/guide/workflows/_conditional-requirements.qmd
@@ -8,6 +8,15 @@ Conditional requirements are required or optional for the following step types:^
 ### {{< fa cube >}} Inventory Record Stage Change [optional]{.smallercaps .pink}
 <span id="record-stage-change">
 
+1. Under **[when these conditions are met]{.smallcaps}**, set your `AND` and `OR` conditions.
+2. Add a single independent rule or a linked condition group. These rules and groups can be nested if desired:
+
+    - Click **{{< fa plus >}} Add Rule** to add an independent rule.
+    - Click **{{< fa plus-minus >}} Add Group** to add a linked group of rules that all must be true to qualify.
+
+### {{< fa tag >}} Artifact Status Change [optional]{.smallercaps .pink}
+<span id="artifact-status-change">
+
 1. Under **[when these conditions are met]{.smallcaps}**, set your `AND` and `OR` conditions.
 2. Add a single independent rule or a linked condition group. These rules and groups can be nested if desired:
 
@@ -37,7 +46,7 @@ Conditional requirements are required or optional for the following step types:^
 - (Optional) Present these requested fields to users in steps:
 
     i. Click **{{< fa plus >}} Add Step** to add a step.
-    ii. On the Add Step modal that appears, enter in the step **[title]{.smallcaps}** and provide an optional **[description]{.smallcaps}**.
+    ii. On the Add Step modal that appears, enter the step **[title]{.smallcaps}** and provide an optional **[description]{.smallcaps}**.
     iii. Click **Save** to insert the step.
     iv. Drag request fields into a step to add them to that step.
 
@@ -113,7 +122,7 @@ a. Set the **[record field]{.smallcaps}**^[[Manage inventory fields](/guide/inve
 
 b. Select a **[time delta direction]{.smallcaps}** relative to your selected field.
 
-c. Enter in a **[wait duration]{.smallcaps}** in minutes, hours, days, or months for the delta.
+c. Enter a **[wait duration]{.smallcaps}** in minutes, hours, days, or months for the delta.
 
 :::
 
@@ -125,7 +134,7 @@ c. Enter in a **[wait duration]{.smallcaps}** in minutes, hours, days, or months
 
 #### Request timeout
 
-- Enter in a request timeout in seconds under **[timeout (seconds)]{.smallcaps}**.
+- Enter a request timeout in seconds under **[timeout (seconds)]{.smallcaps}**.
 
 - Max 300 seconds, or enter `0` to disable timeout.
 
@@ -143,7 +152,7 @@ Toggle the following request options on or off:
 
 #### Request headers
 
-Enter in optional headers to include with your request:
+Enter optional headers to include with your request:
 
 1. Click **{{< fa plus >}} Add Header** under [headers]{.smallcaps} to enter a header.
 
@@ -168,6 +177,8 @@ Configure conditional requirements for the following step types:
 
 - {{< fa cube >}} Inventory Record Stage Change **[optional]{.smallercaps}**
 
+- {{< fa tag >}} Artifact Status Change **[optional]{.smallercaps}**
+
 - {{< fa arrow-pointer >}} User Action **[optional]{.smallercaps}**
 
 - {{< fa users >}} Approval **[required]{.smallercaps}**
diff --git a/site/guide/workflows/_configure-workflow-steps.qmd b/site/guide/workflows/_configure-workflow-steps.qmd
index 3b10015256..919c8d5484 100644
--- a/site/guide/workflows/_configure-workflow-steps.qmd
+++ b/site/guide/workflows/_configure-workflow-steps.qmd
@@ -29,7 +29,7 @@ Refer to [Introduction to workflows](/guide/workflows/introduction-to-workflows.
 [^on-webhook]:
 
     1. Click **{{< fa copy >}} Copy** to the right of URL to copy the webhook URL to your clipboard. This webhook URL is where you should send your `POST` request.
-    2. Under [select target record for payload]{.smallcaps}, choose a record from [your inventory](/guide/inventory/working-with-the-inventory.qmd) to populate the target for the payload.
+    2. Under [select target {record-type} record for payload]{.smallcaps}, choose a record from [your inventory](/guide/inventory/working-with-the-inventory.qmd) to populate the target for the payload.
     3. Click **{{< fa copy >}} Copy** to the right of Payload to copy the payload to include in your `POST` request to your clipboard.
     4. Click **{{< fa copy >}}** to the right of `x-api-key` and `x-api-secret` and their values to copy them to your clipboard.
     5. Send your `POST` request to the webhook URL and include these headers with your request to authenticate your call.
diff --git a/site/guide/workflows/_configure-workflows.qmd b/site/guide/workflows/_configure-workflows.qmd
index dfa2f6fee1..325ddf45fa 100644
--- a/site/guide/workflows/_configure-workflows.qmd
+++ b/site/guide/workflows/_configure-workflows.qmd
@@ -5,9 +5,9 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 :::: {.content-visible unless-format="revealjs"}
 Set up workflows to match your organizational needs. Workflows can be as simple or as complex as required, with multiple and discrete workflows supported for unique triggers and scenarios.
 
-::: {.callout}
+<!-- ::: {.callout}
 For more assistance configuring workflows, refer to our [Workflow configuration examples](/guide/workflows/workflow-configuration-examples.qmd).
-:::
+::: -->
 
 ::::
 
diff --git a/site/guide/workflows/_review-workflow-history.qmd b/site/guide/workflows/_review-workflow-history.qmd
index 4fe3dbf903..cf1e0e979a 100644
--- a/site/guide/workflows/_review-workflow-history.qmd
+++ b/site/guide/workflows/_review-workflow-history.qmd
@@ -3,7 +3,7 @@ Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 :::: {.content-visible unless-format="revealjs"}
-Review timelines of workflows running or previously run:
+Review timelines of workflows running or previously run on a specific record or artifact:[^view-all-workflows]
 
 ::: {.panel-tabset}
 
@@ -94,6 +94,10 @@ If workflows are running or have previously run on your artifact, you can:
     - Active
     - Scheduled
 
+[^view-all-workflows]:
+
+    To monitor workflows across your whole organization on a single timeline, refer to: [View all workflow executions](/guide/workflows/working-with-workflows.qmd#view-all-workflow-executions).
+
 ::::
 
 
diff --git a/site/guide/workflows/_view-workflow-executions.qmd b/site/guide/workflows/_view-workflow-executions.qmd
new file mode 100644
index 0000000000..bb7381c58d
--- /dev/null
+++ b/site/guide/workflows/_view-workflow-executions.qmd
@@ -0,0 +1,148 @@
+<!-- Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+Refer to the LICENSE file in the root of this repository for details.
+SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
+
+:::: {.content-visible unless-format="revealjs"}
+Monitor every workflow execution across your organization on a single timeline:^[To view workflows from within a record or artifact, refer to: [Manage workflows](/guide/workflows/manage-workflows.qmd#review-workflows)]
+
+1. In the left sidebar, click **{{< fa arrow-right-arrow-left >}} Workflows**.
+
+2. Under the [record type]{.smallcaps} drop-down, select the type of record you want to view all workflow executions for:^[[Manage inventory record types](/guide/inventory/manage-inventory-record-types.qmd)]
+
+    - In the left column, workflows are grouped by inventory record.
+    - Workflows past their [expected end date]{.smallcaps} are color-coded in [red]{.red}.^[[Manage workflows](/guide/workflows/manage-workflows.qmd#edit-workflow-end-dates)]
+    - Use the buttons or keyboard shortcuts[^timeline-shortcuts-all] to control the timeline:
+      - **{{< fa magnifying-glass-plus >}}** — Zoom in
+      - **{{< fa magnifying-glass-minus >}}** — Zoom out
+      - **{{< fa arrow-left >}}** — Move earlier to the left
+      - **{{< fa calendar-days >}} Go to Today** — Focus on today
+      - **{{< fa arrow-right >}}** — Move later to the right
+    - **{{< fa magnifying-glass >}} Search** — Search for records using keywords in the record name.
+    - **{{< fa filter >}} Filter** — Filter the view to display only runs from specific types and statuses of workflows.[^filter-criteria]
+
+<br>
+
+::: {.callout-button .pl4 .nt4}
+::: {.callout collapse="true" appearance="minimal"}
+#### How do I create effective filters?
+
+{{< include /guide/shared/_work-with-filters.qmd >}}
+:::
+:::
+
+3. Click on any listed workflow to review the details of that specific workflow:
+
+    - **Details** — Name and description (if present) of the workflow, the workflow's status and progress (if applicable), when it was created, and when it was started.
+    - **Activity** — History of updates to the workflow on that record, including notes submitted during transitions.[^activity-notes]
+    - **Artifacts** [record workflows only]{.smallercaps .pink} — Artifacts for that record created within the duration of that workflow's runtime.
+    - **Workflow**^[Hover over a workflow step to view an animation of the steps connecting to and from that step.] — Overview of the entire workflow. The current workflow step is highlighted on this view.
+
+[^timeline-shortcuts-all]:
+
+    ::: {.callout title="Timeline control shortcuts"}
+
+    - **Move timeline left or right** — <br>
+        - Click and drag
+        - OR <kbd>Shift</kbd> + scroll wheel
+    - **Slow zoom in or out** — <br><kbd>Alt</kbd> + scroll wheel
+    - **Quick zoom in or out** — <br><kbd>Ctrl</kbd> + scroll wheel
+    :::
+
+[^filter-criteria]:
+
+    a. Filter by Inventory criteria. To learn more, expand **How do I create effective filters?**
+    b. Filter by Workflow criteria:
+        - By **Workflow Type**:
+            - Record
+            - Artifact
+        - By **Workflow Status**:
+            - Finished
+            - Active
+            - Scheduled
+
+[^activity-notes]:
+
+    Click **{{< fa chevron-down >}}** to reveal notes, and **{{< fa chevron-up >}}** to hide them.
+    <br><br>
+    [Transition workflows](/guide/workflows/transition-workflows.qmd)
+
+::::
+
+
+:::: {.content-hidden unless-format="revealjs"}
+Monitor every workflow execution across your organization on a single timeline:
+
+1. In the left sidebar, click **{{< fa arrow-right-arrow-left >}} Workflows**.
+
+2. Under the [record type]{.smallcaps} drop-down, select the type of record you want to view all workflow executions for:
+
+    - In the left column, workflows are grouped by inventory record.
+    - Workflows past their [expected end date]{.smallcaps} are color-coded in [red]{.red}.
+
+::: {.panel-tabset}
+
+#### Control the timeline
+
+Use the buttons or keyboard shortcuts to control the timeline:
+
+::::: {.columns}
+
+:::: {.column width="50%"}
+
+- **{{< fa magnifying-glass-plus >}}** — Zoom in
+- **{{< fa magnifying-glass-minus >}}** — Zoom out
+- **{{< fa arrow-left >}}** — Move earlier to the left
+- **{{< fa calendar-days >}} Go to Today** — Focus on today
+- **{{< fa arrow-right >}}** — Move later to the right
+
+::::
+
+:::: {.column width="50%"}
+
+::: {.pa3 .f7 .embed}
+- **Move timeline left or right** —
+    - Click and drag
+    - OR <kbd>Shift</kbd> + scroll wheel
+- **Slow zoom in or out** — <br><kbd>Alt</kbd> + scroll wheel
+- **Quick zoom in or out** — <br><kbd>Ctrl</kbd> + scroll wheel
+
+:::
+
+::::
+
+:::::
+
+#### Search the timeline
+
+**{{< fa magnifying-glass >}} Search** — Search for records using keywords in the record name.
+
+#### Filter the timeline
+
+**{{< fa filter >}} Filter** — Filter the view to display only runs from specific types and statuses of workflows.
+
+:::
+
+3. Click on any listed workflow to review the details of that specific workflow:
+
+::: {.panel-tabset}
+
+#### Details
+
+Name and description (if present) of the workflow, the workflow's status and progress (if applicable), when it was created, and when it was started.
+
+#### Activity
+
+History of updates to the workflow on that record, including notes submitted during transitions.
+
+#### Artifacts
+
+[record workflows only]{.smallercaps .pink} Artifacts for that record created within the duration of that workflow's runtime.
+
+#### Workflow
+
+Overview of the entire workflow. The current workflow step is highlighted on this view.
+
+:::
+
+
+::::
diff --git a/site/guide/workflows/_workflow-states.qmd b/site/guide/workflows/_workflow-states.qmd
index aba2c05568..1604c17eaf 100644
--- a/site/guide/workflows/_workflow-states.qmd
+++ b/site/guide/workflows/_workflow-states.qmd
@@ -5,7 +5,7 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 :::: {.content-visible unless-format="revealjs"}
 ### Add workflow states
 
-Add workflow states by either while configuring a **{{< fa wifi >}} Workflow State Change** step,^[[Configure workflow steps](/guide/workflows/configure-workflows.qmd#configure-workflow-steps)] or via the **{{< fa gear >}} Settings** page:
+Add workflow states either while configuring a **{{< fa wifi >}} Workflow State Change** step,^[[Configure workflow steps](/guide/workflows/configure-workflows.qmd#configure-workflow-steps)] or via the **{{< fa gear >}} Settings** page:
 
 1. In the left sidebar, click **{{< fa gear >}} Settings**.
 
@@ -20,7 +20,7 @@ Add workflow states by either while configuring a **{{< fa wifi >}} Workflow Sta
 
 1. Click **{{< fa plus >}} Add Workflow State**.
 
-1. Enter in a **[name]{.smallcaps}** and a **[description]{.smallcaps}**, then select a **[color]{.smallcaps}** for your workflow state.
+1. Enter a **[name]{.smallcaps}** and a **[description]{.smallcaps}**, then select a **[color]{.smallcaps}** for your workflow state.
 
 1. Click **Save** to create the workflow state.
 
@@ -74,6 +74,6 @@ If a state is or was previously in use  on a workflow within a {{< fa wifi >}} W
 :::: {.content-hidden unless-format="revealjs"}
 Workflow states are statuses unique to a specific workflow, discrete from record stages.
 
-Add workflow states by either while configuring a **{{< fa wifi >}} Workflow State Change** step, or [via the **{{< fa gear >}} Settings** page](/guide/workflows/workflow-states.qmd){target="blank"}.
+Add workflow states either while configuring a **{{< fa wifi >}} Workflow State Change** step, or [via the **{{< fa gear >}} Settings** page](/guide/workflows/workflow-states.qmd){target="_blank"}.
 
 ::::
\ No newline at end of file
diff --git a/site/guide/workflows/_workflow-step-types.qmd b/site/guide/workflows/_workflow-step-types.qmd
index ce8371c606..dd5cffe0f8 100644
--- a/site/guide/workflows/_workflow-step-types.qmd
+++ b/site/guide/workflows/_workflow-step-types.qmd
@@ -16,6 +16,18 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 | [set inventory record stage to]{.smallcaps} | Select the record stage to transition to. |
 : **{{< fa cube >}} Inventory Record Stage Change** step configuration {.hover tbl-colwidths="[40,60]"}
 
+### {{< fa tag >}} Artifact Status Change
+<span id="artifact-status-change">
+
+- Transitions an artifact into another status.
+- Requires available artifact type statuses associated with the workflow.^[[Manage artifact types](/guide/validation/manage-artifact-types.qmd#manage-artifact-type-statuses)]
+
+| Field | Description |
+|---:|---|
+| [when these conditions are met]{.smallcaps} (optional) | Add conditional requirements to qualify for this step.^[[Conditional step requirements](/guide/workflows/conditional-step-requirements.qmd#artifact-status-change)]  |
+| [set artifact status to]{.smallcaps} | Select the artifact type status to transition to. |
+: **{{< fa tag >}} Artifact Status Change** step configuration {.hover tbl-colwidths="[40,60]"}
+
 ### {{< fa wifi >}} Workflow State Change
 <span id="workflow-state-change">
 
@@ -35,6 +47,7 @@ Creates a button that performs an action on behalf of the user.
 | Field | Description |
 |---:|---|
 | [display action button when]{.smallcaps}  (optional) | Add conditional requirements for displaying this step.^[[Conditional step requirements](/guide/workflows/conditional-step-requirements.qmd#user-action)]  |
+| [step title]{.smallcaps} (optional) | Text that displays at the top of the modal that opens when users click the action button. |
 | [action button label]{.smallcaps} | Text that displays on your action button. |
 | [requested fields]{.smallcaps} (optional) | Include record or artifact fields alongside your action.[^user-action] |
 | [user action deadline]{.smallcaps} (optional) | Include a deadline for when users should complete this action by.^[Toggle **Enable deadline** on to configure a deadline.] |
@@ -52,7 +65,7 @@ Display a preconfigured message to users in the selected **[approval group]{.sma
 |---:|---|
 | [approval group]{.smallcaps}  | Select the roles, stakeholders, or user fields responsible for approval. |
 | [fields to review]{.smallcaps} (optional) | Select the record or artifact fields shown to approvers for read-only review.[^approval-2] |
-| Approval Message | When your workflow reaches this {{< fa users >}} Approval step, the selected [approval group]{.smallcaps} is shown this message.^[Enter in a **[title]{.smallcaps}** and a **[message]{.smallcaps}** to display.] |
+| Approval Message | When your workflow reaches this {{< fa users >}} Approval step, the selected [approval group]{.smallcaps} is shown this message.^[Enter a **[title]{.smallcaps}** and a **[message]{.smallcaps}** to display.] |
 : **{{< fa users >}} Approval** step configuration {.hover tbl-colwidths="[35,65]"}
 
 ### {{< fa bullhorn >}} Broadcast
@@ -81,7 +94,7 @@ Workflows cannot be saved until condition branches are connected to other steps.
 To configure a condition branch:
 
 1. On the Configure Condition Branch modal, click **{{< fa plus >}} Add Branch**.
-2. Enter in the **[path name]{.smallcaps}** and designate the **[conditions]{.smallcaps}**^[[Conditional step requirements](/guide/workflows/conditional-step-requirements.qmd#condition-branch-required)] that apply to this path.
+2. Enter the **[path name]{.smallcaps}** and designate the **[conditions]{.smallcaps}**^[[Conditional step requirements](/guide/workflows/conditional-step-requirements.qmd#condition-branch-required)] that apply to this path.
 3. Continue with steps 1 and 2 until your conditional branch logic is complete.
 
     To remove a path, click **{{< fa ellipsis-vertical >}}** and select **{{< fa trash-can >}} Remove Path**.
@@ -130,7 +143,7 @@ When a workflow reaches a webhook step, the workflow will pause. Listen for a `P
 
 #### 2. Configure and copy payload
 
-1. Under [select target record for payload]{.smallcaps}, choose a record from your inventory^[[Working with the inventory](/guide/inventory/working-with-the-inventory.qmd)] to populate the target for the payload.
+1. Under [select target {record-type} record for payload]{.smallcaps}, choose a record from your inventory^[[Working with the inventory](/guide/inventory/working-with-the-inventory.qmd)] to populate the target for the payload.
 
 2. Click **{{< fa copy >}} Copy** to the right of Payload to copy the payload to your clipboard.
 
@@ -153,9 +166,9 @@ Sends a HTTP request with optional additional conditions.^[[Conditional step req
 
 | Field | Description |
 |---:|---|
-| [url]{.smallcaps} | Enter in the URL to send the HTTP request to. |
+| [url]{.smallcaps} | Enter the URL to send the HTTP request to. |
 | [method]{.smallcaps} | Select the HTTP request method: `GET`, `POST`, `PUT`, `DELETE`[^request-types] |
-| [timeout (seconds)]{.smallcaps} | Enter in a request timeout in seconds.[^request-timeout] |
+| [timeout (seconds)]{.smallcaps} | Enter a request timeout in seconds.[^request-timeout] |
 | [fail on non-]{.smallcaps}[2]{.smallercaps}[xx]{.smallcaps}  (optional) | Toggle whether or not the request will be considered failed if the response status code is not in the `2xx` range. |
 | [allow invalid certificates]{.smallcaps} (optional) | Toggle whether or not the request will be allowed to use invalid certificates. |
 | [follow redirects]{.smallcaps} (optional) | Toggle whether or not the request will follow redirects. |
@@ -174,7 +187,7 @@ Sends a HTTP request with optional additional conditions.^[[Conditional step req
 
 [^user-action]:
 
-    Select from the drop-down to add it to your User Action step. Users must have write permissions for the field in order to enter values.
+    Select a field from the drop-down to add it to your User Action step — click **Add All** to add all fields in that group. Users must have write permissions for the field in order to enter values.
     <br><br>
 
     - [Manage inventory fields](/guide/inventory/manage-inventory-fields.qmd)
@@ -205,7 +218,7 @@ Sends a HTTP request with optional additional conditions.^[[Conditional step req
 [^request-types]: `PUT` and `POST` requests have additional configuration fields:
 
     - **[body type]{.smallcaps}** — Select whether the body is `JSON` or `Text`.
-    - **[body]{.smallcaps}** — Enter in your payload.
+    - **[body]{.smallcaps}** — Enter your payload.
 
 [^request-timeout]: Max 300 seconds, or enter `0` to disable timeout.
 
@@ -226,8 +239,13 @@ Sends a HTTP request with optional additional conditions.^[[Conditional step req
 :::: {.content-hidden unless-format="revealjs"}
 
 #### {{< fa cube >}} Inventory Record Stage Change
+
 Transitions a record into another stage.
 
+#### {{< fa tag >}} Artifact Status Change
+
+Transitions an artifact into another status.
+
 #### {{< fa wifi >}} Workflow State Change
 
 Transitions the workflow into another workflow state.
diff --git a/site/guide/workflows/configure-workflows.qmd b/site/guide/workflows/configure-workflows.qmd
index 30f1aef081..6ef4eb217b 100644
--- a/site/guide/workflows/configure-workflows.qmd
+++ b/site/guide/workflows/configure-workflows.qmd
@@ -120,7 +120,7 @@ a. Make your desired changes to step configuration[^9] and step relationships[^1
 
 b. When you are finished, click **Save New Version** to apply your changes.
 
-c. Enter in your **[version notes]{.smallcaps}** to describe your changes.
+c. Enter your **[version notes]{.smallcaps}** to describe your changes.
 
 
 ### Delete workflow steps
diff --git a/site/guide/workflows/manage-workflows.qmd b/site/guide/workflows/manage-workflows.qmd
index f1c91bd77b..026d027a1c 100644
--- a/site/guide/workflows/manage-workflows.qmd
+++ b/site/guide/workflows/manage-workflows.qmd
@@ -8,7 +8,7 @@ aliases:
   - /guide/model-workflows/manage-model-workflows.html
 ---
 
-Review workflows associated with your records or artifacts, and initiate or abort workflows configured for your organization on your records or artifacts.
+Review and manage workflows associated with a specific record or artifact, and initiate or abort workflows configured for your organization on that record or artifact.
 
 ::: {.attn}
 
@@ -97,7 +97,7 @@ To adjust the expected end date for a workflow:
 
 5. On the workflow's detail modal, click on the **{{< fa ellipsis-vertical >}}** in the top-right hand corner and select **{{< fa calendar >}} Edit Expected End Date**.
 
-6. Enter in the new [expected end date]{.smallcaps} for the workflow.
+6. Enter the new [expected end date]{.smallcaps} for the workflow.
 
 7. Click **Save Expected End Date** to apply the new date.
 
@@ -109,7 +109,7 @@ To adjust the expected end date for a workflow:
 
 3. On the workflow's detail modal, click on the **{{< fa ellipsis-vertical >}}** in the top-right hand corner and select **{{< fa calendar >}} Edit Expected End Date**.
 
-4. Enter in the new [expected end date]{.smallcaps} for the workflow.
+4. Enter the new [expected end date]{.smallcaps} for the workflow.
 
 5. Click **Save Expected End Date** to apply the new date.
 
diff --git a/site/guide/workflows/setting-up-workflows.qmd b/site/guide/workflows/setting-up-workflows.qmd
index 60ab40641a..6b5d25cdc4 100644
--- a/site/guide/workflows/setting-up-workflows.qmd
+++ b/site/guide/workflows/setting-up-workflows.qmd
@@ -7,17 +7,19 @@ date: last-modified
 listing:
   - id: workflow-setup
     type: grid
+    grid-columns: 2
     max-description-length: 250
     sort: false
     fields: [title, description]
     contents:
     - manage-record-stages.qmd
     - configure-workflows.qmd
-    - workflow-configuration-examples.qmd
+    # - workflow-configuration-examples.qmd
 aliases:
   - /guide/model-workflows/setting-up-model-workflows.html
 includes:
-  workflows: true
+  workflow:
+    setup: true
 ---
 
 {{< include /guide/workflows/_set-up-workflows.qmd >}}
diff --git a/site/guide/workflows/workflow-configuration-examples.qmd b/site/guide/workflows/workflow-configuration-examples.qmd
index 0a3b41f12e..770d0c5128 100644
--- a/site/guide/workflows/workflow-configuration-examples.qmd
+++ b/site/guide/workflows/workflow-configuration-examples.qmd
@@ -4,6 +4,7 @@
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
 title: "Workflow configuration examples"
 date: last-modified
+search: false
 ---
 
 Learn from example workflow configurations to help you tailor workflows to fit your organization's requirements for managing risk throughout your entire risk management lifecycles.
@@ -43,7 +44,7 @@ This workflow is initiated manually[^4] — in this case via {{< fa arrow-right-
 
 This workflow is initiated when a field is populated — in this case, when the model is slated for deployment by entering value into the [deployment scheduled]{.smallcaps} date time field.[^8]
 
-- The workflow will wait until the timestamp indicated in the scheduled deployment date before revealing the next available action in the workflow — in this case, the option to deploy the model and enter in a concrete date the model was initially pushed to production.
+- The workflow will wait until the timestamp indicated in the scheduled deployment date before revealing the next available action in the workflow — in this case, the option to deploy the model and enter a concrete date the model was initially pushed to production.
 - After a model is deployed via this workflow, an email notification is sent to users notifying them of the completed implementation.
 - Actions on this workflow are linked both to a transition in model stage,[^9] as well as workflow state.[^10]
 
diff --git a/site/guide/workflows/workflow-step-types.qmd b/site/guide/workflows/workflow-step-types.qmd
index c5d00cbe87..bbb94b92a7 100644
--- a/site/guide/workflows/workflow-step-types.qmd
+++ b/site/guide/workflows/workflow-step-types.qmd
@@ -8,10 +8,11 @@ date: last-modified
 
 Select from a variety of workflow step types to build workflows from.
 
+<!--
 ::: {.callout title="Need more help configuring workflow step types?"}
 
 - [Workflow configuration examples](workflow-configuration-examples.qmd#workflow-step-type-examples)
 - [Integrations examples](/guide/integrations/integrations-examples.qmd)
-:::
+::: -->
 
 {{< include /guide/workflows/_workflow-step-types.qmd >}}
diff --git a/site/guide/workflows/working-with-workflows.qmd b/site/guide/workflows/working-with-workflows.qmd
index 8174e9e960..b98a909e97 100644
--- a/site/guide/workflows/working-with-workflows.qmd
+++ b/site/guide/workflows/working-with-workflows.qmd
@@ -18,9 +18,48 @@ listing:
 aliases:
   - /guide/working-with-model-workflows.html
   - /guide/model-workflows/working-with-model-workflows.html
+includes:
+  workflow:
+    view: true
 ---
 
 Once customized, use workflows to transition your records into their appropriate next stages throughout your risk management lifecycles.
 
+::: {.attn}
+
+## Prerequisites
+
+- [x] {{< var link.login >}}
+- [x] Workflows have already been set up for use with your records or artifacts.[^1]
+- [x] You are assigned a role with sufficient permissions to view workflows.[^2]
+
+:::
+
+## View all workflow executions
+
+{{< include /guide/workflows/_view-workflow-executions.qmd >}}
+
+### Manage workflow timeline views
+
+Save searches and filters applied to the workflow timeline as a view to reapply at any time:
+
+#### Manage personal timeline views
+
+{{< include /guide/shared/manage-views/_personal-views.qmd >}}
+
+#### Manage organization timeline views
+
+{{< include /guide/shared/manage-views/_organization-views.qmd >}}
+
+
+## Work with workflows
+
 :::{#workflows}
-:::
\ No newline at end of file
+:::
+
+
+<!-- FOOTNOTES -->
+
+[^1]: [Configure workflows](configure-workflows.qmd)
+
+[^2]: [Manage permissions](/guide/configuration/manage-permissions.qmd)
\ No newline at end of file
diff --git a/site/index.qmd b/site/index.qmd
index ac83bb25e9..711d89c7f1 100644
--- a/site/index.qmd
+++ b/site/index.qmd
@@ -530,7 +530,7 @@ Use [cases]{.pink}
 
 ::: {.f4 .blur}
 <!-- <span class="blur"> -->
-{{< var vm.product >}} gives you the tools for effective [AI governance]{.pink .b} and [model risk management]{.pink .b}, whether you are working toward EU AI Act compliance or managing model risk under SR 11-7, SS1/23, or E-23.
+{{< var vm.product >}} gives you the tools for effective [AI governance]{.pink .b} and [model risk management]{.pink .b}, whether you are working toward EU AI Act compliance or managing model risk under SR 26-2, SS1/23, or E-23.
 <!-- </span> -->
 
 :::
diff --git a/site/llm/.quarto/project-cache/deno-kv-file b/site/llm/.quarto/project-cache/deno-kv-file
new file mode 100644
index 0000000000..4e86411b58
Binary files /dev/null and b/site/llm/.quarto/project-cache/deno-kv-file differ
diff --git a/site/llm/.quarto/project-cache/deno-kv-file-shm b/site/llm/.quarto/project-cache/deno-kv-file-shm
new file mode 100644
index 0000000000..c2c3593c0f
Binary files /dev/null and b/site/llm/.quarto/project-cache/deno-kv-file-shm differ
diff --git a/site/llm/.quarto/project-cache/deno-kv-file-wal b/site/llm/.quarto/project-cache/deno-kv-file-wal
new file mode 100644
index 0000000000..f7c8b9ab86
Binary files /dev/null and b/site/llm/.quarto/project-cache/deno-kv-file-wal differ
diff --git a/site/llm/README.md b/site/llm/README.md
new file mode 100644
index 0000000000..91bd82bd9c
--- /dev/null
+++ b/site/llm/README.md
@@ -0,0 +1,54 @@
+# LLM corpus (markdown for RAG)
+
+This directory holds tooling that renders the documentation site to plain Markdown for ingestion into LanceDB and the in-app assistant (Valerie).
+
+## Output
+
+Rendered files land in `site/llm/_llm-output/` (gitignored). CI publishes that directory after `make render-llm`. Deployed environments only pick up new assistant context after the LanceDB artifact is rebuilt from a fresh render.
+
+## Render locally
+
+From `site/`:
+
+```bash
+make render-llm
+```
+
+This runs `llm/render.sh` (temporary minimal `_quarto.yml`, Quarto → GFM) and `llm/clean.sh` (Pandoc cleanup). It is equivalent to the **Validate LLM markdown render** step in `.github/workflows/validate-docs-site.yaml`.
+
+Excluded from the LLM render (among others): notebooks, internal pages, contributor style guide, and most of `about/contributing/`. **Included:** `about/using-the-documentation.qmd` (docs IA hub for agents).
+
+Copied into `_llm-output/` after render:
+
+| File | Source |
+|------|--------|
+| `AGENTS.md` | Repo root |
+| `chatbot-product-map.md` | Generated (see below) |
+| `about/using-the-documentation.md` | Quarto render |
+
+See also [`AGENTS.md`](../../AGENTS.md) for how agents should use the corpus.
+
+## Chatbot product map
+
+Valerie needs routes in the product UI (especially **Settings**) mapped to documentation URLs. Human docs sidebars are organized by topic (Configuration, Workflows, Inventory); the product groups features differently.
+
+| Artifact | Purpose |
+|----------|---------|
+| `chatbot-product-map-frontend-snapshot.json` | Vendored extract from `validmind/frontend` (Settings tree, sidebar nav, `helpLink` / docs URLs) |
+| `chatbot-product-map.md` | Retrieval-oriented map: routes → primary/related docs + section headings from `.qmd` |
+
+### Why a frontend snapshot?
+
+CI does **not** check out `validmind/frontend` (private repo; cross-repo PAT scope). The snapshot is committed in this repo so pipelines can regenerate the map without frontend access. It may lag the live product until someone refreshes it locally.
+
+### Maintenance
+
+| Change | Command (from `site/`) |
+|--------|-------------------------|
+| Docs only (new `.qmd`, heading updates) | `make generate-chatbot-product-map` |
+| Product routes or in-app help links | `make refresh-chatbot-product-map` (requires a sibling `../frontend` checkout) |
+
+Commit both `chatbot-product-map.md` and `chatbot-product-map-frontend-snapshot.json` when the snapshot changes. CI fails if either file is out of date after regeneration.
+
+Generator: `site/scripts/generate_chatbot_product_map.py`  
+Tests: `python3 -m unittest discover -s site/scripts -p 'test_generate_chatbot_product_map.py' -v` (from repo root).
diff --git a/site/llm/_quarto.yml b/site/llm/_quarto.yml
index fecfcafdef..b9322acf09 100644
--- a/site/llm/_quarto.yml
+++ b/site/llm/_quarto.yml
@@ -12,7 +12,8 @@ project:
     - "../**/*.qmd"
     - "!../notebooks/"
     - "!../404.qmd"
-    - "!../about/contributing/"
+    - "!../about/contributing/validmind-community.qmd"
+    - "!../about/contributing/style-guide/"
     - "!../about/deployment/"
     - "!../about/fine-print/"
     - "!../_site/"
diff --git a/site/llm/chatbot-product-map-frontend-snapshot.json b/site/llm/chatbot-product-map-frontend-snapshot.json
new file mode 100644
index 0000000000..4ee66823a6
--- /dev/null
+++ b/site/llm/chatbot-product-map-frontend-snapshot.json
@@ -0,0 +1,365 @@
+{
+  "version": 1,
+  "generated_at": "2026-05-23T01:45:21.129000+00:00",
+  "settings": [
+    {
+      "path": "/settings/profile",
+      "label": "Profile",
+      "group": "Your Account",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/theme-customization",
+      "label": "Theme Customization",
+      "group": "Your Account",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/organization",
+      "label": "Organization",
+      "group": "Organization",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/authentication",
+      "label": "Authentication",
+      "group": "Organization",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/email-notifications",
+      "label": "Email Notifications",
+      "group": "Organization",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/user-directory",
+      "label": "User Directory",
+      "group": "Users & Access",
+      "primary_docs": [
+        {
+          "path": "/guide/configuration/managing-users.html",
+          "anchor": null
+        }
+      ]
+    },
+    {
+      "path": "/settings/invitation",
+      "label": "Invite New Users",
+      "group": "Users & Access",
+      "primary_docs": [
+        {
+          "path": "/guide/configuration/managing-users.html",
+          "anchor": null
+        }
+      ]
+    },
+    {
+      "path": "/settings/roles",
+      "label": "Roles",
+      "group": "Users & Access",
+      "primary_docs": [
+        {
+          "path": "/guide/configuration/managing-users.html",
+          "anchor": null
+        }
+      ]
+    },
+    {
+      "path": "/settings/permissions",
+      "label": "Permissions",
+      "group": "Users & Access",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/groups",
+      "label": "Groups",
+      "group": "Users & Access",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/integrations/connections",
+      "label": "Connections",
+      "group": "Integrations",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/integrations/secrets",
+      "label": "Secrets",
+      "group": "Integrations",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/integrations/data-exports",
+      "label": "Analytics Exports",
+      "group": "Integrations",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/finding-types",
+      "label": "Artifact Types",
+      "group": "Artifacts",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/finding-severities",
+      "label": "Artifact Severities",
+      "group": "Artifacts",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/finding-custom-fields",
+      "label": "Artifact Fields",
+      "group": "Artifacts",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/regulations",
+      "label": "Regulations & Policies",
+      "group": "Governance",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/risk-areas",
+      "label": "Risk Areas & Validation Guidelines",
+      "group": "Governance",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/workflows",
+      "label": "Workflows",
+      "group": "Governance",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/workflow-states",
+      "label": "Workflow States",
+      "group": "Governance",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/attestation-templates",
+      "label": "Attestation Templates",
+      "group": "Governance",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/document-types",
+      "label": "Document Types",
+      "group": "Documents",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/templates",
+      "label": "Templates",
+      "group": "Documents",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings/block-library",
+      "label": "Block Library",
+      "group": "Documents",
+      "primary_docs": []
+    }
+  ],
+  "nav": [
+    {
+      "path": "/dashboard",
+      "label": "Dashboard",
+      "group": "Main navigation",
+      "primary_docs": []
+    },
+    {
+      "path": "/validation-issues",
+      "label": "Validation Issues",
+      "group": "Main navigation",
+      "primary_docs": []
+    },
+    {
+      "path": "/attestations",
+      "label": "Attestations",
+      "group": "Main navigation",
+      "primary_docs": []
+    },
+    {
+      "path": "/artifacts",
+      "label": "Artifacts",
+      "group": "Main navigation",
+      "primary_docs": []
+    },
+    {
+      "path": "/workflows",
+      "label": "Workflows",
+      "group": "Main navigation",
+      "primary_docs": []
+    },
+    {
+      "path": "/analytics",
+      "label": "sidebar.analytics",
+      "group": "Main navigation",
+      "primary_docs": []
+    },
+    {
+      "path": "/settings",
+      "label": "Settings",
+      "group": "Main navigation",
+      "primary_docs": []
+    }
+  ],
+  "file_links": {
+    "/settings": [
+      {
+        "path": "/guide/configuration/managing-users.html",
+        "anchor": null
+      }
+    ],
+    "/settings/attestations": [
+      {
+        "path": "/guide/attestation/manage-attestations.html",
+        "anchor": null
+      },
+      {
+        "path": "/guide/shared/work-with-filters.html",
+        "anchor": null
+      }
+    ],
+    "/settings/authentication": [
+      {
+        "path": "/installation/security/configure-single-sign-on-sso.html",
+        "anchor": null
+      }
+    ],
+    "/settings/block-library": [
+      {
+        "path": "/guide/templates/manage-text-block-library.html",
+        "anchor": null
+      }
+    ],
+    "/settings/custom-fields": [
+      {
+        "path": "/guide/model-inventory/manage-model-inventory-fields.html",
+        "anchor": null
+      }
+    ],
+    "/settings/document-types": [
+      {
+        "path": "/guide/templates/manage-document-types.html",
+        "anchor": null
+      }
+    ],
+    "/settings/email-notifications": [
+      {
+        "path": "/guide/configuration/manage-platform-notifications.html",
+        "anchor": "customize-email-notifications"
+      }
+    ],
+    "/settings/finding-custom-fields": [
+      {
+        "path": "/guide/model-validation/manage-model-finding-fields.html",
+        "anchor": null
+      }
+    ],
+    "/settings/finding-severities": [
+      {
+        "path": "/guide/model-validation/manage-artifact-severities.html",
+        "anchor": null
+      }
+    ],
+    "/settings/finding-types": [
+      {
+        "path": "/guide/model-validation/manage-artifact-types.html",
+        "anchor": null
+      }
+    ],
+    "/settings/groups": [
+      {
+        "path": "/guide/configuration/manage-groups.html",
+        "anchor": null
+      }
+    ],
+    "/settings/invitation": [
+      {
+        "path": "/guide/configuration/manage-users.html",
+        "anchor": "manage-user-invitations"
+      }
+    ],
+    "/settings/organization": [
+      {
+        "path": "/guide/configuration/managing-your-organization.html",
+        "anchor": null
+      }
+    ],
+    "/settings/permissions": [
+      {
+        "path": "/guide/configuration/manage-permissions.html",
+        "anchor": null
+      }
+    ],
+    "/settings/primary-record-type-stages": [
+      {
+        "path": "/guide/workflows/manage-model-stages.html",
+        "anchor": null
+      }
+    ],
+    "/settings/profile": [
+      {
+        "path": "/guide/configuration/view-your-profile.html",
+        "anchor": null
+      }
+    ],
+    "/settings/regulation-policy": [
+      {
+        "path": "/guide/templates/customize-virtual-document-validator.html",
+        "anchor": "add-or-edit-assessment-questions"
+      }
+    ],
+    "/settings/risk-areas": [
+      {
+        "path": "/guide/model-validation/manage-validation-guidelines.html",
+        "anchor": null
+      }
+    ],
+    "/settings/roles": [
+      {
+        "path": "/guide/configuration/manage-roles.html",
+        "anchor": null
+      }
+    ],
+    "/settings/stakeholders": [
+      {
+        "path": "/guide/configuration/manage-model-stakeholder-types.html",
+        "anchor": null
+      }
+    ],
+    "/settings/statuses": [
+      {
+        "path": "/guide/workflows/manage-model-stages.html",
+        "anchor": null
+      }
+    ],
+    "/settings/templates": [
+      {
+        "path": "/guide/templates/customize-document-templates.html",
+        "anchor": null
+      }
+    ],
+    "/settings/user-directory": [
+      {
+        "path": "/guide/configuration/manage-users.html",
+        "anchor": null
+      }
+    ],
+    "/settings/workflow-states": [
+      {
+        "path": "/guide/workflows/workflow-states.html",
+        "anchor": null
+      }
+    ],
+    "/settings/workflows": [
+      {
+        "path": "/guide/workflows/setting-up-workflows.html",
+        "anchor": null
+      }
+    ]
+  }
+}
diff --git a/site/llm/chatbot-product-map.md b/site/llm/chatbot-product-map.md
new file mode 100644
index 0000000000..c2abf3e499
--- /dev/null
+++ b/site/llm/chatbot-product-map.md
@@ -0,0 +1,580 @@
+# ValidMind product-to-documentation map
+
+> Auto-generated. Maps in-product routes to documentation URLs and key sections.
+> For how documentation is organized by topic, see `AGENTS.md` and
+> [Using the documentation](/about/using-the-documentation.html).
+
+## Settings
+
+### Main navigation
+
+#### `/settings` — Settings
+
+**Docs (primary):**
+
+- `/guide/configuration/managing-users.html`
+  - Sections: Key concepts; Key terms; Default roles; User management
+
+### Governance
+
+#### `/settings/attestation-templates` — Attestation Templates
+
+**Docs (related):**
+
+- `/guide/attestation/approve-attestations.html`
+  - Sections: Prerequisites; Steps
+- `/guide/attestation/manage-attestations.html`
+  - Sections: Prerequisites; Add attestation templates; Test attestation schedules; Edit attestation periods; Cancel attestation periods; View attestations dashboard; Progress; Responses
+- `/guide/attestation/review-attestations.html`
+  - Sections: Prerequisites; Steps
+- `/guide/attestation/submit-attestations.html`
+  - Sections: Prerequisites; Steps
+- `/guide/attestation/working-with-attestations.html`
+  - Sections: Prerequisites; Key concepts; Where do I access attestations?; How does the attestation process work?; How are attestation submissions organized?; How do I create meaningful attestation questionnaires?; Manage attestations
+- `/guide/templates/customize-document-checker.html`
+  - Sections: Prerequisites; Manage regulations and policies; Manage assessments; Default assessments provided by ValidMind cannot be edited, only cloned.; Add or clone assessments; Add or edit assessment questions; Add assessment questions; Edit assessment questions
+
+- *No direct help link in frontend; related docs inferred from keywords.*
+
+### Main navigation
+
+#### `/settings/attestations` — /settings/attestations
+
+**Docs (primary):**
+
+- `/guide/attestation/manage-attestations.html`
+  - Sections: Prerequisites; Add attestation templates; Test attestation schedules; Edit attestation periods; Cancel attestation periods; View attestations dashboard; Progress; Responses
+- `/guide/shared/work-with-filters.html`
+
+**Docs (related):**
+
+- `/guide/attestation/approve-attestations.html`
+  - Sections: Prerequisites; Steps
+- `/guide/attestation/review-attestations.html`
+  - Sections: Prerequisites; Steps
+- `/guide/attestation/submit-attestations.html`
+  - Sections: Prerequisites; Steps
+- `/guide/attestation/working-with-attestations.html`
+  - Sections: Prerequisites; Key concepts; Where do I access attestations?; How does the attestation process work?; How are attestation submissions organized?; How do I create meaningful attestation questionnaires?; Manage attestations
+
+### Organization
+
+#### `/settings/authentication` — Authentication
+
+**Docs (primary):**
+
+- `/installation/security/configure-single-sign-on-sso.html`
+  - Sections: What is SSO?; Prerequisites; Step 1: Set up Microsoft Entra for SSO; Step 2: Contact ValidMind to enable SSO
+
+**Docs (related):**
+
+- `/guide/configuration/managing-your-organization.html`
+  - Sections: Prerequisites; Switch between organizations; Change names of organizations; Manage document defaults; Tracked changes; Numbered table and figure captions; Organization setup
+
+### Documents
+
+#### `/settings/block-library` — Block Library
+
+**Docs (primary):**
+
+- `/guide/templates/manage-text-block-library.html`
+  - Sections: Prerequisites; Add text blocks; Add existing text blocks to library; Duplicate text blocks; Edit text blocks; Delete text blocks
+
+**Docs (related):**
+
+- `/guide/templates/customize-document-checker.html`
+  - Sections: Prerequisites; Manage regulations and policies; Manage assessments; Default assessments provided by ValidMind cannot be edited, only cloned.; Add or clone assessments; Add or edit assessment questions; Add assessment questions; Edit assessment questions
+- `/guide/templates/customize-document-templates.html`
+  - Sections: Prerequisites; Edit template outlines; Configure assessment options; Edit YAML templates; Template schema; Troubleshooting YAML templates; Add text blocks to templates; Add text blocks via template outlines
+- `/guide/templates/manage-document-templates.html`
+  - Sections: Prerequisites; View document templates; Edit document template outlines; Swap document templates; View currently applied templates; Swap between templates; Duplicate document templates; Delete document templates
+- `/guide/templates/manage-document-types.html`
+  - Sections: Prerequisites; Add document types; Edit or delete document types; Development, Validation, and Monitoring document types are stock types and cannot be deleted.
+- `/guide/templates/manage-documents.html`
+  - Sections: Prerequisites; Add record documents; How do I get the best results when converting PDFs into editable documents?; How can I trust that the conversion is accurate?; Troubleshooting; My PDF conversion is stuck. What can I do?; Edit record documents; Delete record documents
+- `/guide/templates/working-with-document-templates.html`
+  - Sections: What's next
+
+### Main navigation
+
+#### `/settings/custom-fields` — /settings/custom-fields
+
+**Docs (primary):**
+
+- `/guide/model-inventory/manage-model-inventory-fields.html`
+  - Note: no matching `.qmd` source found
+
+### Documents
+
+#### `/settings/document-types` — Document Types
+
+**Docs (primary):**
+
+- `/guide/templates/manage-document-types.html`
+  - Sections: Prerequisites; Add document types; Edit or delete document types; Development, Validation, and Monitoring document types are stock types and cannot be deleted.
+
+**Docs (related):**
+
+- `/guide/templates/customize-document-checker.html`
+  - Sections: Prerequisites; Manage regulations and policies; Manage assessments; Default assessments provided by ValidMind cannot be edited, only cloned.; Add or clone assessments; Add or edit assessment questions; Add assessment questions; Edit assessment questions
+- `/guide/templates/customize-document-templates.html`
+  - Sections: Prerequisites; Edit template outlines; Configure assessment options; Edit YAML templates; Template schema; Troubleshooting YAML templates; Add text blocks to templates; Add text blocks via template outlines
+- `/guide/templates/manage-document-templates.html`
+  - Sections: Prerequisites; View document templates; Edit document template outlines; Swap document templates; View currently applied templates; Swap between templates; Duplicate document templates; Delete document templates
+- `/guide/templates/manage-documents.html`
+  - Sections: Prerequisites; Add record documents; How do I get the best results when converting PDFs into editable documents?; How can I trust that the conversion is accurate?; Troubleshooting; My PDF conversion is stuck. What can I do?; Edit record documents; Delete record documents
+- `/guide/templates/manage-text-block-library.html`
+  - Sections: Prerequisites; Add text blocks; Add existing text blocks to library; Duplicate text blocks; Edit text blocks; Delete text blocks
+- `/guide/templates/working-with-document-templates.html`
+  - Sections: What's next
+
+### Organization
+
+#### `/settings/email-notifications` — Email Notifications
+
+**Docs (primary):**
+
+- `/guide/configuration/manage-platform-notifications.html` (section: #customize-email-notifications)
+  - Sections: Prerequisites; View platform notifications; Review updates; Mark updates as read; Dismiss updates; Customize email notifications
+
+**Docs (related):**
+
+- `/guide/configuration/managing-your-organization.html`
+  - Sections: Prerequisites; Switch between organizations; Change names of organizations; Manage document defaults; Tracked changes; Numbered table and figure captions; Organization setup
+
+### Artifacts
+
+#### `/settings/finding-custom-fields` — Artifact Fields
+
+**Docs (primary):**
+
+- `/guide/model-validation/manage-model-finding-fields.html`
+  - Note: no matching `.qmd` source found
+
+**Docs (related):**
+
+- `/guide/templates/customize-document-checker.html`
+  - Sections: Prerequisites; Manage regulations and policies; Manage assessments; Default assessments provided by ValidMind cannot be edited, only cloned.; Add or clone assessments; Add or edit assessment questions; Add assessment questions; Edit assessment questions
+- `/guide/templates/customize-document-templates.html`
+  - Sections: Prerequisites; Edit template outlines; Configure assessment options; Edit YAML templates; Template schema; Troubleshooting YAML templates; Add text blocks to templates; Add text blocks via template outlines
+- `/guide/templates/manage-document-templates.html`
+  - Sections: Prerequisites; View document templates; Edit document template outlines; Swap document templates; View currently applied templates; Swap between templates; Duplicate document templates; Delete document templates
+- `/guide/templates/manage-document-types.html`
+  - Sections: Prerequisites; Add document types; Edit or delete document types; Development, Validation, and Monitoring document types are stock types and cannot be deleted.
+- `/guide/templates/manage-documents.html`
+  - Sections: Prerequisites; Add record documents; How do I get the best results when converting PDFs into editable documents?; How can I trust that the conversion is accurate?; Troubleshooting; My PDF conversion is stuck. What can I do?; Edit record documents; Delete record documents
+- `/guide/templates/manage-text-block-library.html`
+  - Sections: Prerequisites; Add text blocks; Add existing text blocks to library; Duplicate text blocks; Edit text blocks; Delete text blocks
+
+#### `/settings/finding-severities` — Artifact Severities
+
+**Docs (primary):**
+
+- `/guide/model-validation/manage-artifact-severities.html`
+  - Note: no matching `.qmd` source found
+
+**Docs (related):**
+
+- `/guide/templates/customize-document-checker.html`
+  - Sections: Prerequisites; Manage regulations and policies; Manage assessments; Default assessments provided by ValidMind cannot be edited, only cloned.; Add or clone assessments; Add or edit assessment questions; Add assessment questions; Edit assessment questions
+- `/guide/templates/customize-document-templates.html`
+  - Sections: Prerequisites; Edit template outlines; Configure assessment options; Edit YAML templates; Template schema; Troubleshooting YAML templates; Add text blocks to templates; Add text blocks via template outlines
+- `/guide/templates/manage-document-templates.html`
+  - Sections: Prerequisites; View document templates; Edit document template outlines; Swap document templates; View currently applied templates; Swap between templates; Duplicate document templates; Delete document templates
+- `/guide/templates/manage-document-types.html`
+  - Sections: Prerequisites; Add document types; Edit or delete document types; Development, Validation, and Monitoring document types are stock types and cannot be deleted.
+- `/guide/templates/manage-documents.html`
+  - Sections: Prerequisites; Add record documents; How do I get the best results when converting PDFs into editable documents?; How can I trust that the conversion is accurate?; Troubleshooting; My PDF conversion is stuck. What can I do?; Edit record documents; Delete record documents
+- `/guide/templates/manage-text-block-library.html`
+  - Sections: Prerequisites; Add text blocks; Add existing text blocks to library; Duplicate text blocks; Edit text blocks; Delete text blocks
+
+#### `/settings/finding-types` — Artifact Types
+
+**Docs (primary):**
+
+- `/guide/model-validation/manage-artifact-types.html`
+  - Note: no matching `.qmd` source found
+
+**Docs (related):**
+
+- `/guide/templates/customize-document-checker.html`
+  - Sections: Prerequisites; Manage regulations and policies; Manage assessments; Default assessments provided by ValidMind cannot be edited, only cloned.; Add or clone assessments; Add or edit assessment questions; Add assessment questions; Edit assessment questions
+- `/guide/templates/customize-document-templates.html`
+  - Sections: Prerequisites; Edit template outlines; Configure assessment options; Edit YAML templates; Template schema; Troubleshooting YAML templates; Add text blocks to templates; Add text blocks via template outlines
+- `/guide/templates/manage-document-templates.html`
+  - Sections: Prerequisites; View document templates; Edit document template outlines; Swap document templates; View currently applied templates; Swap between templates; Duplicate document templates; Delete document templates
+- `/guide/templates/manage-document-types.html`
+  - Sections: Prerequisites; Add document types; Edit or delete document types; Development, Validation, and Monitoring document types are stock types and cannot be deleted.
+- `/guide/templates/manage-documents.html`
+  - Sections: Prerequisites; Add record documents; How do I get the best results when converting PDFs into editable documents?; How can I trust that the conversion is accurate?; Troubleshooting; My PDF conversion is stuck. What can I do?; Edit record documents; Delete record documents
+- `/guide/templates/manage-text-block-library.html`
+  - Sections: Prerequisites; Add text blocks; Add existing text blocks to library; Duplicate text blocks; Edit text blocks; Delete text blocks
+
+### Users & Access
+
+#### `/settings/groups` — Groups
+
+**Docs (primary):**
+
+- `/guide/configuration/manage-groups.html`
+  - Sections: Prerequisites; View group details; Add new groups; Remove groups; Add or remove group members
+
+**Docs (related):**
+
+- `/guide/configuration/manage-users.html`
+  - Sections: Prerequisites; View and search for users; Manage user invitations; Invite new users; Monitor user invitations; Manage user roles
+- `/guide/configuration/managing-users.html`
+  - Sections: Key concepts; Key terms; Default roles; User management
+
+### Integrations
+
+#### `/settings/integrations/connections` — Connections
+
+**Docs (related):**
+
+- `/faq/faq-integrations.html`
+  - Sections: Which languages, libraries, and environments do you support?; Currently, we support **Python** and the most popular AI/ML and data science libraries.; What test ingestion or modeling techniques are supported?; What large language model (LLM) features are offered?; What deployment options are supported by ValidMind?; Learn more
+- `/guide/configuration/configure-aws-privatelink.html`
+  - Sections: Prerequisites; VPC service information; Steps; What's next
+- `/guide/configuration/configure-azure-private-link.html`
+  - Sections: Prerequisites; VNet service information; Steps; What's next
+- `/guide/configuration/configure-google-private-service-connect.html`
+  - Sections: Prerequisites; VPC service information; Configure your Google Cloud Platform project; Request access from ValidMind; Prepare your network for connection; Create an endpoint to connect to ValidMind; Steps; Create an endpoint to connect to the ValidMind authentication service
+- `/guide/configuration/customize-your-dashboard.html`
+  - Sections: Prerequisites; Manage dashboards; Add dashboards; Edit or remove dashboards; Manage widgets; Arrange widgets; Add widgets; Remove widgets
+- `/guide/configuration/manage-groups.html`
+  - Sections: Prerequisites; View group details; Add new groups; Remove groups; Add or remove group members
+
+- *No direct help link in frontend; related docs inferred from keywords.*
+
+#### `/settings/integrations/data-exports` — Analytics Exports
+
+**Docs (related):**
+
+- `/faq/faq-integrations.html`
+  - Sections: Which languages, libraries, and environments do you support?; Currently, we support **Python** and the most popular AI/ML and data science libraries.; What test ingestion or modeling techniques are supported?; What large language model (LLM) features are offered?; What deployment options are supported by ValidMind?; Learn more
+- `/faq/faq-reporting.html`
+  - Sections: What analytic features are offered by ValidMind?; Learn more
+- `/guide/configuration/configure-aws-privatelink.html`
+  - Sections: Prerequisites; VPC service information; Steps; What's next
+- `/guide/configuration/configure-azure-private-link.html`
+  - Sections: Prerequisites; VNet service information; Steps; What's next
+- `/guide/configuration/configure-google-private-service-connect.html`
+  - Sections: Prerequisites; VPC service information; Configure your Google Cloud Platform project; Request access from ValidMind; Prepare your network for connection; Create an endpoint to connect to ValidMind; Steps; Create an endpoint to connect to the ValidMind authentication service
+- `/guide/configuration/customize-your-dashboard.html`
+  - Sections: Prerequisites; Manage dashboards; Add dashboards; Edit or remove dashboards; Manage widgets; Arrange widgets; Add widgets; Remove widgets
+
+- *No direct help link in frontend; related docs inferred from keywords.*
+
+#### `/settings/integrations/secrets` — Secrets
+
+**Docs (related):**
+
+- `/faq/faq-integrations.html`
+  - Sections: Which languages, libraries, and environments do you support?; Currently, we support **Python** and the most popular AI/ML and data science libraries.; What test ingestion or modeling techniques are supported?; What large language model (LLM) features are offered?; What deployment options are supported by ValidMind?; Learn more
+- `/guide/configuration/configure-aws-privatelink.html`
+  - Sections: Prerequisites; VPC service information; Steps; What's next
+- `/guide/configuration/configure-azure-private-link.html`
+  - Sections: Prerequisites; VNet service information; Steps; What's next
+- `/guide/configuration/configure-google-private-service-connect.html`
+  - Sections: Prerequisites; VPC service information; Configure your Google Cloud Platform project; Request access from ValidMind; Prepare your network for connection; Create an endpoint to connect to ValidMind; Steps; Create an endpoint to connect to the ValidMind authentication service
+- `/guide/configuration/customize-your-dashboard.html`
+  - Sections: Prerequisites; Manage dashboards; Add dashboards; Edit or remove dashboards; Manage widgets; Arrange widgets; Add widgets; Remove widgets
+- `/guide/configuration/manage-groups.html`
+  - Sections: Prerequisites; View group details; Add new groups; Remove groups; Add or remove group members
+
+- *No direct help link in frontend; related docs inferred from keywords.*
+
+### Users & Access
+
+#### `/settings/invitation` — Invite New Users
+
+**Docs (primary):**
+
+- `/guide/configuration/managing-users.html`
+  - Sections: Key concepts; Key terms; Default roles; User management
+- `/guide/configuration/manage-users.html` (section: #manage-user-invitations)
+  - Sections: Prerequisites; View and search for users; Manage user invitations; Invite new users; Monitor user invitations; Manage user roles
+
+### Organization
+
+#### `/settings/organization` — Organization
+
+**Docs (primary):**
+
+- `/guide/configuration/managing-your-organization.html`
+  - Sections: Prerequisites; Switch between organizations; Change names of organizations; Manage document defaults; Tracked changes; Numbered table and figure captions; Organization setup
+
+### Users & Access
+
+#### `/settings/permissions` — Permissions
+
+**Docs (primary):**
+
+- `/guide/configuration/manage-permissions.html`
+  - Sections: Prerequisites; Steps
+
+**Docs (related):**
+
+- `/guide/configuration/manage-users.html`
+  - Sections: Prerequisites; View and search for users; Manage user invitations; Invite new users; Monitor user invitations; Manage user roles
+- `/guide/configuration/managing-users.html`
+  - Sections: Key concepts; Key terms; Default roles; User management
+
+### Main navigation
+
+#### `/settings/primary-record-type-stages` — /settings/primary-record-type-stages
+
+**Docs (primary):**
+
+- `/guide/workflows/manage-model-stages.html`
+  - Note: no matching `.qmd` source found
+
+### Your Account
+
+#### `/settings/profile` — Profile
+
+**Docs (primary):**
+
+- `/guide/configuration/view-your-profile.html`
+  - Note: no matching `.qmd` source found
+
+**Docs (related):**
+
+- `/guide/configuration/manage-your-profile.html`
+  - Sections: Prerequisites; Access your profile; Onboarding; User Interface Preferences; Terms; Localization; Access Keys; To revoke and regenerate keys, click **Revoke & Regenerate Keys**.
+- `/guide/configuration/personalizing-validmind.html`
+
+### Main navigation
+
+#### `/settings/regulation-policy` — /settings/regulation-policy
+
+**Docs (primary):**
+
+- `/guide/templates/customize-virtual-document-validator.html` (section: #add-or-edit-assessment-questions)
+  - Note: no matching `.qmd` source found
+
+### Governance
+
+#### `/settings/regulations` — Regulations & Policies
+
+- *No direct help link; content may be covered under scattered guide sections.*
+
+#### `/settings/risk-areas` — Risk Areas & Validation Guidelines
+
+**Docs (primary):**
+
+- `/guide/model-validation/manage-validation-guidelines.html`
+  - Note: no matching `.qmd` source found
+
+### Users & Access
+
+#### `/settings/roles` — Roles
+
+**Docs (primary):**
+
+- `/guide/configuration/managing-users.html`
+  - Sections: Key concepts; Key terms; Default roles; User management
+- `/guide/configuration/manage-roles.html`
+  - Sections: Prerequisites; Add or update roles; Two special default roles provided by ValidMind have unique characteristics.; Manage role permissions; Manage role users; Rename existing roles
+
+**Docs (related):**
+
+- `/guide/configuration/manage-users.html`
+  - Sections: Prerequisites; View and search for users; Manage user invitations; Invite new users; Monitor user invitations; Manage user roles
+
+### Main navigation
+
+#### `/settings/stakeholders` — /settings/stakeholders
+
+**Docs (primary):**
+
+- `/guide/configuration/manage-model-stakeholder-types.html`
+  - Note: no matching `.qmd` source found
+
+#### `/settings/statuses` — /settings/statuses
+
+**Docs (primary):**
+
+- `/guide/workflows/manage-model-stages.html`
+  - Note: no matching `.qmd` source found
+
+### Documents
+
+#### `/settings/templates` — Templates
+
+**Docs (primary):**
+
+- `/guide/templates/customize-document-templates.html`
+  - Sections: Prerequisites; Edit template outlines; Configure assessment options; Edit YAML templates; Template schema; Troubleshooting YAML templates; Add text blocks to templates; Add text blocks via template outlines
+
+**Docs (related):**
+
+- `/guide/templates/customize-document-checker.html`
+  - Sections: Prerequisites; Manage regulations and policies; Manage assessments; Default assessments provided by ValidMind cannot be edited, only cloned.; Add or clone assessments; Add or edit assessment questions; Add assessment questions; Edit assessment questions
+- `/guide/templates/manage-document-templates.html`
+  - Sections: Prerequisites; View document templates; Edit document template outlines; Swap document templates; View currently applied templates; Swap between templates; Duplicate document templates; Delete document templates
+- `/guide/templates/manage-document-types.html`
+  - Sections: Prerequisites; Add document types; Edit or delete document types; Development, Validation, and Monitoring document types are stock types and cannot be deleted.
+- `/guide/templates/manage-documents.html`
+  - Sections: Prerequisites; Add record documents; How do I get the best results when converting PDFs into editable documents?; How can I trust that the conversion is accurate?; Troubleshooting; My PDF conversion is stuck. What can I do?; Edit record documents; Delete record documents
+- `/guide/templates/manage-text-block-library.html`
+  - Sections: Prerequisites; Add text blocks; Add existing text blocks to library; Duplicate text blocks; Edit text blocks; Delete text blocks
+- `/guide/templates/working-with-document-templates.html`
+  - Sections: What's next
+
+### Your Account
+
+#### `/settings/theme-customization` — Theme Customization
+
+- *No direct help link; content may be covered under scattered guide sections.*
+
+### Users & Access
+
+#### `/settings/user-directory` — User Directory
+
+**Docs (primary):**
+
+- `/guide/configuration/managing-users.html`
+  - Sections: Key concepts; Key terms; Default roles; User management
+- `/guide/configuration/manage-users.html`
+  - Sections: Prerequisites; View and search for users; Manage user invitations; Invite new users; Monitor user invitations; Manage user roles
+
+### Governance
+
+#### `/settings/workflow-states` — Workflow States
+
+**Docs (primary):**
+
+- `/guide/workflows/workflow-states.html`
+  - Sections: Prerequisites; Manage workflow states
+
+**Docs (related):**
+
+- `/faq/faq-workflows.html`
+  - Sections: Can I customize workflows within ValidMind?; What statuses are available for use in workflows?; Can we work with disconnected workflows?; You can also leverage the ValidMind Library once you are ready to document a specific record (model) for review and validation.; Learn more
+- `/guide/integrations/integrations-examples/use-webhooks-with-workflows.html`
+  - Sections: Prerequisites; Start a workflow via webhook; a. Configure workflow in ValidMind; b. Start workflow from external system; Trigger a paused workflow to continue; a. Configure workflow in ValidMind; b. Trigger workflow to continue from external system
+- `/guide/workflows/conditional-step-requirements.html`
+  - Sections: Prerequisites; Configure conditional requirements
+- `/guide/workflows/configure-workflows.html`
+  - Sections: Prerequisites; Create custom workflows; 1. Add new workflows; 2. Configure workflow steps; 3. Link workflow together; Workflow steps relationship unclear on your canvas?; 4. Publish workflow; Clone existing workflows
+- `/guide/workflows/introduction-to-workflows.html`
+  - Sections: Workflow elements; What's next
+- `/guide/workflows/manage-record-stages.html`
+  - Sections: Prerequisites; Add record stages; Edit or delete record stages
+
+#### `/settings/workflows` — Workflows
+
+**Docs (primary):**
+
+- `/guide/workflows/setting-up-workflows.html`
+  - Sections: View, sort, and filter workflows; Sort workflows; Filter workflows; How do I create effective filters?; Set up workflows; What's next
+
+**Docs (related):**
+
+- `/faq/faq-workflows.html`
+  - Sections: Can I customize workflows within ValidMind?; What statuses are available for use in workflows?; Can we work with disconnected workflows?; You can also leverage the ValidMind Library once you are ready to document a specific record (model) for review and validation.; Learn more
+- `/guide/integrations/integrations-examples/use-webhooks-with-workflows.html`
+  - Sections: Prerequisites; Start a workflow via webhook; a. Configure workflow in ValidMind; b. Start workflow from external system; Trigger a paused workflow to continue; a. Configure workflow in ValidMind; b. Trigger workflow to continue from external system
+- `/guide/workflows/conditional-step-requirements.html`
+  - Sections: Prerequisites; Configure conditional requirements
+- `/guide/workflows/configure-workflows.html`
+  - Sections: Prerequisites; Create custom workflows; 1. Add new workflows; 2. Configure workflow steps; 3. Link workflow together; Workflow steps relationship unclear on your canvas?; 4. Publish workflow; Clone existing workflows
+- `/guide/workflows/introduction-to-workflows.html`
+  - Sections: Workflow elements; What's next
+- `/guide/workflows/manage-record-stages.html`
+  - Sections: Prerequisites; Add record stages; Edit or delete record stages
+
+## Main application
+
+#### `/analytics` — Analytics
+
+**Docs (related):**
+
+- `/faq/faq-reporting.html`
+  - Sections: What analytic features are offered by ValidMind?; Learn more
+- `/guide/monitoring/enable-monitoring.html`
+  - Sections: Prerequisites; Steps; 1. Get monitoring code snippet; 2. Select monitoring template; 3. Run code snippet; A template must already be applied to your selected document to populate monitoring test results in the ValidMind Platform.; What's next
+- `/guide/monitoring/ongoing-monitoring.html`
+  - Sections: Monitoring scenarios; Ongoing monitoring plan; Key concepts; Design and implementation; Testing; Manage ongoing monitoring; Code samples; Available tests
+- `/guide/monitoring/review-monitoring-results.html`
+  - Sections: Prerequisites; Steps; Example monitoring test results; Satisfactory; Requires Attention
+- `/guide/monitoring/set-thresholds-and-alerts.html`
+  - Sections: Prerequisites; Use a custom function; Set the `passed` parameter; Output examples; Alert notifications
+- `/guide/monitoring/work-with-metrics-over-time.html`
+  - Sections: **Log metrics over time**; Prerequisites; Add metrics over time; Add integration metrics; Use the global time range; View metric over time metadata
+
+- *No direct help link in frontend; related docs inferred from keywords.*
+
+#### `/artifacts` — Artifacts
+
+**Docs (related):**
+
+- `/guide/templates/customize-document-checker.html`
+  - Sections: Prerequisites; Manage regulations and policies; Manage assessments; Default assessments provided by ValidMind cannot be edited, only cloned.; Add or clone assessments; Add or edit assessment questions; Add assessment questions; Edit assessment questions
+- `/guide/templates/customize-document-templates.html`
+  - Sections: Prerequisites; Edit template outlines; Configure assessment options; Edit YAML templates; Template schema; Troubleshooting YAML templates; Add text blocks to templates; Add text blocks via template outlines
+- `/guide/templates/manage-document-templates.html`
+  - Sections: Prerequisites; View document templates; Edit document template outlines; Swap document templates; View currently applied templates; Swap between templates; Duplicate document templates; Delete document templates
+- `/guide/templates/manage-document-types.html`
+  - Sections: Prerequisites; Add document types; Edit or delete document types; Development, Validation, and Monitoring document types are stock types and cannot be deleted.
+- `/guide/templates/manage-documents.html`
+  - Sections: Prerequisites; Add record documents; How do I get the best results when converting PDFs into editable documents?; How can I trust that the conversion is accurate?; Troubleshooting; My PDF conversion is stuck. What can I do?; Edit record documents; Delete record documents
+- `/guide/templates/manage-text-block-library.html`
+  - Sections: Prerequisites; Add text blocks; Add existing text blocks to library; Duplicate text blocks; Edit text blocks; Delete text blocks
+
+- *No direct help link in frontend; related docs inferred from keywords.*
+
+#### `/attestations` — Attestations
+
+**Docs (related):**
+
+- `/guide/attestation/approve-attestations.html`
+  - Sections: Prerequisites; Steps
+- `/guide/attestation/manage-attestations.html`
+  - Sections: Prerequisites; Add attestation templates; Test attestation schedules; Edit attestation periods; Cancel attestation periods; View attestations dashboard; Progress; Responses
+- `/guide/attestation/review-attestations.html`
+  - Sections: Prerequisites; Steps
+- `/guide/attestation/submit-attestations.html`
+  - Sections: Prerequisites; Steps
+- `/guide/attestation/working-with-attestations.html`
+  - Sections: Prerequisites; Key concepts; Where do I access attestations?; How does the attestation process work?; How are attestation submissions organized?; How do I create meaningful attestation questionnaires?; Manage attestations
+
+- *No direct help link in frontend; related docs inferred from keywords.*
+
+#### `/dashboard` — Dashboard
+
+**Docs (related):**
+
+- `/guide/configuration/customize-your-dashboard.html`
+  - Sections: Prerequisites; Manage dashboards; Add dashboards; Edit or remove dashboards; Manage widgets; Arrange widgets; Add widgets; Remove widgets
+
+- *No direct help link in frontend; related docs inferred from keywords.*
+
+#### `/validation-issues` — Validation Issues
+
+- *No direct help link; content may be covered under scattered guide sections.*
+
+#### `/workflows` — Workflows
+
+**Docs (related):**
+
+- `/faq/faq-workflows.html`
+  - Sections: Can I customize workflows within ValidMind?; What statuses are available for use in workflows?; Can we work with disconnected workflows?; You can also leverage the ValidMind Library once you are ready to document a specific record (model) for review and validation.; Learn more
+- `/guide/integrations/integrations-examples/use-webhooks-with-workflows.html`
+  - Sections: Prerequisites; Start a workflow via webhook; a. Configure workflow in ValidMind; b. Start workflow from external system; Trigger a paused workflow to continue; a. Configure workflow in ValidMind; b. Trigger workflow to continue from external system
+- `/guide/workflows/conditional-step-requirements.html`
+  - Sections: Prerequisites; Configure conditional requirements
+- `/guide/workflows/configure-workflows.html`
+  - Sections: Prerequisites; Create custom workflows; 1. Add new workflows; 2. Configure workflow steps; 3. Link workflow together; Workflow steps relationship unclear on your canvas?; 4. Publish workflow; Clone existing workflows
+- `/guide/workflows/introduction-to-workflows.html`
+  - Sections: Workflow elements; What's next
+- `/guide/workflows/manage-record-stages.html`
+  - Sections: Prerequisites; Add record stages; Edit or delete record stages
+
+- *No direct help link in frontend; related docs inferred from keywords.*
+
+## Documentation index (human-oriented)
+
+See `AGENTS.md` and `about/using-the-documentation.md` in the LLM corpus for guides organized by feature area (Configuration, Workflows, Inventory, etc.).
diff --git a/site/llm/render.sh b/site/llm/render.sh
index 78f690302f..e4ef0c4240 100755
--- a/site/llm/render.sh
+++ b/site/llm/render.sh
@@ -30,7 +30,8 @@ project:
     - "**/*.qmd"
     - "!notebooks/"
     - "!404.qmd"
-    - "!about/contributing/"
+    - "!about/contributing/validmind-community.qmd"
+    - "!about/contributing/style-guide/"
     - "!about/deployment/"
     - "!about/fine-print/"
     - "!llm/"
@@ -51,6 +52,20 @@ EOF
 echo "=== Rendering site to GFM markdown ==="
 quarto render --to gfm
 
+# Generate the chatbot product map, then copy it and AGENTS.md into the LLM output so the docs
+# chatbot can ingest both. AGENTS.md lives at the repo root so IDE/agent tooling finds it there.
+echo ""
+echo "=== Generating chatbot product map ==="
+python3 scripts/generate_chatbot_product_map.py
+
+echo ""
+echo "=== Copying AGENTS.md from repo root into LLM output ==="
+cp ../AGENTS.md llm/_llm-output/AGENTS.md
+
+echo ""
+echo "=== Copying chatbot product map into LLM output ==="
+cp llm/chatbot-product-map.md llm/_llm-output/chatbot-product-map.md
+
 echo ""
 echo "=== Post-processing markdown files ==="
 bash llm/clean.sh
diff --git a/site/notebooks.zip b/site/notebooks.zip
index 4c7216bea5..f505f25d90 100644
Binary files a/site/notebooks.zip and b/site/notebooks.zip differ
diff --git a/site/notebooks/EXECUTED/development/1-set_up_validmind.ipynb b/site/notebooks/EXECUTED/development/1-set_up_validmind.ipynb
new file mode 100644
index 0000000000..9ba5431049
--- /dev/null
+++ b/site/notebooks/EXECUTED/development/1-set_up_validmind.ipynb
@@ -0,0 +1,481 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# ValidMind for development 1 — Set up the ValidMind Library\n",
+        "\n",
+        "Learn how to use ValidMind for your end-to-end documentation process based on common development scenarios with our series of four introductory notebooks. This first notebook walks you through the initial setup of the ValidMind Library.\n",
+        "\n",
+        "These notebooks use a binary classification model as an example, but the same principles shown here apply to other record (model) types.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
+        "<br></br>\n",
+        "Our course tailor-made for developers new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Developer Fundamentals</b></a></div>"
+      ],
+      "id": "3bd9bc41"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Introduction](#toc1__)    \n",
+        "- [About ValidMind](#toc2__)    \n",
+        "  - [Before you begin](#toc2_1__)    \n",
+        "  - [New to ValidMind?](#toc2_2__)    \n",
+        "  - [Key concepts](#toc2_3__)    \n",
+        "- [Setting up](#toc3__)    \n",
+        "  - [Install the ValidMind Library](#toc3_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc3_2__)    \n",
+        "    - [Register sample model](#toc3_2_1__)    \n",
+        "    - [Apply documentation template](#toc3_2_2__)    \n",
+        "    - [Get your code snippet](#toc3_2_3__)    \n",
+        "- [Getting to know ValidMind](#toc4__)    \n",
+        "  - [Preview the documentation template](#toc4_1__)    \n",
+        "    - [View documentation in the ValidMind Platform](#toc4_1_1__)    \n",
+        "  - [Explore available tests](#toc4_2__)    \n",
+        "- [Upgrade ValidMind](#toc5__)    \n",
+        "- [In summary](#toc6__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Start the development process](#toc7_1__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "b4b7c002"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Introduction\n",
+        "\n",
+        "Development aims to produce a fit-for-purpose *champion* by conducting thorough testing and analysis, supporting the capabilities of the champion with evidence in the form of documentation and test results. Documentation should be clear and comprehensive, ideally following a structure or template covering all aspects of compliance with risk regulation.\n",
+        "\n",
+        "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
+        "\n",
+        "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
+        "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
+      ],
+      "id": "7b7de259"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models. \n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators."
+      ],
+      "id": "b68b9958"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ],
+      "id": "3b520a7e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ],
+      "id": "9b3108db"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "f97d4266"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "bf5cd6c2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ],
+      "id": "95bf9e4b"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "827eb6bd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library\n",
+        "\n",
+        "The ValidMind Library provides a rich collection of documentation tools and test suites, from documenting descriptions of datasets to validation and testing using a variety of open-source testing frameworks."
+      ],
+      "id": "ad74254d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ],
+      "id": "a48cd34d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "8ad7e39a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "3339f683"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "a58d951f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Getting to know ValidMind"
+      ],
+      "id": "61a021f3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ],
+      "id": "852db20d"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "819a40bc"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1_1__'></a>\n",
+        "\n",
+        "#### View documentation in the ValidMind Platform\n",
+        "\n",
+        "Next, let's head to the ValidMind Platform to see the template in action:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this \"ValidMind for development\" series of notebooks.\n",
+        "\n",
+        "3. Click **Development** under Documents for your model and note how the structure of the documentation matches our preview above."
+      ],
+      "id": "65ed2873"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Explore available tests\n",
+        "\n",
+        "Next, let's explore the list of all available tests in the ValidMind Library with [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) — we'll learn how to run tests shortly. \n",
+        "\n",
+        "You can see that the documentation template for this model has references to some of the **test `ID`s used to run tests listed below:**"
+      ],
+      "id": "cdbb94d2"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "7ccc7776"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ],
+      "id": "786f0d9c"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "f5d3216d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ],
+      "id": "d2010ad4"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for changes to be applied."
+      ],
+      "id": "b637c5c6"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this first notebook, you learned how to:\n",
+        "\n",
+        "- [x] Register a record (model) within the ValidMind Platform\n",
+        "- [x] Install and initialize the ValidMind Library\n",
+        "- [x] Preview the documentation template for your model\n",
+        "- [x] Explore the available tests offered by the ValidMind Library"
+      ],
+      "id": "dfef8925"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps"
+      ],
+      "id": "186bee4f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Start the development process\n",
+        "\n",
+        "Now that the ValidMind Library is connected to your model in the ValidMind Platform with the correct template applied, we can go ahead and start the development process: **[2 — Start the development process](2-start_development_process.ipynb)**"
+      ],
+      "id": "7dbb07a1"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-63fcb66be39b42d38ad874a72a66581b"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}
diff --git a/site/notebooks/EXECUTED/model_development/2-start_development_process.ipynb b/site/notebooks/EXECUTED/development/2-start_development_process.ipynb
similarity index 89%
rename from site/notebooks/EXECUTED/model_development/2-start_development_process.ipynb
rename to site/notebooks/EXECUTED/development/2-start_development_process.ipynb
index b01cb35361..4016e2a97a 100644
--- a/site/notebooks/EXECUTED/model_development/2-start_development_process.ipynb
+++ b/site/notebooks/EXECUTED/development/2-start_development_process.ipynb
@@ -4,17 +4,17 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "# ValidMind for model development 2 — Start the model development process\n",
+    "# ValidMind for development 2 — Start the development process\n",
     "\n",
-    "Learn how to use ValidMind for your end-to-end model documentation process with our series of four introductory notebooks. In this second notebook, you'll run tests and investigate results, then add the results or evidence to your documentation.\n",
+    "Learn how to use ValidMind for your end-to-end documentation process with our series of four introductory notebooks. In this second notebook, you'll run tests and investigate results, then add the results or evidence to your documentation.\n",
     "\n",
-    "You'll become familiar with the individual tests available in ValidMind, as well as how to run them and change parameters as necessary. Using ValidMind's repository of individual tests as building blocks helps you ensure that a model is being built appropriately. \n",
+    "You'll become familiar with the individual tests available in ValidMind, as well as how to run them and change parameters as necessary. Using ValidMind's repository of individual tests as building blocks helps you ensure that a record (model) is being built appropriately.\n",
     "\n",
-    "**For a full list of out-of-the-box tests,** refer to our [Test descriptions](https://docs.validmind.ai/developer/model-testing/test-descriptions.html) or try the interactive [Test sandbox](https://docs.validmind.ai/developer/model-testing/test-sandbox.html).\n",
+    "**For a full list of out-of-the-box tests and descriptions,** use the interactive [ValidMind test sandbox](https://docs.validmind.ai/developer/how-to/test-sandbox.html).\n",
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
     "<br></br>\n",
-    "Our course tailor-made for developers new to ValidMind combines this series of notebooks with more a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Developer Fundamentals</b></a></div>"
+    "Our course tailor-made for developers new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Developer Fundamentals</b></a></div>\n"
    ]
   },
   {
@@ -29,24 +29,25 @@
     "  - [Import sample dataset](#toc2_2__)    \n",
     "  - [Identify qualitative tests](#toc2_3__)    \n",
     "  - [Initialize the ValidMind dataset](#toc2_4__)    \n",
-    "- [Running tests](#toc3__)    \n",
+    "- [Running tests on datasets](#toc3__)    \n",
     "  - [Run tabular data tests](#toc3_1__)    \n",
     "  - [Utilize test output](#toc3_2__)    \n",
     "- [Documenting test results](#toc4__)    \n",
     "  - [Run and log multiple tests](#toc4_1__)    \n",
     "  - [Run and log an individual test](#toc4_2__)    \n",
-    "    - [Add individual test results to model documentation](#toc4_2_1__)    \n",
-    "- [Model testing](#toc5__)    \n",
+    "    - [Add individual test results to documentation](#toc4_2_1__)    \n",
+    "- [Running model evaluation tests](#toc5__)    \n",
     "  - [Train simple logistic regression model](#toc5_1__)    \n",
-    "  - [Initialize model evaluation objects](#toc5_2__)    \n",
-    "  - [Assign predictions](#toc5_3__)    \n",
+    "  - [Initialize ValidMind datasets](#toc5_2__)    \n",
+    "  - [Initialize a ValidMind model](#toc5_3__)    \n",
+    "    - [Assign predictions](#toc5_3_1__)    \n",
     "  - [Run the model evaluation tests](#toc5_4__)    \n",
     "- [In summary](#toc6__)    \n",
     "- [Next steps](#toc7__)    \n",
     "  - [Integrate custom tests](#toc7_1__)    \n",
     "\n",
     ":::\n",
-    "<!-- jn-toc-notebook-configgs \n",
+    "<!-- jn-toc-notebook-config\n",
     "\tnumbering=false\n",
     "\tanchor=true\n",
     "\tflat=false\n",
@@ -64,7 +65,7 @@
     "\n",
     "## Prerequisites\n",
     "\n",
-    "In order to log test results or evidence to your model documentation with this notebook, you'll need to first have:\n",
+    "In order to log test results or evidence to your documentation with this notebook, you'll need to first have:\n",
     "\n",
     "- [x] Registered a model within the ValidMind Platform with a predefined documentation template\n",
     "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
@@ -94,8 +95,10 @@
     "First, let's connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -258,7 +261,7 @@
    "source": [
     "<a id='toc3__'></a>\n",
     "\n",
-    "## Running tests\n",
+    "## Running tests on datasets\n",
     "\n",
     "Now that we know how to initialize a ValidMind `dataset` object, we're ready to run some tests!\n",
     "\n",
@@ -276,9 +279,9 @@
     "\n",
     "### Run tabular data tests\n",
     "\n",
-    "The inputs expected by a test can also be found in the test definition — let's take [`validmind.data_validation.DescriptiveStatistics`](https://docs.validmind.ai/tests/data_validation/DescriptiveStatistics.html) as an example.\n",
+    "The inputs expected by a test can also be found in the test definition — let's take `validmind.data_validation.DescriptiveStatistics` as an example.\n",
     "\n",
-    "Note that the output of the [`describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) below shows that this test expects a `dataset` as input:"
+    "Note that the output of the [`describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) below shows that this test expects a `dataset` as input:\n"
    ]
   },
   {
@@ -326,9 +329,9 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "The output above shows that [the class imbalance test](https://docs.validmind.ai/tests/data_validation/ClassImbalance.html) did not pass according to the value we set for `min_percent_threshold`.\n",
+    "The output above shows that the `validmind.data_validation.ClassImbalance` test did not pass according to the value we set for `min_percent_threshold`.\n",
     "\n",
-    "To address this issue, we'll re-run the test on some processed data. In this case let's apply a very simple rebalancing technique to the dataset:"
+    "To address this issue, we'll re-run the test on some processed data. In this case let's apply a very simple rebalancing technique to the dataset:\n"
    ]
   },
   {
@@ -398,7 +401,7 @@
     "\n",
     "Below we demonstrate how to retrieve the list of features with the highest correlation coefficients and use them to reduce the final list of features for modeling.\n",
     "\n",
-    "First, we'll run [`validmind.data_validation.HighPearsonCorrelation`](https://docs.validmind.ai/tests/data_validation/HighPearsonCorrelation.html) with the `balanced_raw_dataset` we initialized previously as input as is for comparison with later runs:"
+    "First, we'll run `validmind.data_validation.HighPearsonCorrelation` with the `balanced_raw_dataset` we initialized previously as input as is for comparison with later runs:\n"
    ]
   },
   {
@@ -574,9 +577,9 @@
     "Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform:\n",
     "\n",
     "- When using `run_documentation_tests()`, documentation sections will be automatically populated with the results of all tests registered in the documentation template.\n",
-    "- When logging individual test results to the platform, you'll need to manually add those results to the desired section of the model documentation.\n",
+    "- When logging individual test results to the platform, you'll need to manually add those results to the desired section of the documentation.\n",
     "\n",
-    "To demonstrate how to add test results to your model documentation, we'll populate the entire **Data Preparation** section of the documentation using the clean `vm_raw_dataset_preprocessed` dataset as input, and then document an additional individual result for the highly correlated dataset `vm_balanced_raw_dataset`."
+    "To demonstrate how to add test results to your documentation, we'll populate the entire **Data Preparation** section of the documentation using the clean `vm_raw_dataset_preprocessed` dataset as input, and then document an additional individual result for the highly correlated dataset `vm_balanced_raw_dataset`."
    ]
   },
   {
@@ -661,7 +664,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for this particular test ID. </b></span>\n",
+    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for this particular test ID. </b></span>\n",
     "<br></br>\n",
     "That's expected, as when we run individual tests the results logged need to be manually added to your documentation within the ValidMind Platform.</div>"
    ]
@@ -672,9 +675,9 @@
    "source": [
     "<a id='toc4_2_1__'></a>\n",
     "\n",
-    "#### Add individual test results to model documentation\n",
+    "#### Add individual test results to documentation\n",
     "\n",
-    "With the test results logged, let's head to the model we connected to at the beginning of this notebook and insert our test results into the documentation ([Need more help?](https://docs.validmind.ai/developer/model-documentation/work-with-test-results.html)):\n",
+    "With the test results logged, let's head to the model we connected to at the beginning of this notebook and insert our test results into the documentation (**Learn more:** [Work with test results](https://docs.validmind.ai/guide/documentation/work-with-test-results.html)):\n",
     "\n",
     "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
     "\n",
@@ -713,7 +716,7 @@
    "source": [
     "<a id='toc5__'></a>\n",
     "\n",
-    "## Model testing\n",
+    "## Running model evaluation tests\n",
     "\n",
     "So far, we've focused on the data assessment and pre-processing that usually occurs prior to any models being built. Now, let's instead assume we have already built a model and we want to incorporate some model results into our documentation."
    ]
@@ -830,7 +833,7 @@
    "source": [
     "<a id='toc5_2__'></a>\n",
     "\n",
-    "### Initialize model evaluation objects\n",
+    "### Initialize ValidMind datasets\n",
     "\n",
     "The last step for evaluating the model's performance is to initialize the ValidMind `Dataset` and `Model` objects in preparation for assigning model predictions to each dataset."
    ]
@@ -859,9 +862,16 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
+    "<a id='toc5_3__'></a>\n",
+    "\n",
+    "### Initialize a ValidMind model\n",
+    "\n",
     "You'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our three models.\n",
     "\n",
-    "You simply initialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+    "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+    "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+    "\n",
+    "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
    ]
   },
   {
@@ -878,11 +888,11 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "<a id='toc5_3__'></a>\n",
+    "<a id='toc5_3_1__'></a>\n",
     "\n",
-    "### Assign predictions\n",
+    "#### Assign predictions\n",
     "\n",
-    "Once the model has been registered you can assign model predictions to the training and testing datasets.\n",
+    "Once the model has been registered you can assign predictions to the training and testing datasets.\n",
     "\n",
     "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
     "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
@@ -908,10 +918,10 @@
     "\n",
     "### Run the model evaluation tests\n",
     "\n",
-    "In this next example, we'll focus on running the tests within the Model Development section of the model documentation. Only tests associated with this section will be executed, and the corresponding results will be updated in the model documentation.\n",
+    "In this next example, we'll focus on running the tests within the Model Development section of the documentation. Only tests associated with this section will be executed, and the corresponding results will be updated in the documentation.\n",
     "\n",
     "- Note the additional config that is passed to `run_documentation_tests()` — this allows you to override `inputs` or `params` in certain tests.\n",
-    "- In our case, we want to explicitly use the `vm_train_ds` for the [`validmind.model_validation.sklearn.ClassifierPerformance:in_sample` test](https://docs.validmind.ai/tests/model_validation/sklearn/ClassifierPerformance.html), since it's supposed to run on the training dataset and not the test dataset."
+    "- In our case, we want to explicitly use the `vm_train_ds` for the `validmind.model_validation.sklearn.ClassifierPerformance:in_sample` test, since it's supposed to run on the training dataset and not the test dataset.\n"
    ]
   },
   {
@@ -959,7 +969,7 @@
     "- [x] Utilize the output from tests you've run\n",
     "- [x] Log test results from sets of or individual tests as evidence to the ValidMind Platform\n",
     "- [x] Add supplementary individual test results to your documentation\n",
-    "- [x] Assign model predictions to your ValidMind model objects"
+    "- [x] Assign predictions to your ValidMind model objects"
    ]
   },
   {
@@ -979,12 +989,12 @@
     "\n",
     "### Integrate custom tests\n",
     "\n",
-    "Now that you're familiar with the basics of using the ValidMind Library to run and log tests to provide evidence for your model documentation, let's learn how to incorporate your own custom tests into ValidMind: **[3 — Integrate custom tests](3-integrate_custom_tests.ipynb)**"
+    "Now that you're familiar with the basics of using the ValidMind Library to run and log tests to provide evidence for your documentation, let's learn how to incorporate your own custom tests into ValidMind: **[3 — Integrate custom tests](3-integrate_custom_tests.ipynb)**"
    ]
   },
   {
    "cell_type": "markdown",
-   "id": "copyright-b0df0754a7a74581809f22d50b198597",
+   "id": "copyright-f012d0fd2e1f44e38b70b6ad06ae0e67",
    "metadata": {},
    "source": [
     "<!-- VALIDMIND COPYRIGHT -->\n",
diff --git a/site/notebooks/tutorials/model_development/3-integrate_custom_tests.ipynb b/site/notebooks/EXECUTED/development/3-integrate_custom_tests.ipynb
similarity index 95%
rename from site/notebooks/tutorials/model_development/3-integrate_custom_tests.ipynb
rename to site/notebooks/EXECUTED/development/3-integrate_custom_tests.ipynb
index b4b990346b..7f32f3e454 100644
--- a/site/notebooks/tutorials/model_development/3-integrate_custom_tests.ipynb
+++ b/site/notebooks/EXECUTED/development/3-integrate_custom_tests.ipynb
@@ -4,14 +4,14 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "# ValidMind for model development 3 — Integrate custom tests\n",
+    "# ValidMind for development 3 — Integrate custom tests\n",
     "\n",
-    "Learn how to use ValidMind for your end-to-end model documentation process with our series of four introductory notebooks. In this third notebook, supplement ValidMind tests with your own and include them as additional evidence in your documentation.\n",
+    "Learn how to use ValidMind for your end-to-end documentation process with our series of four introductory notebooks. In this third notebook, supplement ValidMind tests with your own and include them as additional evidence in your documentation.\n",
     "\n",
     "This notebook assumes that you already have a repository of custom made tests considered critical to include in your documentation. A custom test is any function that takes a set of inputs and parameters as arguments and returns one or more outputs:\n",
     "\n",
     "- The function can be as simple or as complex as you need it to be — it can use external libraries, make API calls, or do anything else that you can do in Python.\n",
-    "- The only requirement is that the function signature and return values can be \"understood\" and handled by the ValidMind Library. As such, custom tests offer added flexibility by extending the default tests provided by ValidMind, enabling you to document any type of model or use case.\n",
+    "- The only requirement is that the function signature and return values can be \"understood\" and handled by the ValidMind Library. As such, custom tests offer added flexibility by extending the default tests provided by ValidMind, enabling you to document any type of record (model) or use case.\n",
     "\n",
     "**For a more in-depth introduction to custom tests,** refer to our [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb) notebook.\n",
     "\n",
@@ -69,7 +69,7 @@
     "\n",
     "## Prerequisites\n",
     "\n",
-    "In order to integrate custom tests with your model documentation with this notebook, you'll need to first have:\n",
+    "In order to integrate custom tests into your documentation using this notebook, you'll need to first have:\n",
     "\n",
     "- [x] Registered a model within the ValidMind Platform with a predefined documentation template\n",
     "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
@@ -82,7 +82,7 @@
     "Refer to the first two notebooks in this series:\n",
     "\n",
     "- <a href=\"1-set_up_validmind.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library</b></a>\n",
-    "- <a href=\"2-start_development_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the model development process</b></a>\n",
+    "- <a href=\"2-start_development_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the development process</b></a>\n",
     "\n",
     "</div>\n"
    ]
@@ -95,7 +95,7 @@
     "\n",
     "## Setting up\n",
     "\n",
-    "This section should be quite familiar to you — as we performed the same actions in the previous notebook, **[2 — Start the model development process](2-start_development_process.ipynb)**."
+    "This section should be quite familiar to you — as we performed the same actions in the previous notebook, **[2 — Start the development process](2-start_development_process.ipynb)**."
    ]
   },
   {
@@ -109,8 +109,10 @@
     "As usual, let's first connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -385,7 +387,7 @@
     "\n",
     "#### Initialize the ValidMind objects\n",
     "\n",
-    "Let's initialize the ValidMind `Dataset` and `Model` objects in preparation for assigning model predictions to each dataset:"
+    "Let's initialize the ValidMind `Dataset` and `Model` objects in preparation for assigning predictions to each dataset:"
    ]
   },
   {
@@ -394,7 +396,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "# Initialize the datasets into their own dataset objects\n",
+    "# Initialize the datasets into their own ValidMind dataset objects\n",
     "vm_train_ds = vm.init_dataset(\n",
     "    input_id=\"train_dataset_final\",\n",
     "    dataset=train_df,\n",
@@ -407,7 +409,7 @@
     "    target_column=\"Exited\",\n",
     ")\n",
     "\n",
-    "# Initialize a model object\n",
+    "# Initialize the ValidMind model object\n",
     "vm_model = vm.init_model(log_reg, input_id=\"log_reg_model_v1\")"
    ]
   },
@@ -487,7 +489,7 @@
     "\n",
     "- The function `confusion_matrix` takes two arguments `dataset` and `model`. This is a `VMDataset` and `VMModel` object respectively.\n",
     "  - `VMDataset` objects allow you to access the dataset's true (target) values by accessing the `.y` attribute.\n",
-    "  - `VMDataset` objects allow you to access the predictions for a given model by accessing the `.y_pred()` method.\n",
+    "  - `VMDataset` objects allow you to access the predictions for a given record (model) by accessing the `.y_pred()` method.\n",
     "- The function docstring provides a description of what the test does. This will be displayed along with the result in this notebook as well as in the ValidMind Platform.\n",
     "- The function body calculates the confusion matrix using the `sklearn.metrics.confusion_matrix` function as we just did above.\n",
     "- The function then returns the `ConfusionMatrixDisplay.figure_` object — this is important as the ValidMind Library expects the output of the custom test to be a plot or a table.\n",
@@ -672,7 +674,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for this particular test ID. </b></span>\n",
+    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for this particular test ID. </b></span>\n",
     "<br></br>\n",
     "That's expected, as when we run individual tests the results logged need to be manually added to your documentation within the ValidMind Platform.</div>"
    ]
@@ -685,7 +687,7 @@
     "\n",
     "## Using external test providers\n",
     "\n",
-    "Creating inline custom tests with a function is a great way to customize your model documentation. However, sometimes you may want to reuse the same set of tests across multiple models and share them with others in your organization. In this case, you can create an external custom *test provider* that will allow you to load custom tests from a local folder or a Git repository.\n",
+    "Creating inline custom tests with a function is a great way to customize your documentation. However, sometimes you may want to reuse the same set of tests across multiple records (models) and share them with others in your organization. In this case, you can create an external custom *test provider* that will allow you to load custom tests from a local folder or a Git repository.\n",
     "\n",
     "In this section you will learn how to declare a local filesystem test provider that allows loading tests from a local folder following these high level steps:\n",
     "\n",
@@ -738,7 +740,7 @@
     "After running the command above, confirm that a new `my_tests` directory was created successfully. For example:\n",
     "\n",
     "```\n",
-    "~/notebooks/tutorials/model_development/my_tests/\n",
+    "~/notebooks/tutorials/development/my_tests/\n",
     "```"
    ]
   },
@@ -901,7 +903,7 @@
     "\n",
     "## Add test results to documentation\n",
     "\n",
-    "With our custom tests run and results logged to the ValidMind Platform, let's head to the model we connected to at the beginning of this notebook and insert our test results into the documentation ([Need more help?](https://docs.validmind.ai/developer/model-documentation/work-with-test-results.html)):\n",
+    "With our custom tests run and results logged to the ValidMind Platform, let's head to the model we connected to at the beginning of this notebook and insert our test results into the documentation (**Learn more:** [Work with test results](https://docs.validmind.ai/guide/documentation/work-with-test-results.html)):\n",
     "\n",
     "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
     "\n",
diff --git a/site/notebooks/tutorials/model_development/4-finalize_testing_documentation.ipynb b/site/notebooks/EXECUTED/development/4-finalize_testing_documentation.ipynb
similarity index 88%
rename from site/notebooks/tutorials/model_development/4-finalize_testing_documentation.ipynb
rename to site/notebooks/EXECUTED/development/4-finalize_testing_documentation.ipynb
index 086ccc2029..0dbc8d3be1 100644
--- a/site/notebooks/tutorials/model_development/4-finalize_testing_documentation.ipynb
+++ b/site/notebooks/EXECUTED/development/4-finalize_testing_documentation.ipynb
@@ -4,11 +4,11 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "# ValidMind for model development 4 — Finalize testing and documentation\n",
+    "# ValidMind for development 4 — Finalize testing and documentation\n",
     "\n",
-    "Learn how to use ValidMind for your end-to-end model documentation process with our introductory notebook series. In this last notebook, finalize the testing and documentation of your model and have a fully documented sample model ready for review.\n",
+    "Learn how to use ValidMind for your end-to-end documentation process with our introductory notebook series. In this last notebook, finalize the testing and documentation of your model and have a fully documented sample model ready for review.\n",
     "\n",
-    "We'll first use [`run_documentation_tests()`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests) previously covered in **[2 — Start the model development process](2-start_development_process.ipynb)** to ensure that your custom test results generated in **[3 — Integrate custom tests](3-integrate_custom_tests.ipynb)** are included in your documentation. Then, we'll view and update the configuration for the entire model documentation template to suit your needs.\n",
+    "We'll first use [`run_documentation_tests()`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests) previously covered in **[2 — Start the development process](2-start_development_process.ipynb)** to ensure that your custom test results generated in **[3 — Integrate custom tests](3-integrate_custom_tests.ipynb)** are included in your documentation. Then, we'll view and update the configuration for the entire documentation template to suit your needs.\n",
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
     "<br></br>\n",
@@ -34,11 +34,12 @@
     "    - [Add a local test provider](#toc2_4_2__)    \n",
     "- [Reconnect to ValidMind](#toc3__)    \n",
     "- [Include custom test results](#toc4__)    \n",
-    "- [Documentation template configuration](#toc5__)    \n",
-    "  - [Update the config](#toc5_1__)    \n",
+    "- [Configuring documentation template tests](#toc5__)    \n",
+    "  - [Preview test configuration](#toc5_1__)    \n",
+    "  - [Run updated documentation section tests](#toc5_2__)    \n",
     "- [In summary](#toc6__)    \n",
     "- [Next steps](#toc7__)    \n",
-    "  - [Work with your model documentation](#toc7_1__)    \n",
+    "  - [Work with your documentation](#toc7_1__)    \n",
     "  - [Learn more](#toc7_2__)    \n",
     "    - [Use cases](#toc7_2_1__)    \n",
     "    - [Discover more learning resources](#toc7_2_2__)    \n",
@@ -78,7 +79,7 @@
     "Refer to the first three notebooks in this series:\n",
     "\n",
     "- <a href=\"1-set_up_validmind.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library</b></a>\n",
-    "- <a href=\"2-start_development_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the model development process</b></a>\n",
+    "- <a href=\"2-start_development_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the development process</b></a>\n",
     "- <a href=\"3-integrate_custom_tests.ipynb\" style=\"color: #DE257E;\"><b>3 — Integrate custom tests</b></a>\n",
     "\n",
     "</div>"
@@ -106,8 +107,10 @@
     "As usual, let's first connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -391,7 +394,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "# Initialize the datasets into their own dataset objects\n",
+    "# Initialize the datasets into their own ValidMind dataset objects\n",
     "vm_train_ds = vm.init_dataset(\n",
     "    input_id=\"train_dataset_final\",\n",
     "    dataset=train_df,\n",
@@ -404,7 +407,7 @@
     "    target_column=\"Exited\",\n",
     ")\n",
     "\n",
-    "# Initialize a model object\n",
+    "# Initialize the ValidMind model object\n",
     "vm_model = vm.init_model(log_reg, input_id=\"log_reg_model_v1\")"
    ]
   },
@@ -637,7 +640,7 @@
     "\n",
     "Let's run all tests in the Model Evaluation section of the documentation. Note that we have been running the sample custom confusion matrix with `normalize=True` to demonstrate the ability to provide custom parameters.\n",
     "\n",
-    "In the **Run the model evaluation tests** section of **[2 — Start the model development process](2-start_development_process.ipynb)**, you learned how to assign inputs to individual tests with [`run_documentation_tests()`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests). Assigning parameters is similar, you only need to provide assign a `params` dictionary to a given test ID, `my_test_provider.ConfusionMatrix` in this case."
+    "In the **Run the model evaluation tests** section of **[2 — Start the development process](2-start_development_process.ipynb)**, you learned how to assign inputs to individual tests with [`run_documentation_tests()`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests). Assigning parameters is similar: you only need to assign a `params` dictionary to a given test ID, `my_test_provider.ConfusionMatrix` in this case."
    ]
   },
   {
@@ -678,7 +681,7 @@
    "source": [
     "<a id='toc5__'></a>\n",
     "\n",
-    "## Documentation template configuration\n",
+    "## Configuring documentation template tests\n",
     "\n",
     "Let's call the utility function [`vm.get_test_suite().get_default_config()`](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestSuite.get_default_config) which will return the **default configuration for the entire documentation template as a dictionary:**\n",
     "\n",
@@ -706,11 +709,11 @@
    "source": [
     "<a id='toc5_1__'></a>\n",
     "\n",
-    "### Update the config\n",
+    "### Preview test configuration\n",
     "\n",
-    "The default config does not assign any inputs to a test, but you can assign inputs to individual tests as needed depending on the datasets and models you want to pass to individual tests.\n",
+    "The default config does not assign any inputs to a test, but you can assign inputs to individual tests as needed depending on the datasets and records (models) you want to pass to individual tests.\n",
     "\n",
-    "For this particular documentation template (binary classification), the ValidMind Library provides a sample configuration that can be used to populate the entire model documentation using the following inputs as placeholders:\n",
+    "For this particular documentation template (binary classification), the ValidMind Library provides a sample configuration that can be used to populate the entire documentation using the following inputs as placeholders:\n",
     "\n",
     "- A **`raw_dataset`** raw dataset\n",
     "- A **`train_dataset`** training dataset\n",
@@ -739,7 +742,11 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Using this sample configuration, let's finish populating model documentation by running all tests for the Model Development section of the documentation.\n",
+    "<a id='toc5_2__'></a>\n",
+    "\n",
+    "### Run updated documentation section tests\n",
+    "\n",
+    "Using this sample configuration, let's finish populating your documentation by running all tests for the Model Development section of the documentation.\n",
     "\n",
     "Recall that the training and test datasets in our exercise have the following `input_id` values:\n",
     "\n",
@@ -863,13 +870,13 @@
     "In this final notebook, you learned how to:\n",
     "\n",
     "- [x] Refresh the connection from the ValidMind Library to the ValidMind Platform after you've inserted test-driven blocks to your documentation\n",
-    "- [x] Include custom test results in your model documentation\n",
-    "- [x] View and configure the configuration for your model documentation template\n",
+    "- [x] Include custom test results in your documentation\n",
+    "- [x] View and update the configuration for your documentation template\n",
     "\n",
-    "With our ValidMind for model development series of notebooks, you learned how to document a model end-to-end with the ValidMind Library by running through some common scenarios in a typical model development setting:\n",
+    "With our ValidMind for development series of notebooks, you learned how to document a record (model) end-to-end with the ValidMind Library by running through some common scenarios in a typical development setting:\n",
     "\n",
     "- Running out-of-the-box tests\n",
-    "- Documenting your model by adding evidence to model documentation\n",
+    "- Documenting your record (model) by adding evidence to documentation\n",
     "- Extending the capabilities of the ValidMind Library by implementing custom tests\n",
     "- Ensuring that the documentation is complete by running all tests in the documentation template"
    ]
@@ -889,21 +896,21 @@
    "source": [
     "<a id='toc7_1__'></a>\n",
     "\n",
-    "### Work with your model documentation\n",
+    "### Work with your documentation\n",
     "\n",
-    "Now that you've logged all your test results and generated a draft for your model documentation, head to the ValidMind Platform to wrap up your model documentation. Continue to work on your model documentation by:\n",
+    "Now that you've logged all your test results and generated a draft for your documentation, head to the ValidMind Platform to wrap up your documentation. Continue to work on your documentation by:\n",
     "\n",
     "- **Run and log more tests:** Use the skills you learned in this series of notebooks to run and log more individual tests, including custom tests, then insert them into your documentation as supplementary evidence. (Learn more: [`validmind.tests`](https://docs.validmind.ai/validmind/validmind/tests.html))\n",
     "\n",
-    "- **Inserting additional test results:** Add **Test-Driven Blocks** under any relevant section of your model documentation. (Learn more: [Work with test results](https://docs.validmind.ai/guide/model-documentation/work-with-test-results.html))\n",
+    "- **Inserting additional test results:** Add **Test-Driven Blocks** under any relevant section of your documentation. (Learn more: [Work with test results](https://docs.validmind.ai/guide/documentation/work-with-test-results.html))\n",
     "\n",
-    "- **Making qualitative edits to your test descriptions:** Click on the description of any inserted test results to review and edit the ValidMind-generated test descriptions for quality and accuracy. (Learn more: [Working with model documentation](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html#add-or-edit-documentation))\n",
+    "- **Making qualitative edits to your test descriptions:** Click on the description of any inserted test results to review and edit the ValidMind-generated test descriptions for quality and accuracy. (Learn more: [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html#add-or-edit-documentation))\n",
     "\n",
-    "- **View guidelines:** In any section of your model documentation, click **​ValidMind Insights** in the top right corner to reveal the Documentation Guidelines for each section to help guide the contents of your model documentation. (Learn more: [View documentation guidelines](https://docs.validmind.ai/guide/model-documentation/view-documentation-guidelines.html))\n",
+    "- **View guidelines:** In any section of your documentation, click **ValidMind Insights** in the top right corner to reveal the Documentation Guidelines for each section to help guide the contents of your documentation. (Learn more: [View development guidelines](https://docs.validmind.ai/guide/documentation/view-development-guidelines.html))\n",
     "\n",
-    "- **Collaborate with other stakeholders:** Use the ValidMind Platform's real-time collaborative features to work seamlessly together with the rest of your organization, including model validators. Review suggested changes in your content blocks, work with versioned history, and use comments to discuss specific portions of your model documentation. (Learn more: [Collaborate with others](https://docs.validmind.ai/guide/model-documentation/collaborate-with-others.html))\n",
+    "- **Collaborate with other stakeholders:** Use the ValidMind Platform's real-time collaborative features to work seamlessly together with the rest of your organization, including validators. Review suggested changes in your content blocks, work with versioned history, and use comments to discuss specific portions of your documentation. (Learn more: [Collaborate with others](https://docs.validmind.ai/guide/documentation/collaborate-with-others.html))\n",
     "\n",
-    "When your model documentation is complete and ready for review, submit it for approval from the same ValidMind Platform where you made your edits and collaborated with the rest of your organization, ensuring transparency and a thorough model development history. (Learn more: [Submit for approval](https://docs.validmind.ai/guide/model-documentation/submit-for-approval.html))"
+    "When your documentation is complete and ready for review, submit it for approval from the same ValidMind Platform where you made your edits and collaborated with the rest of your organization, ensuring transparency and a thorough development history. (Learn more: [Submit documents](https://docs.validmind.ai/guide/documentation/submit-documents.html))"
    ]
   },
   {
@@ -914,7 +921,7 @@
     "\n",
     "### Learn more\n",
     "\n",
-    "Now that you're familiar with the basics, you can explore the following notebooks to get a deeper understanding on how the ValidMind Library allows you generate model documentation for any use case:"
+    "Now that you're familiar with the basics, you can explore the following notebooks to get a deeper understanding of how the ValidMind Library allows you to generate documentation for any use case:"
    ]
   },
   {
@@ -941,7 +948,7 @@
     "Learn more about the ValidMind Library tools we used in this notebook:\n",
     "\n",
     "- [Explore tests](../../how_to/tests/explore_tests/explore_tests.ipynb)\n",
-    "- [Run dataset-based tests](../../how_to/tests/run_tests/1_run_dataset_based_tests.ipynb)\n",
+    "- [Run dataset-based tests](../../how_to/tests/run_tests/1-run_dataset-based_tests.ipynb)\n",
     "- [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb)\n",
     "- [Integrate external test providers](../../how_to/tests/custom_tests/integrate_external_test_providers.ipynb)\n",
     "- [Configure dataset features](../../how_to/data_and_datasets/dataset_inputs/configure_dataset_features.ipynb)\n",
@@ -950,14 +957,14 @@
     "\n",
     "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
     "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
+    "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
     "\n",
     "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
    ]
   },
   {
    "cell_type": "markdown",
-   "id": "copyright-2efae7bbb0f74bd5abe37252cd48b951",
+   "id": "copyright-9be88159d1f24db999931c13536a491c",
    "metadata": {},
    "source": [
     "<!-- VALIDMIND COPYRIGHT -->\n",
diff --git a/site/notebooks/EXECUTED/model_development/add-content-block.gif b/site/notebooks/EXECUTED/development/add-content-block.gif
similarity index 100%
rename from site/notebooks/EXECUTED/model_development/add-content-block.gif
rename to site/notebooks/EXECUTED/development/add-content-block.gif
diff --git a/site/notebooks/EXECUTED/model_development/high-pearson-correlation-block.png b/site/notebooks/EXECUTED/development/high-pearson-correlation-block.png
similarity index 100%
rename from site/notebooks/EXECUTED/model_development/high-pearson-correlation-block.png
rename to site/notebooks/EXECUTED/development/high-pearson-correlation-block.png
diff --git a/site/notebooks/EXECUTED/model_development/selecting-confusion-matrix-test.png b/site/notebooks/EXECUTED/development/selecting-confusion-matrix-test.png
similarity index 100%
rename from site/notebooks/EXECUTED/model_development/selecting-confusion-matrix-test.png
rename to site/notebooks/EXECUTED/development/selecting-confusion-matrix-test.png
diff --git a/site/notebooks/EXECUTED/model_development/selecting-high-pearson-correlation-test.png b/site/notebooks/EXECUTED/development/selecting-high-pearson-correlation-test.png
similarity index 100%
rename from site/notebooks/EXECUTED/model_development/selecting-high-pearson-correlation-test.png
rename to site/notebooks/EXECUTED/development/selecting-high-pearson-correlation-test.png
diff --git a/site/notebooks/EXECUTED/model_development/1-set_up_validmind.ipynb b/site/notebooks/EXECUTED/model_development/1-set_up_validmind.ipynb
deleted file mode 100644
index 4244924b9a..0000000000
--- a/site/notebooks/EXECUTED/model_development/1-set_up_validmind.ipynb
+++ /dev/null
@@ -1,471 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "06993494",
-   "metadata": {},
-   "source": [
-    "# ValidMind for model development 1 — Set up the ValidMind Library\n",
-    "\n",
-    "Learn how to use ValidMind for your end-to-end model documentation process based on common model development scenarios with our series of four introductory notebooks. This first notebook walks you through the initial setup of the ValidMind Library.\n",
-    "\n",
-    "These notebooks use a binary classification model as an example, but the same principles shown here apply to other model types.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
-    "<br></br>\n",
-    "Our course tailor-made for developers new to ValidMind combines this series of notebooks with more a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Developer Fundamentals</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5269a388",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Introduction](#toc1__)    \n",
-    "- [About ValidMind](#toc2__)    \n",
-    "  - [Before you begin](#toc2_1__)    \n",
-    "  - [New to ValidMind?](#toc2_2__)    \n",
-    "  - [Key concepts](#toc2_3__)    \n",
-    "- [Setting up](#toc3__)    \n",
-    "  - [Install the ValidMind Library](#toc3_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc3_2__)    \n",
-    "    - [Register sample model](#toc3_2_1__)    \n",
-    "    - [Apply documentation template](#toc3_2_2__)    \n",
-    "    - [Get your code snippet](#toc3_2_3__)    \n",
-    "- [Getting to know ValidMind](#toc4__)    \n",
-    "  - [Preview the documentation template](#toc4_1__)    \n",
-    "    - [View model documentation in the ValidMind Platform](#toc4_1_1__)    \n",
-    "  - [Explore available tests](#toc4_2__)    \n",
-    "- [Upgrade ValidMind](#toc5__)    \n",
-    "- [In summary](#toc6__)    \n",
-    "- [Next steps](#toc7__)    \n",
-    "  - [Start the model development process](#toc7_1__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1020f3fa",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Introduction\n",
-    "\n",
-    "Model development aims to produce a fit-for-purpose *champion model* by conducting thorough testing and analysis, supporting the capabilities of the model with evidence in the form of documentation and test results. Model documentation should be clear and comprehensive, ideally following a structure or template covering all aspects of compliance with model risk regulation.\n",
-    "\n",
-    "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
-    "\n",
-    "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
-    "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4424a3e8",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models. \n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ed8cfd11",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "353613e5",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "63912e66",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7d039206",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d6758437",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "827eb6bd",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "02f8b26f",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library\n",
-    "\n",
-    "The ValidMind Library provides a rich collection of documentation tools and test suites, from documenting descriptions of datasets to validation and testing of models using a variety of open-source testing frameworks."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "706a1004",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8ceb6261",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "acf3e1db",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "a58d951f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3e0596f8",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Getting to know ValidMind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "bcd77028",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "819a40bc",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "025a518c",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1_1__'></a>\n",
-    "\n",
-    "#### View model documentation in the ValidMind Platform\n",
-    "\n",
-    "Next, let's head to the ValidMind Platform to see the template in action:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this \"ValidMind for model development\" series of notebooks.\n",
-    "\n",
-    "3. Click **Development** under Documents for your model and note how the structure of the documentation matches our preview above."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "596d6d16",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Explore available tests\n",
-    "\n",
-    "Next, let's explore the list of all available tests in the ValidMind Library with [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) — we'll learn how to run tests shortly. \n",
-    "\n",
-    "You can see that the documentation template for this model has references to some of the **test `ID`s used to run tests listed below:**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "7ccc7776",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "30c4a1bc",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "f5d3216d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e27b286f",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "75bf527b",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b919c3a0",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this first notebook, you learned how to:\n",
-    "\n",
-    "- [x] Register a model within the ValidMind Platform\n",
-    "- [x] Install and initialize the ValidMind Library\n",
-    "- [x] Preview the documentation template for your model\n",
-    "- [x] Explore the available tests offered by the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e9c62e9d",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Next steps"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8f1a7063",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Start the model development process\n",
-    "\n",
-    "Now that the ValidMind Library is connected to your model in the ValidMind Library with the correct template applied, we can go ahead and start the model development process: **[2 — Start the model development process](2-start_development_process.ipynb)**"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-3e02e70c1d4d4840bf8d9ef44e2cf20c",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/site/notebooks/EXECUTED/model_validation/1-set_up_validmind_for_validation.ipynb b/site/notebooks/EXECUTED/model_validation/1-set_up_validmind_for_validation.ipynb
deleted file mode 100644
index 05ad11c2c3..0000000000
--- a/site/notebooks/EXECUTED/model_validation/1-set_up_validmind_for_validation.ipynb
+++ /dev/null
@@ -1,517 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "821a881e",
-   "metadata": {},
-   "source": [
-    "# ValidMind for model validation 1 — Set up the ValidMind Library for validation\n",
-    "\n",
-    "Learn how to use ValidMind for your end-to-end model validation process based on common scenarios with our series of four introductory notebooks. In this first notebook, set up the ValidMind Library in preparation for validating a champion model.\n",
-    "\n",
-    "These notebooks use a binary classification model as an example, but the same principles shown here apply to other model types.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
-    "<br></br>\n",
-    "Our course tailor-made for validators new to ValidMind combines this series of notebooks with more a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "19ea797c",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Introduction](#toc1__)    \n",
-    "- [About ValidMind](#toc2__)    \n",
-    "  - [Before you begin](#toc2_1__)    \n",
-    "  - [New to ValidMind?](#toc2_2__)    \n",
-    "  - [Key concepts](#toc2_3__)    \n",
-    "- [Setting up](#toc3__)    \n",
-    "  - [Register a sample model](#toc3_1__)    \n",
-    "    - [Assign validator credentials](#toc3_1_1__)    \n",
-    "    - [Apply documentation template](#toc3_1_2__)    \n",
-    "    - [Apply validation report template](#toc3_1_3__)    \n",
-    "  - [Install the ValidMind Library](#toc3_2__)    \n",
-    "  - [Initialize the ValidMind Library](#toc3_3__)    \n",
-    "    - [Get your code snippet](#toc3_3_1__)    \n",
-    "- [Getting to know ValidMind](#toc4__)    \n",
-    "  - [Preview the validation report template](#toc4_1__)    \n",
-    "    - [View validation report in the ValidMind Platform](#toc4_1_1__)    \n",
-    "  - [Explore available tests](#toc4_2__)    \n",
-    "- [Upgrade ValidMind](#toc5__)    \n",
-    "- [In summary](#toc6__)    \n",
-    "- [Next steps](#toc7__)    \n",
-    "  - [Start the model validation process](#toc7_1__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d624f88d",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Introduction\n",
-    "\n",
-    "Model validation aims to independently assess the compliance of *champion models* created by model developers with regulatory guidance by conducting thorough testing and analysis, potentially including the use of challenger models to benchmark performance. Assessments, presented in the form of a validation report, typically include *artifacts (findings)* and recommendations to address those issues.\n",
-    "\n",
-    "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
-    "\n",
-    "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
-    "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4fb1ef5a",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate comparison and other validation tests, and then use the ValidMind Platform to submit compliance assessments of champion models via comprehensive validation reports. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model developers."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "594f9fd4",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "262ed111",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0eb67fe9",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Validation report**: A comprehensive and structured assessment of a model’s development and performance, focusing on verifying its integrity, appropriateness, and alignment with its intended use. It includes analyses of model assumptions, data quality, performance metrics, outcomes of testing procedures, and risk considerations. The validation report supports transparency, regulatory compliance, and informed decision-making by documenting the validator’s independent review and conclusions.\n",
-    "\n",
-    "**Validation report template**: Serves as a standardized framework for conducting and documenting model validation activities. It outlines the required sections, recommended analyses, and expected validation tests, ensuring consistency and completeness across validation reports. The template helps guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e0e1cf3d",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "609fe59b",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Register a sample model\n",
-    "\n",
-    "In a usual model lifecycle, a champion model will have been independently registered in your model inventory and submitted to you for validation by your model development team as part of the effective challenge process. (**Learn more:** [Submit for approval](https://docs.validmind.ai/guide/model-documentation/submit-for-approval.html))\n",
-    "\n",
-    "For this notebook, we'll have you register a dummy model in the ValidMind Platform inventory and assign yourself as the validator to familiarize you with the ValidMind interface and circumvent the need for an existing model:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down — don’t worry, we’ll adjust these permissions next for validation.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "58e552bb",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_1__'></a>\n",
-    "\n",
-    "#### Assign validator credentials\n",
-    "\n",
-    "In order to log tests as a validator instead of as a developer, on the model details page that appears after you've successfully registered your sample model:\n",
-    "\n",
-    "1. Remove yourself as a model owner: \n",
-    "\n",
-    "    - Click on the **OWNERS** tile.\n",
-    "    - Click the **x** next to your name to remove yourself from that model's role.\n",
-    "    - Click **Save** to apply your changes to that role.\n",
-    "\n",
-    "2. Remove yourself as a developer: \n",
-    "\n",
-    "    - Click on the **DEVELOPERS** tile.\n",
-    "    - Click the **x** next to your name to remove yourself from that model's role.\n",
-    "    - Click **Save** to apply your changes to that role.\n",
-    "\n",
-    "3. Add yourself as a validator: \n",
-    "\n",
-    "    - Click on the **VALIDATORS** tile.\n",
-    "    - Select your name from the drop-down menu.\n",
-    "    - Click **Save** to apply your changes to that role."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "84251589",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier for developers.\n",
-    "\n",
-    "We'll need this documentation template later for reference as we draft our validation report:\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Documentation**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "fdfb5dc5",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_3__'></a>\n",
-    "\n",
-    "#### Apply validation report template\n",
-    "\n",
-    "Next, let's select a validation report template. A template predefines sections for your report and provides a general outline to follow, making the validation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Validation**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Generic Validation Report`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f656d0d6",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "931d8f7f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1435fd5b",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b375b341",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3_1__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d5d87e2d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"validation-report\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "331e1c07",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Getting to know ValidMind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f6331a98",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Preview the validation report template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will attach evidence to this template in the form of risk assessment notes, artifacts, and test results later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "13d34bbb",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "20717133",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1_1__'></a>\n",
-    "\n",
-    "#### View validation report in the ValidMind Platform\n",
-    "\n",
-    "Next, let's head to the ValidMind Platform to see the template in action:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this \"ValidMind for model validation\" series of notebooks.\n",
-    "\n",
-    "3. Click **Validation** under Documents for your model and note:\n",
-    "\n",
-    "    - [x] The risk assessment compliance summary at the top of the report (screenshot below)\n",
-    "    - [x] How the structure of the validation report reflects the previewed template\n",
-    "\n",
-    "    <img src= \"compliance-summary.png\" alt=\"Screenshot showing the risk assessment compliance summary\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f5d0aaab",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Explore available tests\n",
-    "\n",
-    "Next, let's explore the list of all available tests in the ValidMind Library with [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) — we'll later narrow down the tests we want to run from this list when we learn to run tests."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "de6abc2a",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "dce47e40",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "10272aa9",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7a0c3cc2",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2dac11d5",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "174d2c8d",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this first notebook, you learned how to:\n",
-    "\n",
-    "- [x] Register a model within the ValidMind Platform and assign yourself as the validator\n",
-    "- [x] Install and initialize the ValidMind Library\n",
-    "- [x] Preview the validation report template for your model\n",
-    "- [x] Explore the available tests offered by the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d8ffdcf7",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Start the model validation process\n",
-    "\n",
-    "Now that the ValidMind Library is connected to your model in the ValidMind Library with the correct template applied, we can go ahead and start the model validation process: **[2 — Start the model validation process](2-start_validation_process.ipynb)**"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-5d7a1c159e4840fca79011d1c0380725",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/site/notebooks/EXECUTED/model_validation/2-start_validation_process.ipynb b/site/notebooks/EXECUTED/model_validation/2-start_validation_process.ipynb
deleted file mode 100644
index 7fafa5ab50..0000000000
--- a/site/notebooks/EXECUTED/model_validation/2-start_validation_process.ipynb
+++ /dev/null
@@ -1,889 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# ValidMind for model validation 2 — Start the model validation process\n",
-    "\n",
-    "Learn how to use ValidMind for your end-to-end model validation process with our series of four introductory notebooks. In this second notebook, independently verify the data quality tests performed on the dataset used to train the champion model.\n",
-    "\n",
-    "You'll learn how to run relevant validation tests with ValidMind, log the results of those tests to the ValidMind Platform, and insert your logged test results as evidence into your validation report. You'll become familiar with the tests available in ValidMind, as well as how to run them. Running tests during model validation is crucial to the effective challenge process, as we want to independently evaluate the evidence and assessments provided by the model development team.\n",
-    "\n",
-    "While running our tests in this notebook, we'll focus on:\n",
-    "\n",
-    "- Ensuring that data used for training and testing the model is of appropriate data quality\n",
-    "- Ensuring that the raw data has been preprocessed appropriately and that the resulting final datasets reflects this\n",
-    "\n",
-    "**For a full list of out-of-the-box tests,** refer to our [Test descriptions](https://docs.validmind.ai/developer/model-testing/test-descriptions.html) or try the interactive [Test sandbox](https://docs.validmind.ai/developer/model-testing/test-sandbox.html).\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
-    "<br></br>\n",
-    "Our course tailor-made for validators new to ValidMind combines this series of notebooks with more a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Prerequisites](#toc1__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_1__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "- [Verifying data quality adjustments](#toc4__)    \n",
-    "  - [Identify qualitative tests](#toc4_1__)    \n",
-    "  - [Initialize the ValidMind dataset](#toc4_2__)    \n",
-    "  - [Run data quality tests](#toc4_3__)    \n",
-    "    - [Run tabular data tests](#toc4_3_1__)    \n",
-    "  - [Remove highly correlated features](#toc4_4__)    \n",
-    "- [Documenting test results](#toc5__)    \n",
-    "  - [Configure and run comparison tests](#toc5_1__)    \n",
-    "  - [Log tests with unique identifiers](#toc5_2__)    \n",
-    "  - [Add test results to reporting](#toc5_3__)    \n",
-    "- [Split the preprocessed dataset](#toc6__)    \n",
-    "  - [Initialize the split datasets](#toc6_1__)    \n",
-    "- [In summary](#toc7__)    \n",
-    "- [Next steps](#toc8__)    \n",
-    "  - [Develop potential challenger models](#toc8_1__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Prerequisites\n",
-    "\n",
-    "In order to independently assess the quality of your datasets with notebook, you'll need to first have:\n",
-    "\n",
-    "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
-    "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
-    "<br></br>\n",
-    "Refer to the first notebook in this series: <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library\n",
-    "\n",
-    "First, let's connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Make sure the ValidMind Library is installed\n",
-    "\n",
-    "%pip install -q validmind\n",
-    "\n",
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"validation-report\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "Let's first import the public [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset from Kaggle, which was used to develop the dummy champion model.\n",
-    "\n",
-    "We'll use this dataset to review steps that should have been conducted during the initial development and documentation of the model to ensure that the model was built correctly. By independently performing steps taken by the model development team, we can confirm whether the model was built using appropriate and properly processed data.\n",
-    "\n",
-    "In our below example, note that:\n",
-    "\n",
-    "- The target column, `Exited` has a value of `1` when a customer has churned and `0` otherwise.\n",
-    "- The ValidMind Library provides a wrapper to automatically load the dataset as a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) object. A Pandas Dataframe is a two-dimensional tabular data structure that makes use of rows and columns."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = demo_dataset.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Verifying data quality adjustments\n",
-    "\n",
-    "Let's say that thanks to the documentation submitted by the model development team ([Learn more ...](https://docs.validmind.ai/developer/validmind-library.html#for-model-development)), we know that the sample dataset was first modified before being used to train the champion model. After performing some data quality assessments on the raw dataset, it was determined that the dataset required rebalancing, and highly correlated features were also removed."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Identify qualitative tests\n",
-    "\n",
-    "During model validation, we use the same data processing logic and training procedure to confirm that the model's results can be reproduced independently, so let's start by doing some data quality assessments by running a few individual tests just like the development team did.\n",
-    "\n",
-    "Use the [`vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) introduced by the first notebook in this series in combination with [`vm.tests.list_tags()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tags) and [`vm.tests.list_tasks()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks) to find which prebuilt tests are relevant for data quality assessment:\n",
-    "\n",
-    "- **`tasks`** represent the kind of modeling task associated with a test. Here we'll focus on `classification` tasks.\n",
-    "- **`tags`** are free-form descriptions providing more details about the test, for example, what category the test falls into. Here we'll focus on the `data_quality` tag."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Get the list of available task types\n",
-    "sorted(vm.tests.list_tasks())"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Get the list of available tags\n",
-    "sorted(vm.tests.list_tags())"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You can pass `tags` and `tasks` as parameters to the `vm.tests.list_tests()` function to filter the tests based on the tags and task types.\n",
-    "\n",
-    "For example, to find tests related to tabular data quality for classification models, you can call `list_tests()` like this:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(task=\"classification\", tags=[\"tabular_data\", \"data_quality\"])"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about navigating ValidMind tests?</b></span>\n",
-    "<br></br>\n",
-    "Refer to our notebook outlining the utilities available for viewing and understanding available ValidMind tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind dataset\n",
-    "\n",
-    "With the individual tests we want to run identified, the next step is to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
-    "\n",
-    "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
-    "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# vm_raw_dataset is now a VMDataset object that you can pass to any ValidMind test\n",
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=raw_df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3__'></a>\n",
-    "\n",
-    "### Run data quality tests\n",
-    "\n",
-    "Now that we know how to initialize a ValidMind `dataset` object, we're ready to run some tests!\n",
-    "\n",
-    "You run individual tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module. For the examples below, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`test_id`** — The ID of the test to run, as seen in the `ID` column when you run `list_tests`. \n",
-    "- **`params`** — A dictionary of parameters for the test. These will override any `default_params` set in the test definition. "
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3_1__'></a>\n",
-    "\n",
-    "#### Run tabular data tests\n",
-    "\n",
-    "The inputs expected by a test can also be found in the test definition — let's take [`validmind.data_validation.DescriptiveStatistics`](https://docs.validmind.ai/tests/data_validation/DescriptiveStatistics.html) as an example.\n",
-    "\n",
-    "Note that the output of the [`describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) below shows that this test expects a `dataset` as input:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.describe_test(\"validmind.data_validation.DescriptiveStatistics\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now, let's run a few tests to assess the quality of the dataset:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result2 = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.ClassImbalance\",\n",
-    "    inputs={\"dataset\": vm_raw_dataset},\n",
-    "    params={\"min_percent_threshold\": 30},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "The output above shows that [the class imbalance test](https://docs.validmind.ai/tests/data_validation/ClassImbalance.html) did not pass according to the value we set for `min_percent_threshold` — great, this matches what was reported by the model development team.\n",
-    "\n",
-    "To address this issue, we'll re-run the test on some processed data. In this case let's apply a very simple rebalancing technique to the dataset:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
-    "\n",
-    "# Create a balanced dataset with the same number of exited and not exited customers\n",
-    "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
-    "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
-    "\n",
-    "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
-    "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "With this new balanced dataset, you can re-run the individual test to see if it now passes the class imbalance test requirement.\n",
-    "\n",
-    "As this is technically a different dataset, **remember to first initialize a new ValidMind `Dataset` object** to pass in as input as required by `run_test()`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
-    "vm_balanced_raw_dataset = vm.init_dataset(\n",
-    "    dataset=balanced_raw_df,\n",
-    "    input_id=\"balanced_raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Pass the initialized `balanced_raw_dataset` as input into the test run\n",
-    "result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.ClassImbalance\",\n",
-    "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
-    "    params={\"min_percent_threshold\": 30},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4__'></a>\n",
-    "\n",
-    "### Remove highly correlated features\n",
-    "\n",
-    "Next, let's also remove highly correlated features from our dataset as outlined by the development team. Removing highly correlated features helps make the model simpler, more stable, and easier to understand.\n",
-    "\n",
-    "You can utilize the output from a ValidMind test for further use — in this below example, to retrieve the list of features with the highest correlation coefficients and use them to reduce the final list of features for modeling.\n",
-    "\n",
-    "First, we'll run [`validmind.data_validation.HighPearsonCorrelation`](https://docs.validmind.ai/tests/data_validation/HighPearsonCorrelation.html) with the `balanced_raw_dataset` we initialized previously as input as is for comparison with later runs:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "The output above shows that the test did not pass according to the value we set for `max_threshold` — as reported and expected.\n",
-    "\n",
-    "`corr_result` is an object of type `TestResult`. We can inspect the result object to see what the test has produced:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(type(corr_result))\n",
-    "print(\"Result ID: \", corr_result.result_id)\n",
-    "print(\"Params: \", corr_result.params)\n",
-    "print(\"Passed: \", corr_result.passed)\n",
-    "print(\"Tables: \", corr_result.tables)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let's remove the highly correlated features and create a new VM `dataset` object.\n",
-    "\n",
-    "We'll begin by checking out the table in the result and extracting a list of features that failed the test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract table from `corr_result.tables`\n",
-    "features_df = corr_result.tables[0].data\n",
-    "features_df"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract list of features that failed the test\n",
-    "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Next, extract the feature names from the list of strings (example: `(Age, Exited)` > `Age`):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now, it's time to re-initialize the dataset with the highly correlated features removed.\n",
-    "\n",
-    "**Note the use of a different `input_id`.** This allows tracking the inputs used when running each individual test."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Remove the highly correlated features from the dataset\n",
-    "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
-    "\n",
-    "# Re-initialize the dataset object\n",
-    "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
-    "    dataset=balanced_raw_no_age_df,\n",
-    "    input_id=\"raw_dataset_preprocessed\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Re-running the test with the reduced feature set should pass the test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You can also plot the correlation matrix to visualize the new correlation between features:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.PearsonCorrelationMatrix\",\n",
-    "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Documenting test results\n",
-    "\n",
-    "Now that we've done some analysis on two different datasets, we can use ValidMind to easily document why certain things were done to our raw data with testing to support it. Every test result returned by the `run_test()` function has a `.log()` method that can be used to send the test results to the ValidMind Platform.\n",
-    "\n",
-    "When logging validation test results to the platform, you'll need to manually add those results to the desired section of the validation report. To demonstrate how to add test results to your validation report, we'll log our data quality tests and insert the results via the ValidMind Platform."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Configure and run comparison tests\n",
-    "\n",
-    "Below, we'll perform comparison tests between the original raw dataset (`raw_dataset`) and the final preprocessed (`raw_dataset_preprocessed`) dataset, again logging the results to the ValidMind Platform. \n",
-    "\n",
-    "We can specify all the tests we'd ike to run in a dictionary called `test_config`, and we'll pass in the following arguments for each test:\n",
-    "\n",
-    "  - **`params`:** Individual test parameters.\n",
-    "  - **`input_grid`:** Individual test inputs to compare. In this case, we'll input our two datasets for comparison.\n",
-    "\n",
-    "**Note here that the `input_grid` expects the `input_id` of the dataset as the value rather than the variable name we specified:**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Individual test config with inputs specified\n",
-    "test_config = {\n",
-    "    \"validmind.data_validation.ClassImbalance\": {\n",
-    "        \"input_grid\": {\"dataset\": [\"raw_dataset\", \"raw_dataset_preprocessed\"]},\n",
-    "        \"params\": {\"min_percent_threshold\": 30}\n",
-    "    },\n",
-    "    \"validmind.data_validation.HighPearsonCorrelation\": {\n",
-    "        \"input_grid\": {\"dataset\": [\"raw_dataset\", \"raw_dataset_preprocessed\"]},\n",
-    "        \"params\": {\"max_threshold\": 0.3}\n",
-    "    },\n",
-    "}"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Then batch run and log our tests in `test_config`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for t in test_config:\n",
-    "    print(t)\n",
-    "    try:\n",
-    "        # Check if test has input_grid\n",
-    "        if 'input_grid' in test_config[t]:\n",
-    "            # For tests with input_grid, pass the input_grid configuration\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
-    "        else:\n",
-    "            # Original logic for regular inputs\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
-    "    except Exception as e:\n",
-    "        print(f\"Error running test {t}: {str(e)}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for some test IDs. </b></span>\n",
-    "<br></br>\n",
-    "That's expected, as when we run validations tests the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Log tests with unique identifiers\n",
-    "\n",
-    "Next, we'll use the previously initialized `vm_balanced_raw_dataset` (that still has a highly correlated `Age` column) as input to run an individual test, then log the result to the ValidMind Platform.\n",
-    "\n",
-    "When running individual tests, **you can use a custom `result_id` to tag the individual result with a unique identifier:**\n",
-    "\n",
-    "- This `result_id` can be appended to `test_id` with a `:` separator.\n",
-    "- The `balanced_raw_dataset` result identifier will correspond to the `balanced_raw_dataset` input, the dataset that still has the `Age` column."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation:balanced_raw_dataset\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_3__'></a>\n",
-    "\n",
-    "### Add test results to reporting\n",
-    "\n",
-    "With some test results logged, let's head to the model we connected to at the beginning of this notebook and learn how to insert a test result into our validation report ([Need more help?](https://docs.validmind.ai/guide/model-validation/assess-compliance.html#link-validator-evidence)).\n",
-    "\n",
-    "While the example below focuses on a specific test result, you can follow the same general procedure for your other results:\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
-    "\n",
-    "3. Locate the Data Preparation section and click on **2.2.1. Data Quality** to expand that section.\n",
-    "\n",
-    "4. Under the Class Imbalance Assessment section, locate Validator Evidence then click **Link Evidence to Report**:\n",
-    "\n",
-    "    <img src= \"link-validator-evidence.png\" alt=\"Screenshot showing the validation report with the link validator evidence to report option highlighted\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "5. Select the Class Imbalance test results we logged: **ValidMind Data Validation Class Imbalance** \n",
-    "\n",
-    "    <img src= \"selecting-class-imbalance-results.png\" alt=\"Screenshot showing the ClassImbalance test selected\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "6. Click **Update Linked Evidence** to add the test results to the validation report.\n",
-    "\n",
-    "    Confirm that the results for the Class Imbalance test you inserted has been correctly inserted into section **2.2.1. Data Quality** of the report:\n",
-    "\n",
-    "    <img src= \"inserted-class-imbalance-results.png\" alt=\"Screenshot showing the ClassImbalance test inserted into the validation report\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "7. Note that these test results are flagged as **Requires Attention** — as they include comparative results from our initial raw dataset.\n",
-    "\n",
-    "    Click **See evidence details** to review the LLM-generated description that summarizes the test results, that confirm that our final preprocessed dataset actually passes our test:\n",
-    "\n",
-    "    <img src= \"class-imbalance-results-detail.png\" alt=\"Screenshot showing the ClassImbalance test generated description in the text editor\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>    Here in this text editor, you can make qualitative edits to the draft that ValidMind generated to finalize the test results.</b></span>\n",
-    "<br></br>\n",
-    "Learn more: <a href=\"https://docs.validmind.ai/guide/model-documentation/work-with-content-blocks.html\" style=\"color: #DE257E;\"><b>Work with content blocks</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Split the preprocessed dataset\n",
-    "\n",
-    "With our raw dataset rebalanced with highly correlated features removed, let's now **spilt our dataset into train and test** in preparation for model evaluation testing.\n",
-    "\n",
-    "To start, let's grab the first few rows from the `balanced_raw_no_age_df` dataset we initialized earlier:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "balanced_raw_no_age_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Before training the model, we need to encode the categorical features in the dataset:\n",
-    "\n",
-    "- Use the `OneHotEncoder` class from the `sklearn.preprocessing` module to encode the categorical features.\n",
-    "- The categorical features in the dataset are `Geography` and `Gender`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "balanced_raw_no_age_df = pd.get_dummies(\n",
-    "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
-    ")\n",
-    "balanced_raw_no_age_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Splitting our dataset into training and testing is essential for proper validation testing, as this helps assess how well the model generalizes to unseen data:\n",
-    "\n",
-    "- We start by dividing our `balanced_raw_no_age_df` dataset into training and test subsets using `train_test_split`, with 80% of the data allocated to training (`train_df`) and 20% to testing (`test_df`).\n",
-    "- From each subset, we separate the features (all columns except \"Exited\") into `X_train` and `X_test`, and the target column (\"Exited\") into `y_train` and `y_test`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.model_selection import train_test_split\n",
-    "\n",
-    "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
-    "\n",
-    "X_train = train_df.drop(\"Exited\", axis=1)\n",
-    "y_train = train_df[\"Exited\"]\n",
-    "X_test = test_df.drop(\"Exited\", axis=1)\n",
-    "y_test = test_df[\"Exited\"]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Initialize the split datasets\n",
-    "\n",
-    "Next, let's initialize the training and testing datasets so they are available for use:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset_final\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset_final\",\n",
-    "    dataset=test_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this second notebook, you learned how to:\n",
-    "\n",
-    "- [x] Import a sample dataset\n",
-    "- [x] Identify which tests you might want to run with ValidMind\n",
-    "- [x] Initialize ValidMind datasets\n",
-    "- [x] Run individual tests\n",
-    "- [x] Utilize the output from tests you’ve run\n",
-    "- [x] Log test results as evidence to the ValidMind Platform\n",
-    "- [x] Insert test results into your validation report"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "<a id='toc8_1__'></a>\n",
-    "\n",
-    "### Develop potential challenger models\n",
-    "\n",
-    "Now that you're familiar with the basics of using the ValidMind Library, let's use it to develop a challenger model: **[3 — Developing a potential challenger model](3-developing_challenger_model.ipynb)**"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-a798ee72616640f5bead3af25e6e9434",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}
diff --git a/site/notebooks/EXECUTED/model_validation/3-developing_challenger_model.ipynb b/site/notebooks/EXECUTED/model_validation/3-developing_challenger_model.ipynb
deleted file mode 100644
index e86fde85de..0000000000
--- a/site/notebooks/EXECUTED/model_validation/3-developing_challenger_model.ipynb
+++ /dev/null
@@ -1,893 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# ValidMind for model validation 3 — Developing a potential challenger model\n",
-    "\n",
-    "Learn how to use ValidMind for your end-to-end model validation process with our series of four introductory notebooks. In this third notebook, develop a potential challenger model and then pass your model and its predictions to ValidMind.\n",
-    "\n",
-    "A *challenger model* is an alternate model that attempts to outperform the champion model, ensuring that the best performing fit-for-purpose model is always considered for deployment. Challenger models also help avoid over-reliance on a single model, and allow testing of new features, algorithms, or data sources without disrupting the production lifecycle.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
-    "<br></br>\n",
-    "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Prerequisites](#toc1_)    \n",
-    "- [Setting up](#toc2_)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_1_)    \n",
-    "  - [Import the sample dataset](#toc2_2_)    \n",
-    "    - [Preprocess the dataset](#toc2_2_1_)    \n",
-    "  - [Split the preprocessed dataset](#toc2_3_)    \n",
-    "- [Import the champion model](#toc3_)    \n",
-    "- [Training a potential challenger model](#toc4_)    \n",
-    "  - [Random forest classification model](#toc4_1_)    \n",
-    "- [Initializing the model objects](#toc5_)    \n",
-    "  - [Initialize the model objects](#toc5_1_)    \n",
-    "  - [Assign predictions](#toc5_2_)    \n",
-    "- [Running model evaluation tests](#toc6_)    \n",
-    "  - [Run model performance tests](#toc6_1_)    \n",
-    "    - [Evaluate performance of the champion model](#toc6_1_1_)    \n",
-    "    - [Log an artifact](#toc6_1_2_)    \n",
-    "    - [Evaluate performance of challenger model](#toc6_1_3_)    \n",
-    "  - [Run diagnostic tests](#toc6_2_)    \n",
-    "  - [Run feature importance tests](#toc6_3_)    \n",
-    "- [In summary](#toc7_)    \n",
-    "- [Next steps](#toc8_)    \n",
-    "  - [Finalize validation and reporting](#toc8_1_)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_'></a>\n",
-    "\n",
-    "## Prerequisites\n",
-    "\n",
-    "In order to develop potential challenger models with this notebook, you'll need to first have:\n",
-    "\n",
-    "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
-    "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
-    "- [x] Learned how to import and initialize datasets for use with ValidMind\n",
-    "- [x] Understood the basics of how to run and log tests with ValidMind\n",
-    "- [x] Run data quality tests on the datasets used to train the champion model, and logged the results of those tests to ValidMind\n",
-    "- [x] Inserted your logged test results into your validation report\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
-    "<br></br>\n",
-    "Refer to the first two notebooks in this series:\n",
-    "\n",
-    "- <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a>\n",
-    "- <a href=\"2-start_validation_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the model validation process</b></a>\n",
-    "\n",
-    "</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_'></a>\n",
-    "\n",
-    "## Setting up\n",
-    "\n",
-    "This section should be quite familiar to you — as we performed the same actions in the previous notebook, **[2 — Start the model validation process](2-start_validation_process.ipynb)**."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1_'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library\n",
-    "\n",
-    "As usual, let's first connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Make sure the ValidMind Library is installed\n",
-    "\n",
-    "%pip install -q validmind\n",
-    "\n",
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"validation-report\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_'></a>\n",
-    "\n",
-    "### Import the sample dataset\n",
-    "\n",
-    "Next, we'll load in the sample [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset used to develop the champion model that we will independently preprocess:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load the sample dataset\n",
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = demo_dataset.load_data()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1_'></a>\n",
-    "\n",
-    "#### Preprocess the dataset\n",
-    "\n",
-    "We’ll apply a simple rebalancing technique to the dataset before continuing:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
-    "\n",
-    "# Create a balanced dataset with the same number of exited and not exited customers\n",
-    "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
-    "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
-    "\n",
-    "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
-    "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let’s also quickly remove highly correlated features from the dataset using the output from a ValidMind test.\n",
-    "\n",
-    "As you know, before we can run tests you’ll need to initialize a ValidMind dataset object with the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
-    "vm_balanced_raw_dataset = vm.init_dataset(\n",
-    "    dataset=balanced_raw_df,\n",
-    "    input_id=\"balanced_raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "With our balanced dataset initialized, we can then run our test and utilize the output to help us identify the features we want to remove:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Run HighPearsonCorrelation test with our balanced dataset as input and return a result object\n",
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# From result object, extract table from `corr_result.tables`\n",
-    "features_df = corr_result.tables[0].data\n",
-    "features_df"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract list of features that failed the test\n",
-    "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract feature names from the list of strings\n",
-    "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "We can then re-initialize the dataset with a different `input_id` and the highly correlated features removed and re-run the test for confirmation:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Remove the highly correlated features from the dataset\n",
-    "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
-    "\n",
-    "# Re-initialize the dataset object\n",
-    "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
-    "    dataset=balanced_raw_no_age_df,\n",
-    "    input_id=\"raw_dataset_preprocessed\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Re-run the test with the reduced feature set\n",
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3_'></a>\n",
-    "\n",
-    "### Split the preprocessed dataset\n",
-    "\n",
-    "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Encode categorical features in the dataset\n",
-    "balanced_raw_no_age_df = pd.get_dummies(\n",
-    "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
-    ")\n",
-    "balanced_raw_no_age_df.head()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.model_selection import train_test_split\n",
-    "\n",
-    "# Split the dataset into train and test\n",
-    "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
-    "\n",
-    "X_train = train_df.drop(\"Exited\", axis=1)\n",
-    "y_train = train_df[\"Exited\"]\n",
-    "X_test = test_df.drop(\"Exited\", axis=1)\n",
-    "y_test = test_df[\"Exited\"]"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the split datasets\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset_final\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset_final\",\n",
-    "    dataset=test_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_'></a>\n",
-    "\n",
-    "## Import the champion model\n",
-    "\n",
-    "With our raw dataset assessed and preprocessed, let's go ahead and import the champion model submitted by the model development team in the format of a `.pkl` file: **[lr_model_champion.pkl](lr_model_champion.pkl)**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the champion model\n",
-    "import pickle as pkl\n",
-    "\n",
-    "with open(\"lr_model_champion.pkl\", \"rb\") as f:\n",
-    "    log_reg = pkl.load(f)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_'></a>\n",
-    "\n",
-    "## Training a potential challenger model\n",
-    "\n",
-    "We're curious how an alternate model compares to our champion model, so let's train a challenger model as a basis for our testing.\n",
-    "\n",
-    "Our champion *logistic regression model* is a simpler, parametric model that assumes a linear relationship between the independent variables and the log-odds of the outcome. While logistic regression may not capture complex patterns as effectively, it offers a high degree of interpretability and is easier to explain to stakeholders. However, model risk is not calculated in isolation from a single factor, but rather in consideration with trade-offs in predictive performance, ease of interpretability, and overall alignment with business objectives."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1_'></a>\n",
-    "\n",
-    "### Random forest classification model\n",
-    "\n",
-    "A *random forest classification model* is an ensemble machine learning algorithm that uses multiple decision trees to classify data. In ensemble learning, multiple models are combined to improve prediction accuracy and robustness.\n",
-    "\n",
-    "Random forest classification models generally have higher accuracy because they capture complex, non-linear relationships, but as a result they lack transparency in their predictions."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the Random Forest Classification model\n",
-    "from sklearn.ensemble import RandomForestClassifier\n",
-    "\n",
-    "# Create the model instance with 50 decision trees\n",
-    "rf_model = RandomForestClassifier(\n",
-    "    n_estimators=50,\n",
-    "    random_state=42,\n",
-    ")\n",
-    "\n",
-    "# Train the model\n",
-    "rf_model.fit(X_train, y_train)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_'></a>\n",
-    "\n",
-    "## Initializing the model objects"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1_'></a>\n",
-    "\n",
-    "### Initialize the model objects\n",
-    "\n",
-    "In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our two models.\n",
-    "\n",
-    "You simply initialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the champion logistic regression model\n",
-    "vm_log_model = vm.init_model(\n",
-    "    log_reg,\n",
-    "    input_id=\"log_model_champion\",\n",
-    ")\n",
-    "\n",
-    "# Initialize the challenger random forest classification model\n",
-    "vm_rf_model = vm.init_model(\n",
-    "    rf_model,\n",
-    "    input_id=\"rf_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2_'></a>\n",
-    "\n",
-    "### Assign predictions\n",
-    "\n",
-    "With our models registered, we'll move on to assigning both the predictive probabilities coming directly from each model's predictions, and the binary prediction after applying the cutoff threshold described in the Compute binary predictions step above.\n",
-    "\n",
-    "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
-    "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
-    "\n",
-    "If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Champion — Logistic regression model\n",
-    "vm_train_ds.assign_predictions(model=vm_log_model)\n",
-    "vm_test_ds.assign_predictions(model=vm_log_model)\n",
-    "\n",
-    "# Challenger — Random forest classification model\n",
-    "vm_train_ds.assign_predictions(model=vm_rf_model)\n",
-    "vm_test_ds.assign_predictions(model=vm_rf_model)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_'></a>\n",
-    "\n",
-    "## Running model evaluation tests\n",
-    "\n",
-    "With our setup complete, let's run the rest of our validation tests. Since we have already verified the data quality of the dataset used to train our champion model, we will now focus on comprehensive performance evaluations of both the champion and challenger models."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1_'></a>\n",
-    "\n",
-    "### Run model performance tests\n",
-    "\n",
-    "Let's run some performance tests, beginning with independent testing of our champion logistic regression model, then moving on to our potential challenger model.\n",
-    "\n",
-    "Use [`vm.tests.list_tests()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to identify all the model performance tests for classification:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "vm.tests.list_tests(tags=[\"model_performance\"], task=\"classification\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "We'll isolate the specific tests we want to run in `mpt`:\n",
-    "\n",
-    "- [`ClassifierPerformance`](https://docs.validmind.ai/tests/model_validation/sklearn/ClassifierPerformance.html)\n",
-    "- [`ConfusionMatrix`](https://docs.validmind.ai/tests/model_validation/sklearn/ConfusionMatrix.html)\n",
-    "- [`MinimumAccuracy`](https://docs.validmind.ai/tests/model_validation/sklearn/MinimumAccuracy.html)\n",
-    "- [`MinimumF1Score`](https://docs.validmind.ai/tests/model_validation/sklearn/MinimumF1Score.html)\n",
-    "- [`ROCCurve`](https://docs.validmind.ai/tests/model_validation/sklearn/ROCCurve.html)\n",
-    "\n",
-    "As we learned in the previous notebook [2 — Start the model validation process](2-start_validation_process.ipynb), you can use a custom `result_id` to tag the individual result with a unique identifier by appending this `result_id` to the `test_id` with a `:` separator. We'll append an identifier for our champion model here:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "mpt = [\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:logreg_champion\",\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix:logreg_champion\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy:logreg_champion\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score:logreg_champion\",\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve:logreg_champion\"\n",
-    "]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1_1_'></a>\n",
-    "\n",
-    "#### Evaluate performance of the champion model\n",
-    "\n",
-    "Now, let's run and log our batch of model performance tests using our testing dataset (`vm_test_ds`) for our champion model:\n",
-    "\n",
-    "- The test set serves as a proxy for real-world data, providing an unbiased estimate of model performance since it was not used during training or tuning.\n",
-    "- The test set also acts as protection against selection bias and model tweaking, giving a final, more unbiased checkpoint."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for test in mpt:\n",
-    "    vm.tests.run_test(\n",
-    "        test,\n",
-    "        inputs={\n",
-    "            \"dataset\": vm_test_ds, \"model\" : vm_log_model,\n",
-    "        },\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for some test IDs. </b></span>\n",
-    "<br></br>\n",
-    "That's expected, as when we run validation tests the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1_2_'></a>\n",
-    "\n",
-    "#### Log an artifact\n",
-    "\n",
-    "As we can observe from the output above, our champion model doesn't pass the `MinimumAccuracy` test based on the default thresholds of the out-of-the-box test, so let's log an artifact (finding) in the ValidMind Platform ([Need more help?](https://docs.validmind.ai/guide/model-validation/add-manage-artifacts.html)):\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
-    "\n",
-    "3. Locate the Data Preparation section and click on **2.2.2. Model Performance** to expand that section.\n",
-    "\n",
-    "4. Under the Model Performance Metrics section, locate Artifacts then click **Link Artifact to Report**:\n",
-    "\n",
-    "    <img src=\"link-artifact.png\" alt=\"Screenshot showing the validation report with the link artifact option highlighted\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "5. Select **Validation Issue** as the type of artifact.\n",
-    "\n",
-    "6. Click **+ Add Validation Issue** to add a validation issue type artifact.\n",
-    "\n",
-    "7. Enter in the details for your validation issue, for example:\n",
-    "\n",
-    "    - **TITLE** — Champion Logistic Regression Model Fails Minimum Accuracy Threshold\n",
-    "    - **RISK AREA** — Model Performance\n",
-    "    - **DOCUMENTATION SECTION** — 3.2. Model Evaluation\n",
-    "    - **DESCRIPTION** — The logistic regression champion model was subjected to a Minimum Accuracy test to determine whether its predictive accuracy meets the predefined performance threshold of 0.7. The model achieved an accuracy score of 0.6136, which falls below the required minimum. As a result, the test produced a Fail outcome.\n",
-    "\n",
-    "8. Click **Save**.\n",
-    "\n",
-    "9. Select the validation issue you just added to link to your validation report and click **Update Linked Artifacts** to insert your validation issue.\n",
-    "\n",
-    "10. Click on the validation issue to expand the issue, where you can adjust details such as severity, owner, due date, status, etc. as well as include proposed remediation plans or supporting documentation as attachments."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1_3_'></a>\n",
-    "\n",
-    "#### Evaluate performance of challenger model\n",
-    "\n",
-    "We've now conducted similar tests as the model development team for our champion model, with the aim of verifying their test results.\n",
-    "\n",
-    "Next, let's see how our challenger model compares. We'll use the same batch of tests here as we did in `mpt`, but append a different `result_id` to indicate that these results should be associated with our challenger model:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "mpt_chall = [\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:champion_vs_challenger\",\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix:champion_vs_challenger\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy:champion_vs_challenger\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score:champion_vs_challenger\",\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve:champion_vs_challenger\"\n",
-    "]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "We'll run each test once for each model with the same `vm_test_ds` dataset to compare them:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for test in mpt_chall:\n",
-    "    vm.tests.run_test(\n",
-    "        test,\n",
-    "        input_grid={\n",
-    "            \"dataset\": [vm_test_ds], \"model\" : [vm_log_model,vm_rf_model]\n",
-    "        }\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Based on the performance metrics, our challenger random forest classification model passes the <code>MinimumAccuracy</code> where our champion did not.</b></span>\n",
-    "<br></br>\n",
-    "In your validation report, support your recommendation in your validation issue's <b>Proposed Remediation Plan</b> to investigate the usage of our challenger model by inserting the performance tests we logged with this notebook into the appropriate section.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_'></a>\n",
-    "\n",
-    "### Run diagnostic tests\n",
-    "\n",
-    "Next, we want to inspect the robustness and stability testing comparison between our champion and challenger model.\n",
-    "\n",
-    "Use `list_tests()` to list all available diagnosis tests applicable to classification tasks:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(tags=[\"model_diagnosis\"], task=\"classification\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let’s now assess the models for potential signs of *overfitting* and identify any sub-segments where performance may be inconsistent with the [`OverfitDiagnosis` test](https://docs.validmind.ai/tests/model_validation/sklearn/OverfitDiagnosis.html).\n",
-    "\n",
-    "Overfitting occurs when a model learns the training data too well, capturing not only the true pattern but also noise and random fluctuations, resulting in excellent performance on the training dataset but poor generalization to new, unseen data:\n",
-    "\n",
-    "- Since the training dataset (`vm_train_ds`) was used to fit the model, we use this set to establish a baseline performance for how well the model performs on data it has already seen.\n",
-    "- The testing dataset (`vm_test_ds`) was never seen during training, and here simulates real-world generalization, or how well the model performs on new, unseen data. "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.model_validation.sklearn.OverfitDiagnosis:champion_vs_challenger\",\n",
-    "    input_grid={\n",
-    "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
-    "        \"model\" : [vm_log_model,vm_rf_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let's also conduct *robustness* and *stability* testing of the two models with the [`RobustnessDiagnosis` test](https://docs.validmind.ai/tests/model_validation/sklearn/RobustnessDiagnosis.html). Robustness refers to a model's ability to maintain consistent performance, and stability refers to a model's ability to produce consistent outputs over time across different data subsets.\n",
-    "\n",
-    "Again, we'll use both the training and testing datasets to establish baseline performance and to simulate real-world generalization:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.model_validation.sklearn.RobustnessDiagnosis:Champion_vs_LogRegression\",\n",
-    "    input_grid={\n",
-    "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
-    "        \"model\" : [vm_log_model,vm_rf_model]\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3_'></a>\n",
-    "\n",
-    "### Run feature importance tests\n",
-    "\n",
-    "We also want to verify the relative influence of different input features on our models' predictions, as well as inspect the differences between our champion and challenger model to see if a certain model offers more understandable or logical importance scores for features.\n",
-    "\n",
-    "Use `list_tests()` to identify all the feature importance tests for classification:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Store the feature importance tests\n",
-    "FI = vm.tests.list_tests(tags=[\"feature_importance\"], task=\"classification\",pretty=False)\n",
-    "FI"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "We'll only use our testing dataset (`vm_test_ds`) here, to provide a realistic, unseen sample that mimics future or production data, as the training dataset has already influenced our model during learning:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Run and log our feature importance tests for both models for the testing dataset\n",
-    "for test in FI:\n",
-    "    vm.tests.run_test(\n",
-    "        \"\".join((test,':champion_vs_challenger')),\n",
-    "        input_grid={\n",
-    "            \"dataset\": [vm_test_ds], \"model\" : [vm_log_model,vm_rf_model]\n",
-    "        },\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this third notebook, you learned how to:\n",
-    "\n",
-    "- [x] Initialize ValidMind model objects\n",
-    "- [x] Assign predictions and probabilities to your ValidMind model objects\n",
-    "- [x] Use tests from ValidMind to evaluate the potential of models, including comparative tests between champion and challenger models\n",
-    "- [x] Log an artifact in the ValidMind Platform"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "<a id='toc8_1_'></a>\n",
-    "\n",
-    "### Finalize validation and reporting\n",
-    "\n",
-    "Now that you're familiar with the basics of using the ValidMind Library to run and log validation tests, let's learn how to implement some custom tests and wrap up our validation: **[4 — Finalize validation and reporting](4-finalize_validation_reporting.ipynb)**"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-0b98aebe3459409f848c2c03b413d181",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}
diff --git a/site/notebooks/EXECUTED/model_validation/4-finalize_validation_reporting.ipynb b/site/notebooks/EXECUTED/model_validation/4-finalize_validation_reporting.ipynb
deleted file mode 100644
index 854ccde766..0000000000
--- a/site/notebooks/EXECUTED/model_validation/4-finalize_validation_reporting.ipynb
+++ /dev/null
@@ -1,1233 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# ValidMind for model validation 4 — Finalize testing and reporting\n",
-    "\n",
-    "Learn how to use ValidMind for your end-to-end model validation process with our series of four introductory notebooks. In this last notebook, finalize the compliance assessment process and have a complete validation report ready for review.\n",
-    "\n",
-    "This notebook will walk you through how to supplement ValidMind tests with your own custom tests and include them as additional evidence in your validation report. A custom test is any function that takes a set of inputs and parameters as arguments and returns one or more outputs:\n",
-    "\n",
-    "- The function can be as simple or as complex as you need it to be — it can use external libraries, make API calls, or do anything else that you can do in Python.\n",
-    "- The only requirement is that the function signature and return values can be \"understood\" and handled by the ValidMind Library. As such, custom tests offer added flexibility by extending the default tests provided by ValidMind, enabling you to document any type of model or use case.\n",
-    "\n",
-    "**For a more in-depth introduction to custom tests,** refer to our [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb) notebook.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
-    "<br></br>\n",
-    "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Prerequisites](#toc1__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_1__)    \n",
-    "  - [Import the sample dataset](#toc2_2__)    \n",
-    "  - [Split the preprocessed dataset](#toc2_3__)    \n",
-    "  - [Import the champion model](#toc2_4__)    \n",
-    "  - [Train potential challenger model](#toc2_5__)    \n",
-    "  - [Initialize the model objects](#toc2_6__)    \n",
-    "- [Implementing custom tests](#toc3__)    \n",
-    "  - [Implement a custom inline test](#toc3_1__)    \n",
-    "    - [Create a confusion matrix plot](#toc3_1_1__)    \n",
-    "    - [Add parameters to custom tests](#toc3_1_2__)    \n",
-    "    - [Pass parameters to custom tests](#toc3_1_3__)    \n",
-    "  - [Use external test providers](#toc3_2__)    \n",
-    "    - [Create custom tests folder](#toc3_2_1__)    \n",
-    "    - [Save an inline test](#toc3_2_2__)    \n",
-    "    - [Register a local test provider](#toc3_2_3__)    \n",
-    "- [Verify test runs](#toc4__)    \n",
-    "- [In summary](#toc5__)    \n",
-    "- [Next steps](#toc6__)    \n",
-    "  - [Work with your validation report](#toc6_1__)    \n",
-    "  - [Learn more](#toc6_2__)    \n",
-    "    - [Use cases](#toc6_2_1__)    \n",
-    "    - [Discover more learning resources](#toc6_2_2__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Prerequisites\n",
-    "\n",
-    "In order to finalize validation and reporting, you'll need to first have:\n",
-    "\n",
-    "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
-    "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
-    "- [x] Learned how to import and initialize datasets and models for use with ValidMind\n",
-    "- [x] Understood the basics of how to identify and run validation tests\n",
-    "- [x] Run validation tests for your champion and challenger models, and logged the results of those tests to the ValidMind Platform\n",
-    "- [x] Inserted your logged test results into your validation report\n",
-    "- [x] Added some preliminary artifacts (findings) to your validation report\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
-    "<br></br>\n",
-    "Refer to the first three notebooks in this series:\n",
-    "\n",
-    "- <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a>\n",
-    "- <a href=\"2-start_validation_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the model validation process</b></a>\n",
-    "- <a href=\"3-developing_challenger_model.ipynb\" style=\"color: #DE257E;\"><b>3 — Developing a potential challenger model</b></a>\n",
-    "\n",
-    "</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up\n",
-    "\n",
-    "This section should be very familiar to you now — as we performed the same actions in the previous two notebooks in this series."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library\n",
-    "\n",
-    "As usual, let's first connect the ValidMind Library to the model we previously registered in the ValidMind Platform:\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Make sure the ValidMind Library is installed\n",
-    "\n",
-    "%pip install -q validmind\n",
-    "\n",
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"validation-report\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Import the sample dataset\n",
-    "\n",
-    "Next, we'll load in the same sample [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset used to develop the champion model that we will independently preprocess:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load the sample dataset\n",
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = demo_dataset.load_data()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the raw dataset for use in ValidMind tests\n",
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=raw_df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
-    "\n",
-    "# Create a balanced dataset with the same number of exited and not exited customers\n",
-    "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
-    "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
-    "\n",
-    "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
-    "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let’s also quickly remove highly correlated features from the dataset using the output from a ValidMind test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
-    "vm_balanced_raw_dataset = vm.init_dataset(\n",
-    "    dataset=balanced_raw_df,\n",
-    "    input_id=\"balanced_raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Run HighPearsonCorrelation test with our balanced dataset as input and return a result object\n",
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# From result object, extract table from `corr_result.tables`\n",
-    "features_df = corr_result.tables[0].data\n",
-    "features_df"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract list of features that failed the test\n",
-    "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract feature names from the list of strings\n",
-    "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Remove the highly correlated features from the dataset\n",
-    "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
-    "\n",
-    "# Re-initialize the dataset object\n",
-    "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
-    "    dataset=balanced_raw_no_age_df,\n",
-    "    input_id=\"raw_dataset_preprocessed\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Re-run the test with the reduced feature set\n",
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Split the preprocessed dataset\n",
-    "\n",
-    "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Encode categorical features in the dataset\n",
-    "balanced_raw_no_age_df = pd.get_dummies(\n",
-    "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
-    ")\n",
-    "balanced_raw_no_age_df.head()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.model_selection import train_test_split\n",
-    "\n",
-    "# Split the dataset into train and test\n",
-    "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
-    "\n",
-    "X_train = train_df.drop(\"Exited\", axis=1)\n",
-    "y_train = train_df[\"Exited\"]\n",
-    "X_test = test_df.drop(\"Exited\", axis=1)\n",
-    "y_test = test_df[\"Exited\"]"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the split datasets\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset_final\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset_final\",\n",
-    "    dataset=test_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Import the champion model\n",
-    "\n",
-    "With our raw dataset assessed and preprocessed, let's go ahead and import the champion model submitted by the model development team in the format of a `.pkl` file: **[lr_model_champion.pkl](lr_model_champion.pkl)**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the champion model\n",
-    "import pickle as pkl\n",
-    "\n",
-    "with open(\"lr_model_champion.pkl\", \"rb\") as f:\n",
-    "    log_reg = pkl.load(f)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_5__'></a>\n",
-    "\n",
-    "### Train potential challenger model\n",
-    "\n",
-    "We'll also train our random forest classification challenger model to see how it compares:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the Random Forest Classification model\n",
-    "from sklearn.ensemble import RandomForestClassifier\n",
-    "\n",
-    "# Create the model instance with 50 decision trees\n",
-    "rf_model = RandomForestClassifier(\n",
-    "    n_estimators=50,\n",
-    "    random_state=42,\n",
-    ")\n",
-    "\n",
-    "# Train the model\n",
-    "rf_model.fit(X_train, y_train)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_6__'></a>\n",
-    "\n",
-    "### Initialize the model objects\n",
-    "\n",
-    "In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our two models:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the champion logistic regression model\n",
-    "vm_log_model = vm.init_model(\n",
-    "    log_reg,\n",
-    "    input_id=\"log_model_champion\",\n",
-    ")\n",
-    "\n",
-    "# Initialize the challenger random forest classification model\n",
-    "vm_rf_model = vm.init_model(\n",
-    "    rf_model,\n",
-    "    input_id=\"rf_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Assign predictions to Champion — Logistic regression model\n",
-    "vm_train_ds.assign_predictions(model=vm_log_model)\n",
-    "vm_test_ds.assign_predictions(model=vm_log_model)\n",
-    "\n",
-    "# Assign predictions to Challenger — Random forest classification model\n",
-    "vm_train_ds.assign_predictions(model=vm_rf_model)\n",
-    "vm_test_ds.assign_predictions(model=vm_rf_model)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Implementing custom tests\n",
-    "\n",
-    "Thanks to the model documentation ([Learn more ...](https://docs.validmind.ai/developer/validmind-library.html#for-model-development)), we know that the model development team implemented a custom test to further evaluate the performance of the champion model.\n",
-    "\n",
-    "In a usual model validation situation, you would load a saved custom test provided by the model development team. In the following section, we'll have you implement the same custom test and make it available for reuse, to familiarize you with the processes.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about custom tests?</b></span>\n",
-    "<br></br>\n",
-    "Refer to our in-depth introduction to custom tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/implement_custom_tests.html\" style=\"color: #DE257E;\"><b>Implement custom tests</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Implement a custom inline test\n",
-    "\n",
-    "Let's implement the same custom *inline test* that calculates the confusion matrix for a binary classification model that the model development team used in their performance evaluations.\n",
-    "\n",
-    "- An inline test refers to a test written and executed within the same environment as the code being tested — in this case, right in this Jupyter Notebook —  without requiring a separate test file or framework.\n",
-    "- You'll note that the custom test function is just a regular Python function that can include and require any Python library as you see fit."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_1__'></a>\n",
-    "\n",
-    "#### Create a confusion matrix plot\n",
-    "\n",
-    "Let's first create a confusion matrix plot using the `confusion_matrix` function from the `sklearn.metrics` module:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import matplotlib.pyplot as plt\n",
-    "from sklearn import metrics\n",
-    "\n",
-    "# Get the predicted classes\n",
-    "y_pred = log_reg.predict(vm_test_ds.x)\n",
-    "\n",
-    "confusion_matrix = metrics.confusion_matrix(y_test, y_pred)\n",
-    "\n",
-    "cm_display = metrics.ConfusionMatrixDisplay(\n",
-    "    confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
-    ")\n",
-    "cm_display.plot()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Next, create a [`@vm.test` wrapper](https://docs.validmind.ai/validmind/validmind.html#test) that will allow you to create a reusable test. **Note the following changes in the code below:**\n",
-    "\n",
-    "- The function `confusion_matrix` takes two arguments, `dataset` and `model`. These are `VMDataset` and `VMModel` objects, respectively.\n",
-    "  - `VMDataset` objects allow you to access the dataset's true (target) values by accessing the `.y` attribute.\n",
-    "  - `VMDataset` objects allow you to access the predictions for a given model by accessing the `.y_pred()` method.\n",
-    "- The function docstring provides a description of what the test does. This will be displayed along with the result in this notebook as well as in the ValidMind Platform.\n",
-    "- The function body calculates the confusion matrix using the `sklearn.metrics.confusion_matrix` function as we just did above.\n",
-    "- The function then returns the `ConfusionMatrixDisplay.figure_` object — this is important as the ValidMind Library expects the output of the custom test to be a plot or a table.\n",
-    "- The `@vm.test` decorator is doing the work of creating a wrapper around the function that will allow it to be run by the ValidMind Library. It also registers the test so it can be found by the ID `my_custom_tests.ConfusionMatrix`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
-    "def confusion_matrix(dataset, model):\n",
-    "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
-    "\n",
-    "    The confusion matrix is a 2x2 table that contains 4 values:\n",
-    "\n",
-    "    - True Positive (TP): the number of correct positive predictions\n",
-    "    - True Negative (TN): the number of correct negative predictions\n",
-    "    - False Positive (FP): the number of incorrect positive predictions\n",
-    "    - False Negative (FN): the number of incorrect negative predictions\n",
-    "\n",
-    "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
-    "    \"\"\"\n",
-    "    y_true = dataset.y\n",
-    "    y_pred = dataset.y_pred(model=model)\n",
-    "\n",
-    "    confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
-    "\n",
-    "    cm_display = metrics.ConfusionMatrixDisplay(\n",
-    "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
-    "    )\n",
-    "    cm_display.plot()\n",
-    "\n",
-    "    plt.close()  # close the plot to avoid displaying it\n",
-    "\n",
-    "    return cm_display.figure_  # return the figure object itself"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You can now run the newly created custom test on both the training and test datasets for both models using the [`run_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Champion train and test\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_custom_tests.ConfusionMatrix:champion\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds,vm_test_ds],\n",
-    "        \"model\" : [vm_log_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Challenger train and test\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_custom_tests.ConfusionMatrix:challenger\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds,vm_test_ds],\n",
-    "        \"model\" : [vm_rf_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for some test IDs. </b></span>\n",
-    "<br></br>\n",
-    "That's expected, as when we run validation tests the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_2__'></a>\n",
-    "\n",
-    "#### Add parameters to custom tests\n",
-    "\n",
-    "Custom tests can take parameters just like any other function. To demonstrate, let's modify the `confusion_matrix` function to take an additional parameter `normalize` that will allow you to normalize the confusion matrix:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
-    "def confusion_matrix(dataset, model, normalize=False):\n",
-    "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
-    "\n",
-    "    The confusion matrix is a 2x2 table that contains 4 values:\n",
-    "\n",
-    "    - True Positive (TP): the number of correct positive predictions\n",
-    "    - True Negative (TN): the number of correct negative predictions\n",
-    "    - False Positive (FP): the number of incorrect positive predictions\n",
-    "    - False Negative (FN): the number of incorrect negative predictions\n",
-    "\n",
-    "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
-    "    \"\"\"\n",
-    "    y_true = dataset.y\n",
-    "    y_pred = dataset.y_pred(model=model)\n",
-    "\n",
-    "    if normalize:\n",
-    "        confusion_matrix = metrics.confusion_matrix(y_true, y_pred, normalize=\"all\")\n",
-    "    else:\n",
-    "        confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
-    "\n",
-    "    cm_display = metrics.ConfusionMatrixDisplay(\n",
-    "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
-    "    )\n",
-    "    cm_display.plot()\n",
-    "\n",
-    "    plt.close()  # close the plot to avoid displaying it\n",
-    "\n",
-    "    return cm_display.figure_  # return the figure object itself"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_3__'></a>\n",
-    "\n",
-    "#### Pass parameters to custom tests\n",
-    "\n",
-    "You can pass parameters to custom tests by providing a dictionary of parameters to the `run_test()` function.\n",
-    "\n",
-    "- The parameters will override any default parameters set in the custom test definition. Note that `dataset` and `model` are still passed as `inputs`.\n",
-    "- Since these are `VMDataset` or `VMModel` inputs, they have a special meaning.\n",
-    "\n",
-    "Re-running and logging the custom confusion matrix with `normalize=True` for both models and our testing dataset looks like this:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Champion with test dataset and normalize=True\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_custom_tests.ConfusionMatrix:test_normalized_champion\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\" : [vm_log_model]\n",
-    "    },\n",
-    "    params={\"normalize\": True}\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Challenger with test dataset and normalize=True\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_custom_tests.ConfusionMatrix:test_normalized_challenger\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\" : [vm_rf_model]\n",
-    "    },\n",
-    "    params={\"normalize\": True}\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Use external test providers\n",
-    "\n",
-    "Sometimes you may want to reuse the same set of custom tests across multiple models and share them with others in your organization, like the model development team would have done with you in this example workflow featured in this series of notebooks. In this case, you can create an external custom *test provider* that will allow you to load custom tests from a local folder or a Git repository.\n",
-    "\n",
-    "In this section you will learn how to declare a local filesystem test provider that allows loading tests from a local folder following these high level steps:\n",
-    "\n",
-    "1. Create a folder of custom tests from existing inline tests (tests that exist in your active Jupyter Notebook)\n",
-    "2. Save an inline test to a file\n",
-    "3. Define and register a [`LocalTestProvider`](https://docs.validmind.ai/validmind/validmind/tests.html#LocalTestProvider) that points to that folder\n",
-    "4. Run test provider tests\n",
-    "5. Add the test results to your documentation"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_1__'></a>\n",
-    "\n",
-    "#### Create custom tests folder\n",
-    "\n",
-    "Let's start by creating a new folder that will contain reusable custom tests from your existing inline tests.\n",
-    "\n",
-    "The following code snippet will create a new `my_tests` directory in the current working directory if it doesn't exist:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "tests_folder = \"my_tests\"\n",
-    "\n",
-    "import os\n",
-    "\n",
-    "# create tests folder\n",
-    "os.makedirs(tests_folder, exist_ok=True)\n",
-    "\n",
-    "# remove existing tests\n",
-    "for f in os.listdir(tests_folder):\n",
-    "    # remove files and pycache\n",
-    "    if f.endswith(\".py\") or f == \"__pycache__\":\n",
-    "        os.system(f\"rm -rf {tests_folder}/{f}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "After running the command above, confirm that a new `my_tests` directory was created successfully. For example:\n",
-    "\n",
-    "```\n",
-    "~/notebooks/tutorials/model_validation/my_tests/\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_2__'></a>\n",
-    "\n",
-    "#### Save an inline test\n",
-    "\n",
-    "The `@vm.test` decorator we used in **Implement a custom inline test** above to register one-off custom tests also includes a convenience method on the function object that allows you to simply call `<func_name>.save()` to save the test to a Python file at a specified path.\n",
-    "\n",
-    "While `save()` will get you started by creating the file and saving the function code with the correct name, it won't automatically include any imports, or other functions or variables, outside of the functions that are needed for the test to run. To solve this, pass in an optional `imports` argument ensuring necessary imports are added to the file.\n",
-    "\n",
-    "The `confusion_matrix` test requires the following additional imports:\n",
-    "\n",
-    "```python\n",
-    "import matplotlib.pyplot as plt\n",
-    "from sklearn import metrics\n",
-    "```\n",
-    "\n",
-    "Let's pass these imports to the `save()` method to ensure they are included in the file with the following command:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "confusion_matrix.save(\n",
-    "    # Save it to the custom tests folder we created\n",
-    "    tests_folder,\n",
-    "    imports=[\"import matplotlib.pyplot as plt\", \"from sklearn import metrics\"],\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "- [x] Confirm that the `save()` method saved the `confusion_matrix` function to a file named `ConfusionMatrix.py` in the `my_tests` folder.\n",
-    "- [x] Note that the new file provides some context on the origin of the test, which is useful for traceability:\n",
-    "\n",
-    "    ```\n",
-    "    # Saved from __main__.confusion_matrix\n",
-    "    # Original Test ID: my_custom_tests.ConfusionMatrix\n",
-    "    # New Test ID: <test_provider_namespace>.ConfusionMatrix\n",
-    "    ```\n",
-    "\n",
-    "- [x]  Additionally, the new test function has been stripped off its decorator, as it now resides in a file that will be loaded by the test provider:\n",
-    "\n",
-    "    ```python\n",
-    "    def ConfusionMatrix(dataset, model, normalize=False):\n",
-    "    ```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_3__'></a>\n",
-    "\n",
-    "#### Register a local test provider\n",
-    "\n",
-    "Now that your `my_tests` folder has a sample custom test, let's initialize a test provider that will tell the ValidMind Library where to find your custom tests:\n",
-    "\n",
-    "- ValidMind offers out-of-the-box test providers for local tests (tests in a folder) or a Github provider for tests in a Github repository.\n",
-    "- You can also create your own test provider by creating a class that has a [`load_test` method](https://docs.validmind.ai/validmind/validmind/tests.html#load_test) that takes a test ID and returns the test function matching that ID.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about test providers?</b></span>\n",
-    "<br></br>\n",
-    "An extended introduction to test providers can be found in: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/integrate_external_test_providers.html\" style=\"color: #DE257E;\"><b>Integrate external test providers</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "##### Initialize a local test provider\n",
-    "\n",
-    "For most use cases, using a `LocalTestProvider` that allows you to load custom tests from a designated directory should be sufficient.\n",
-    "\n",
-    "**The most important attribute for a test provider is its `namespace`.** This is a string that will be used to prefix test IDs in model documentation. This allows you to have multiple test providers with tests that can even share the same ID, but are distinguished by their namespace.\n",
-    "\n",
-    "Let's go ahead and load the custom tests from our `my_tests` directory:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.tests import LocalTestProvider\n",
-    "\n",
-    "# initialize the test provider with the tests folder we created earlier\n",
-    "my_test_provider = LocalTestProvider(tests_folder)\n",
-    "\n",
-    "vm.tests.register_test_provider(\n",
-    "    namespace=\"my_test_provider\",\n",
-    "    test_provider=my_test_provider,\n",
-    ")\n",
-    "# `my_test_provider.load_test()` will be called for any test ID that starts with `my_test_provider`\n",
-    "# e.g. `my_test_provider.ConfusionMatrix` will look for a function named `ConfusionMatrix` in `my_tests/ConfusionMatrix.py` file"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "##### Run test provider tests\n",
-    "\n",
-    "Now that we've set up the test provider, we can run any test that's located in the tests folder by using the `run_test()` method as with any other test:\n",
-    "\n",
-    "- For tests that reside in a test provider directory, the test ID will be the `namespace` specified when registering the provider, followed by the path to the test file relative to the tests folder.\n",
-    "- For example, the Confusion Matrix test we created earlier will have the test ID `my_test_provider.ConfusionMatrix`. You could organize the tests in subfolders, say `classification` and `regression`, and the test ID for the Confusion Matrix test would then be `my_test_provider.classification.ConfusionMatrix`.\n",
-    "\n",
-    "Let's go ahead and re-run the confusion matrix test with our testing dataset for our two models by using the test ID `my_test_provider.ConfusionMatrix`. This should load the test from the test provider and run it as before."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Champion with test dataset and test provider custom test\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_test_provider.ConfusionMatrix:champion\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\" : [vm_log_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Challenger with test dataset  and test provider custom test\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_test_provider.ConfusionMatrix:challenger\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\" : [vm_rf_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Verify test runs\n",
-    "\n",
-    "Our final task is to verify that all the tests provided by the model development team were run and reported accurately. Note the appended `result_ids` to delineate which dataset we ran the test with for the relevant tests.\n",
-    "\n",
-    "Here, we'll specify all the tests we'd like to independently rerun in a dictionary called `test_config`. **Note here that `inputs` and `input_grid` expect the `input_id` of the dataset or model as the value rather than the variable name we specified**:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test_config = {\n",
-    "    # Run with the raw dataset\n",
-    "    'validmind.data_validation.DatasetDescription:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.DescriptiveStatistics:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.MissingValues:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percentage_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.ClassImbalance:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percent_threshold': 10}\n",
-    "    },\n",
-    "    'validmind.data_validation.Duplicates:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.HighCardinality:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {\n",
-    "            'num_threshold': 100,\n",
-    "            'percent_threshold': 0.1,\n",
-    "            'threshold_type': 'percent'\n",
-    "        }\n",
-    "    },\n",
-    "    'validmind.data_validation.Skewness:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'max_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.UniqueRows:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percent_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TooManyZeroValues:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'max_percent_threshold': 0.03}\n",
-    "    },\n",
-    "    'validmind.data_validation.IQROutliersTable:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'threshold': 5}\n",
-    "    },\n",
-    "    # Run with the preprocessed dataset\n",
-    "    'validmind.data_validation.DescriptiveStatistics:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularDescriptionTables:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
-    "    },\n",
-    "    'validmind.data_validation.MissingValues:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'},\n",
-    "        'params': {'min_percentage_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularNumericalHistograms:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularCategoricalBarPlots:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TargetRateBarPlots:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'},\n",
-    "        'params': {'default_column': 'loan_status'}\n",
-    "    },\n",
-    "    # Run with the training and test datasets\n",
-    "    'validmind.data_validation.DescriptiveStatistics:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularDescriptionTables:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
-    "    },\n",
-    "    'validmind.data_validation.ClassImbalance:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
-    "        'params': {'min_percent_threshold': 10}\n",
-    "    },\n",
-    "    'validmind.data_validation.UniqueRows:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
-    "        'params': {'min_percent_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularNumericalHistograms:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
-    "    },\n",
-    "    'validmind.data_validation.MutualInformation:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
-    "        'params': {'min_threshold': 0.01}\n",
-    "    },\n",
-    "    'validmind.data_validation.PearsonCorrelationMatrix:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
-    "    },\n",
-    "    'validmind.data_validation.HighPearsonCorrelation:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
-    "        'params': {'max_threshold': 0.3, 'top_n_correlations': 10}\n",
-    "    },\n",
-    "    'validmind.model_validation.ModelMetadata': {\n",
-    "        'input_grid': {'model': ['log_model_champion', 'rf_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ModelParameters': {\n",
-    "        'input_grid': {'model': ['log_model_champion', 'rf_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ROCCurve': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final'], 'model': ['log_model_champion']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.MinimumROCAUCScore': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final'], 'model': ['log_model_champion']},\n",
-    "        'params': {'min_threshold': 0.5}\n",
-    "    }\n",
-    "}"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Then batch run and log our tests in `test_config`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for t in test_config:\n",
-    "    print(t)\n",
-    "    try:\n",
-    "        # Check if test has input_grid\n",
-    "        if 'input_grid' in test_config[t]:\n",
-    "            # For tests with input_grid, pass the input_grid configuration\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
-    "        else:\n",
-    "            # Original logic for regular inputs\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
-    "    except Exception as e:\n",
-    "        print(f\"Error running test {t}: {str(e)}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this final notebook, you learned how to:\n",
-    "\n",
-    "- [x] Implement a custom inline test\n",
-    "- [x] Run and log your custom inline tests\n",
-    "- [x] Use external custom test providers\n",
-    "- [x] Run and log tests from your custom test providers\n",
-    "- [x] Re-run tests provided by your model development team to verify that they were run and reported accurately\n",
-    "\n",
-    "With our ValidMind for model validation series of notebooks, you learned how to validate a model end-to-end with the ValidMind Library by running through some common scenarios in a typical model validation setting:\n",
-    "\n",
-    "- Verifying the data quality steps performed by the model development team\n",
-    "- Independently replicating the champion model's results and conducting additional tests to assess performance, stability, and robustness\n",
-    "- Setting up test inputs and a challenger model for comparative analysis\n",
-    "- Running validation tests, analyzing results, and logging artifacts to ValidMind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Next steps"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Work with your validation report\n",
-    "\n",
-    "Now that you've logged all your test results and verified the work done by the model development team, head to the ValidMind Platform to wrap up your validation report. Continue to work on your validation report by:\n",
-    "\n",
-    "- **Inserting additional test results:** Click **Link Evidence to Report** under any section of 2. Validation in your validation report. (Learn more: [Link evidence to reports](https://docs.validmind.ai/guide/model-validation/assess-compliance.html#link-evidence-to-reports))\n",
-    "\n",
-    "- **Making qualitative edits to your test descriptions:** Expand any linked evidence under Validator Evidence and click **See evidence details** to review and edit the ValidMind-generated test descriptions for quality and accuracy. (Learn more: [Preparing validation reports](https://docs.validmind.ai/guide/model-validation/preparing-validation-reports.html#get-started))\n",
-    "\n",
-    "- **Adding more findings:** Click **Link Finding to Report** in any validation report section, then click **+ Create New Finding**. (Learn more: [Add and manage model findings](https://docs.validmind.ai/guide/model-validation/add-manage-model-findings.html))\n",
-    "\n",
-    "- **Adding risk assessment notes:** Click under **Risk Assessment Notes** in any validation report section to access the text editor and content editing toolbar, including an option to generate a draft with AI. Once generated, edit your ValidMind-generated test descriptions to adhere to your organization's requirements. (Learn more: [Work with content blocks](https://docs.validmind.ai/guide/model-documentation/work-with-content-blocks.html#content-editing-toolbar))\n",
-    "\n",
-    "- **Assessing compliance:** Under the Guideline for any validation report section, click **ASSESSMENT** and select the compliance status from the drop-down menu. (Learn more: [Provide compliance assessments](https://docs.validmind.ai/guide/model-validation/assess-compliance.html#provide-compliance-assessments))\n",
-    "\n",
-    "- **Collaborate with other stakeholders:** Use the ValidMind Platform's real-time collaborative features to work seamlessly together with the rest of your organization, including model developers. Propose suggested changes in the model documentation, work with versioned history, and use comments to discuss specific portions of the model documentation. (Learn more: [Collaborate with others](https://docs.validmind.ai/guide/model-documentation/collaborate-with-others.html))\n",
-    "\n",
-    "When your validation report is complete and ready for review, submit it for approval from the same ValidMind Platform where you made your edits and collaborated with the rest of your organization, ensuring transparency and a thorough model validation history. (Learn more: [Submit for approval](https://docs.validmind.ai/guide/model-documentation/submit-for-approval.html))"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Learn more\n",
-    "\n",
-    "Now that you're familiar with the basics, you can explore the following notebooks to get a deeper understanding on how the ValidMind Library assists you in streamlining model validation:"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_1__'></a>\n",
-    "\n",
-    "#### Use cases\n",
-    "\n",
-    "- [Validate an application scorecard model](../../use_cases/model_validation/validate_application_scorecard.ipynb)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_2__'></a>\n",
-    "\n",
-    "#### Discover more learning resources\n",
-    "\n",
-    "Learn more about the ValidMind Library tools we used in this notebook:\n",
-    "\n",
-    "- [Explore tests](../../how_to/tests/explore_tests/explore_tests.ipynb)\n",
-    "- [Run dataset-based tests](../../how_to/tests/run_tests/1_run_dataset_based_tests.ipynb)\n",
-    "- [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb)\n",
-    "- [Integrate external test providers](../../how_to/tests/custom_tests/integrate_external_test_providers.ipynb)\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-8028ef6a3da9409a8eab5aa0cf246c57",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}
diff --git a/site/notebooks/EXECUTED/model_validation/inserted-class-imbalance-results.png b/site/notebooks/EXECUTED/model_validation/inserted-class-imbalance-results.png
deleted file mode 100644
index 2efea1a09b..0000000000
Binary files a/site/notebooks/EXECUTED/model_validation/inserted-class-imbalance-results.png and /dev/null differ
diff --git a/site/notebooks/EXECUTED/model_validation/link-artifact.png b/site/notebooks/EXECUTED/model_validation/link-artifact.png
deleted file mode 100644
index 23edc1c9eb..0000000000
Binary files a/site/notebooks/EXECUTED/model_validation/link-artifact.png and /dev/null differ
diff --git a/site/notebooks/EXECUTED/model_validation/link-validator-evidence.png b/site/notebooks/EXECUTED/model_validation/link-validator-evidence.png
deleted file mode 100644
index 660a19cfab..0000000000
Binary files a/site/notebooks/EXECUTED/model_validation/link-validator-evidence.png and /dev/null differ
diff --git a/site/notebooks/EXECUTED/validation/1-set_up_validmind_for_validation.ipynb b/site/notebooks/EXECUTED/validation/1-set_up_validmind_for_validation.ipynb
new file mode 100644
index 0000000000..feda59a354
--- /dev/null
+++ b/site/notebooks/EXECUTED/validation/1-set_up_validmind_for_validation.ipynb
@@ -0,0 +1,533 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# ValidMind for validation 1 — Set up the ValidMind Library for validation\n",
+        "\n",
+        "Learn how to use ValidMind for your end-to-end validation process based on common scenarios with our series of four introductory notebooks. In this first notebook, set up the ValidMind Library in preparation for validating a champion.\n",
+        "\n",
+        "These notebooks use a binary classification model as an example, but the same principles shown here apply to other record (model) types.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
+        "<br></br>\n",
+        "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
+      ],
+      "id": "821a881e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Introduction](#toc1__)    \n",
+        "- [About ValidMind](#toc2__)    \n",
+        "  - [Before you begin](#toc2_1__)    \n",
+        "  - [New to ValidMind?](#toc2_2__)    \n",
+        "  - [Key concepts](#toc2_3__)    \n",
+        "- [Setting up](#toc3__)    \n",
+        "  - [Register a sample model](#toc3_1__)    \n",
+        "    - [Assign validator credentials](#toc3_1_1__)    \n",
+        "    - [Apply documentation template](#toc3_1_2__)    \n",
+        "    - [Apply validation report template](#toc3_1_3__)    \n",
+        "  - [Install the ValidMind Library](#toc3_2__)    \n",
+        "  - [Initialize the ValidMind Library](#toc3_3__)    \n",
+        "    - [Get your code snippet](#toc3_3_1__)    \n",
+        "- [Getting to know ValidMind](#toc4__)    \n",
+        "  - [Preview the validation report template](#toc4_1__)    \n",
+        "    - [View validation report in the ValidMind Platform](#toc4_1_1__)    \n",
+        "  - [Explore available tests](#toc4_2__)    \n",
+        "- [Upgrade ValidMind](#toc5__)    \n",
+        "- [In summary](#toc6__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Start the validation process](#toc7_1__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "19ea797c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Introduction\n",
+        "\n",
+        "Validation aims to independently assess the compliance of *champions* created by developers with regulatory guidance by conducting thorough testing and analysis, potentially including the use of challengers to benchmark performance. Assessments, presented in the form of a validation report, typically include *artifacts (findings)* and recommendations to address those issues.\n",
+        "\n",
+        "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
+        "\n",
+        "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
+        "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
+      ],
+      "id": "d624f88d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate comparison and other validation tests, and then use the ValidMind Platform to submit compliance assessments of champions via comprehensive validation reports. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and developers."
+      ],
+      "id": "4fb1ef5a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ],
+      "id": "594f9fd4"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ],
+      "id": "262ed111"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**validation report**: A validation report is a comprehensive and structured review evaluating a record's accuracy, performance, and suitability for its intended purpose. A report follows established validation guidelines to ensure consistency and adherence to internal and regulatory standards — encompassing the process of risk assessment, identifying areas of potential error or risk within the record's components, supporting transparency, regulatory compliance, and informed decision-making by documenting the validator’s independent review and conclusions.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**validation report template**: A default ValidMind document template that serves as a standardized framework for conducting and documenting validation, including sections designated for attaching test results, evidence, or artifacts (findings). By outlining required documentation, recommended analyses, and expected validation tests, validation report templates ensure consistency and completeness across validation reports and help guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.\n",
+        "\n",
+        "**artifacts (findings)**: Observations or issues identified during validation, including any deviations from expected performance or standards. Artifacts are organized by type — default types provided by ValidMind include Validation Issue, Policy Exception, and Limitation. Custom artifact types can be created to track other categories relevant to your organization.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "0eb67fe9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "e0e1cf3d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Register a sample model\n",
+        "\n",
+        "In a usual lifecycle, a champion will have been independently registered in your inventory and submitted to you for validation by your development team as part of the effective challenge process. (**Learn more:** [Submit documents](https://docs.validmind.ai/guide/documentation/submit-documents.html))\n",
+        "\n",
+        "For this notebook, we'll have you register a dummy record (model) in the ValidMind Platform inventory and assign yourself as the validator to familiarize you with the ValidMind interface and circumvent the need for an existing model:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down — don’t worry, we’ll adjust these permissions next for validation.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ],
+      "id": "609fe59b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_1__'></a>\n",
+        "\n",
+        "#### Assign validator credentials\n",
+        "\n",
+        "In order to log tests as a validator instead of as a developer, on the details page that appears after you've successfully registered your sample model:\n",
+        "\n",
+        "1. Remove yourself as an owner:\n",
+        "\n",
+        "    - Click on the **OWNERS** tile.\n",
+        "    - Click the **x** next to your name to remove yourself from that model's role.\n",
+        "    - Click **Save** to apply your changes to that role.\n",
+        "\n",
+        "2. Remove yourself as a developer:\n",
+        "\n",
+        "    - Click on the **DEVELOPERS** tile.\n",
+        "    - Click the **x** next to your name to remove yourself from that model's role.\n",
+        "    - Click **Save** to apply your changes to that role.\n",
+        "\n",
+        "3. Add yourself as a validator:\n",
+        "\n",
+        "    - Click on the **VALIDATORS** tile.\n",
+        "    - Select your name from the drop-down menu.\n",
+        "    - Click **Save** to apply your changes to that role."
+      ],
+      "id": "58e552bb"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier for developers.\n",
+        "\n",
+        "We'll need this documentation template later for reference as we draft our validation report:\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Documentation**.\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "84251589"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_3__'></a>\n",
+        "\n",
+        "#### Apply validation report template\n",
+        "\n",
+        "Next, let's select a validation report template. A template predefines sections for your report and provides a general outline to follow, making the validation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Validation**.\n",
+        "\n",
+        "    If you cannot locate your Validation document, make sure Validation type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Generic Validation Report`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "fdfb5dc5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ],
+      "id": "f656d0d6"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "931d8f7f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ],
+      "id": "1435fd5b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3_1__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "b375b341"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"validation-report\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "d5d87e2d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Getting to know ValidMind"
+      ],
+      "id": "331e1c07"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Preview the validation report template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will attach evidence to this template in the form of risk assessment notes, artifacts, and test results later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library:"
+      ],
+      "id": "f6331a98"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "13d34bbb"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1_1__'></a>\n",
+        "\n",
+        "#### View validation report in the ValidMind Platform\n",
+        "\n",
+        "Next, let's head to the ValidMind Platform to see the template in action:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this \"ValidMind for validation\" series of notebooks.\n",
+        "\n",
+        "3. Click **Validation** under Documents for your model and note:\n",
+        "\n",
+        "    - [x] The risk assessment compliance summary at the top of the report (screenshot below)\n",
+        "    - [x] How the structure of the validation report reflects the previewed template\n",
+        "\n",
+        "    <img src= \"compliance-summary.png\" alt=\"Screenshot showing the risk assessment compliance summary\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
+        "    <br><br>"
+      ],
+      "id": "20717133"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Explore available tests\n",
+        "\n",
+        "Next, let's explore the list of all available tests in the ValidMind Library with [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) — we'll later narrow down the tests we want to run from this list when we learn to run tests."
+      ],
+      "id": "f5d0aaab"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "de6abc2a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ],
+      "id": "dce47e40"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "10272aa9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ],
+      "id": "7a0c3cc2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ],
+      "id": "2dac11d5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this first notebook, you learned how to:\n",
+        "\n",
+        "- [x] Register a record (model) within the ValidMind Platform and assign yourself as the validator\n",
+        "- [x] Install and initialize the ValidMind Library\n",
+        "- [x] Preview the validation report template for your model\n",
+        "- [x] Explore the available tests offered by the ValidMind Library"
+      ],
+      "id": "174d2c8d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Start the validation process\n",
+        "\n",
+        "Now that the ValidMind Library is connected to your model in the ValidMind Platform with the correct template applied, we can go ahead and start the validation process: **[2 — Start the validation process](2-start_validation_process.ipynb)**"
+      ],
+      "id": "d8ffdcf7"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-5d7a1c159e4840fca79011d1c0380725"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}
diff --git a/site/notebooks/EXECUTED/validation/2-start_validation_process.ipynb b/site/notebooks/EXECUTED/validation/2-start_validation_process.ipynb
new file mode 100644
index 0000000000..a0d4440e6c
--- /dev/null
+++ b/site/notebooks/EXECUTED/validation/2-start_validation_process.ipynb
@@ -0,0 +1,896 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# ValidMind for validation 2 — Start the validation process\n",
+        "\n",
+        "Learn how to use ValidMind for your end-to-end validation process with our series of four introductory notebooks. In this second notebook, independently verify the data quality tests performed on the dataset used to train the champion.\n",
+        "\n",
+        "You'll learn how to run relevant validation tests with ValidMind, log the results of those tests to the ValidMind Platform, and insert your logged test results as evidence into your validation report. You'll become familiar with the tests available in ValidMind, as well as how to run them. Running tests during validation is crucial to the effective challenge process, as we want to independently evaluate the evidence and assessments provided by the development team.\n",
+        "\n",
+        "While running our tests in this notebook, we'll focus on:\n",
+        "\n",
+        "- Ensuring that data used for training and testing the champion is of appropriate data quality\n",
+        "- Ensuring that the raw data has been preprocessed appropriately and that the resulting final datasets reflect this\n",
+        "\n",
+        "**For a full list of out-of-the-box tests and descriptions,** use the interactive [ValidMind test sandbox](https://docs.validmind.ai/developer/how-to/test-sandbox.html).\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
+        "<br></br>\n",
+        "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Prerequisites](#toc1__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_1__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "- [Verifying data quality adjustments](#toc4__)    \n",
+        "  - [Identify qualitative tests](#toc4_1__)    \n",
+        "  - [Initialize the ValidMind dataset](#toc4_2__)    \n",
+        "  - [Run data quality tests](#toc4_3__)    \n",
+        "    - [Run tabular data tests](#toc4_3_1__)    \n",
+        "  - [Remove highly correlated features](#toc4_4__)    \n",
+        "- [Documenting test results](#toc5__)    \n",
+        "  - [Configure and run comparison tests](#toc5_1__)    \n",
+        "  - [Log tests with unique identifiers](#toc5_2__)    \n",
+        "  - [Add test results to reporting](#toc5_3__)    \n",
+        "- [Preparing the preprocessed dataset](#toc6__)    \n",
+        "  - [Split the preprocessed dataset](#toc6_1__)    \n",
+        "  - [Initialize the split datasets](#toc6_2__)    \n",
+        "- [In summary](#toc7__)    \n",
+        "- [Next steps](#toc8__)    \n",
+        "  - [Develop potential challenger models](#toc8_1__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Prerequisites\n",
+        "\n",
+        "In order to independently assess the quality of your datasets with this notebook, you'll need to first have:\n",
+        "\n",
+        "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
+        "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
+        "<br></br>\n",
+        "Refer to the first notebook in this series: <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library\n",
+        "\n",
+        "First, let's connect the ValidMind Library to the model we previously registered in the ValidMind Platform:\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Make sure the ValidMind Library is installed\n",
+        "\n",
+        "%pip install -q validmind\n",
+        "\n",
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"validation-report\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "Let's first import the public [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset from Kaggle, which was used to develop the dummy champion.\n",
+        "\n",
+        "We'll use this dataset to review steps that should have been conducted during the initial development and documentation of the champion to ensure that the model was built correctly. By independently performing steps taken by the development team, we can confirm whether the model was built using appropriate and properly processed data.\n",
+        "\n",
+        "In our below example, note that:\n",
+        "\n",
+        "- The target column, `Exited`, has a value of `1` when a customer has churned and `0` otherwise.\n",
+        "- The ValidMind Library provides a wrapper to automatically load the dataset as a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) object. A Pandas DataFrame is a two-dimensional tabular data structure that makes use of rows and columns."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = demo_dataset.load_data()\n",
+        "raw_df.head()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Verifying data quality adjustments\n",
+        "\n",
+        "Let's say that thanks to the documentation submitted by the development team (**Learn more:** [ValidMind for development](https://docs.validmind.ai/developer/validmind-library.html#development)), we know that the sample dataset was first modified before being used to train the champion. After performing some data quality assessments on the raw dataset, it was determined that the dataset required rebalancing, and highly correlated features were also removed."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Identify qualitative tests\n",
+        "\n",
+        "During validation, we use the same data processing logic and training procedure to confirm that the model's results can be reproduced independently, so let's start by doing some data quality assessments by running a few individual tests just like the development team did.\n",
+        "\n",
+        "Use the [`vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) introduced by the first notebook in this series in combination with [`vm.tests.list_tags()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tags) and [`vm.tests.list_tasks()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks) to find which prebuilt tests are relevant for data quality assessment:\n",
+        "\n",
+        "- **`tasks`** represent the kind of modeling task associated with a test. Here we'll focus on `classification` tasks.\n",
+        "- **`tags`** are free-form descriptions providing more details about the test, for example, what category the test falls into. Here we'll focus on the `data_quality` tag."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Get the list of available task types\n",
+        "sorted(vm.tests.list_tasks())"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Get the list of available tags\n",
+        "sorted(vm.tests.list_tags())"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You can pass `tags` and `tasks` as parameters to the `vm.tests.list_tests()` function to filter the tests based on the tags and task types.\n",
+        "\n",
+        "For example, to find tests related to tabular data quality for classification models, you can call `list_tests()` like this:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.tests.list_tests(task=\"classification\", tags=[\"tabular_data\", \"data_quality\"])"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about navigating ValidMind tests?</b></span>\n",
+        "<br></br>\n",
+        "Refer to our notebook outlining the utilities available for viewing and understanding available ValidMind tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind dataset\n",
+        "\n",
+        "With the individual tests we want to run identified, the next step is to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
+        "\n",
+        "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
+        "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# vm_raw_dataset is now a VMDataset object that you can pass to any ValidMind test\n",
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=raw_df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Run data quality tests\n",
+        "\n",
+        "Now that we know how to initialize a ValidMind `dataset` object, we're ready to run some tests!\n",
+        "\n",
+        "You run individual tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module. For the examples below, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`test_id`** — The ID of the test to run, as seen in the `ID` column when you run `list_tests`. \n",
+        "- **`params`** — A dictionary of parameters for the test. These will override any `default_params` set in the test definition. "
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3_1__'></a>\n",
+        "\n",
+        "#### Run tabular data tests\n",
+        "\n",
+        "The inputs expected by a test can also be found in the test definition — let's take `validmind.data_validation.DescriptiveStatistics` as an example.\n",
+        "\n",
+        "Note that the output of the [`describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) below shows that this test expects a `dataset` as input:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.tests.describe_test(\"validmind.data_validation.DescriptiveStatistics\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now, let's run a few tests to assess the quality of the dataset:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "result2 = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.ClassImbalance\",\n",
+        "    inputs={\"dataset\": vm_raw_dataset},\n",
+        "    params={\"min_percent_threshold\": 30},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "The output above shows that the `validmind.data_validation.ClassImbalance` test did not pass according to the value we set for `min_percent_threshold` — great, this matches what was reported by the development team.\n",
+        "\n",
+        "To address this issue, we'll re-run the test on some processed data. In this case let's apply a very simple rebalancing technique to the dataset:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
+        "\n",
+        "# Create a balanced dataset with the same number of exited and not exited customers\n",
+        "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
+        "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
+        "\n",
+        "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
+        "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "With this new balanced dataset, you can re-run the individual test to see if it now passes the class imbalance test requirement.\n",
+        "\n",
+        "As this is technically a different dataset, **remember to first initialize a new ValidMind `Dataset` object** to pass in as input as required by `run_test()`:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
+        "vm_balanced_raw_dataset = vm.init_dataset(\n",
+        "    dataset=balanced_raw_df,\n",
+        "    input_id=\"balanced_raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Pass the initialized `balanced_raw_dataset` as input into the test run\n",
+        "result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.ClassImbalance\",\n",
+        "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
+        "    params={\"min_percent_threshold\": 30},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4__'></a>\n",
+        "\n",
+        "### Remove highly correlated features\n",
+        "\n",
+        "Next, let's also remove highly correlated features from our dataset as outlined by the development team. Removing highly correlated features helps make the model simpler, more stable, and easier to understand.\n",
+        "\n",
+        "You can utilize the output from a ValidMind test for further use — in the example below, we retrieve the list of features with the highest correlation coefficients and use them to reduce the final list of features for modeling.\n",
+        "\n",
+        "First, we'll run `validmind.data_validation.HighPearsonCorrelation` using the `balanced_raw_dataset` we initialized previously as input, unmodified, to establish a baseline for comparison with later runs:\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "The output above shows that the test did not pass according to the value we set for `max_threshold` — as reported and expected.\n",
+        "\n",
+        "`corr_result` is an object of type `TestResult`. We can inspect the result object to see what the test has produced:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "print(type(corr_result))\n",
+        "print(\"Result ID: \", corr_result.result_id)\n",
+        "print(\"Params: \", corr_result.params)\n",
+        "print(\"Passed: \", corr_result.passed)\n",
+        "print(\"Tables: \", corr_result.tables)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's remove the highly correlated features and create a new VM `dataset` object.\n",
+        "\n",
+        "We'll begin by checking out the table in the result and extracting a list of features that failed the test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract table from `corr_result.tables`\n",
+        "features_df = corr_result.tables[0].data\n",
+        "features_df"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract list of features that failed the test\n",
+        "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Next, extract the feature names from the list of strings (example: `(Age, Exited)` > `Age`):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now, it's time to re-initialize the dataset with the highly correlated features removed.\n",
+        "\n",
+        "**Note the use of a different `input_id`.** This allows tracking the inputs used when running each individual test."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Remove the highly correlated features from the dataset\n",
+        "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
+        "\n",
+        "# Re-initialize the dataset object\n",
+        "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
+        "    dataset=balanced_raw_no_age_df,\n",
+        "    input_id=\"raw_dataset_preprocessed\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Re-running the test with the reduced feature set should now pass:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You can also plot the correlation matrix to visualize the new correlation between features:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.PearsonCorrelationMatrix\",\n",
+        "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Documenting test results\n",
+        "\n",
+        "Now that we've done some analysis on two different datasets, we can use ValidMind to easily document why certain things were done to our raw data with testing to support it. Every test result returned by the `run_test()` function has a `.log()` method that can be used to send the test results to the ValidMind Platform.\n",
+        "\n",
+        "When logging validation test results to the platform, you'll need to manually add those results to the desired section of the validation report. To demonstrate how to add test results to your validation report, we'll log our data quality tests and insert the results via the ValidMind Platform."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Configure and run comparison tests\n",
+        "\n",
+        "Below, we'll perform comparison tests between the original raw dataset (`raw_dataset`) and the final preprocessed (`raw_dataset_preprocessed`) dataset, again logging the results to the ValidMind Platform. \n",
+        "\n",
+        "We can specify all the tests we'd like to run in a dictionary called `test_config`, and we'll pass in the following arguments for each test:\n",
+        "\n",
+        "  - **`params`:** Individual test parameters.\n",
+        "  - **`input_grid`:** Individual test inputs to compare. In this case, we'll input our two datasets for comparison.\n",
+        "\n",
+        "**Note here that the `input_grid` expects the `input_id` of the dataset as the value rather than the variable name we specified:**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Individual test config with inputs specified\n",
+        "test_config = {\n",
+        "    \"validmind.data_validation.ClassImbalance\": {\n",
+        "        \"input_grid\": {\"dataset\": [\"raw_dataset\", \"raw_dataset_preprocessed\"]},\n",
+        "        \"params\": {\"min_percent_threshold\": 30}\n",
+        "    },\n",
+        "    \"validmind.data_validation.HighPearsonCorrelation\": {\n",
+        "        \"input_grid\": {\"dataset\": [\"raw_dataset\", \"raw_dataset_preprocessed\"]},\n",
+        "        \"params\": {\"max_threshold\": 0.3}\n",
+        "    },\n",
+        "}"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Then batch run and log our tests in `test_config`:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "for t in test_config:\n",
+        "    print(t)\n",
+        "    try:\n",
+        "        # Check if test has input_grid\n",
+        "        if 'input_grid' in test_config[t]:\n",
+        "            # For tests with input_grid, pass the input_grid configuration\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
+        "        else:\n",
+        "            # Original logic for regular inputs\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
+        "    except Exception as e:\n",
+        "        print(f\"Error running test {t}: {str(e)}\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for some test IDs. </b></span>\n",
+        "<br></br>\n",
+        "That's expected: when we run validation tests, the logged results need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Log tests with unique identifiers\n",
+        "\n",
+        "Next, we'll use the previously initialized `vm_balanced_raw_dataset` (that still has a highly correlated `Age` column) as input to run an individual test, then log the result to the ValidMind Platform.\n",
+        "\n",
+        "When running individual tests, **you can use a custom `result_id` to tag the individual result with a unique identifier:**\n",
+        "\n",
+        "- This `result_id` can be appended to `test_id` with a `:` separator.\n",
+        "- The `balanced_raw_dataset` result identifier will correspond to the `balanced_raw_dataset` input, the dataset that still has the `Age` column."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation:balanced_raw_dataset\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
+        ")\n",
+        "result.log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_3__'></a>\n",
+        "\n",
+        "### Add test results to reporting\n",
+        "\n",
+        "With some test results logged, let's head to the model we connected to at the beginning of this notebook and learn how to insert a test result into our validation report. (**Learn more:** [Assess compliance](https://docs.validmind.ai/guide/validation/assess-compliance.html#link-validator-evidence))\n",
+        "\n",
+        "While the example below focuses on a specific test result, you can follow the same general procedure for your other results:\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
+        "\n",
+        "3. Click on **2.2.1. Data Quality** to expand that section.\n",
+        "\n",
+        "4. Under the Class Imbalance Assessment guideline, click **Evidence** to expand the evidence panel.\n",
+        "\n",
+        "5. Click **Link Evidence**, then select **Validator Evidence**.\n",
+        "\n",
+        "6. Select the Class Imbalance test results we logged: **ValidMind Data Validation Class Imbalance**\n",
+        "\n",
+        "    <img src= \"selecting-class-imbalance-results.png\" alt=\"Screenshot showing the ClassImbalance test selected\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
+        "    <br><br>\n",
+        "\n",
+        "7. Click **Update Linked Evidence** to add the test results to the validation report.\n",
+        "\n",
+        "8. Confirm that the results for the Class Imbalance test you inserted have been correctly added to section **2.2.1. Data Quality** of the report.\n",
+        "\n",
+        "    - Note that these test results are flagged as **Requires Attention** — as they include comparative results from our initial raw dataset.\n",
+        "    - Click **See evidence details** to review the LLM-generated description summarizing the test results, which confirms that our final preprocessed dataset actually passes our test:\n",
+        "\n",
+        "    <img src= \"class-imbalance-results-detail.png\" alt=\"Screenshot showing the ClassImbalance test generated description in the text editor\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
+        "    <br><br>\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>    Here in this text editor, you can make qualitative edits to the draft that ValidMind generated to finalize the test results.</b></span>\n",
+        "<br></br>\n",
+        "Learn more: <a href=\"https://docs.validmind.ai/guide/documentation/work-with-content-blocks.html\" style=\"color: #DE257E;\"><b>Work with content blocks</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Preparing the preprocessed dataset"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Split the preprocessed dataset\n",
+        "\n",
+        "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing.\n",
+        "\n",
+        "To start, let's grab the first few rows from the `balanced_raw_no_age_df` dataset we initialized earlier:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "balanced_raw_no_age_df.head()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Before training the model, we need to encode the categorical features in the dataset:\n",
+        "\n",
+        "- Use the `get_dummies` function from the `pandas` library to one-hot encode the categorical features.\n",
+        "- The categorical features in the dataset are `Geography` and `Gender`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "balanced_raw_no_age_df = pd.get_dummies(\n",
+        "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
+        ")\n",
+        "balanced_raw_no_age_df.head()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Splitting our dataset into training and testing is essential for proper validation testing, as this helps assess how well the model generalizes to unseen data:\n",
+        "\n",
+        "- We start by dividing our `balanced_raw_no_age_df` dataset into training and test subsets using `train_test_split`, with 80% of the data allocated to training (`train_df`) and 20% to testing (`test_df`).\n",
+        "- From each subset, we separate the features (all columns except \"Exited\") into `X_train` and `X_test`, and the target column (\"Exited\") into `y_train` and `y_test`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from sklearn.model_selection import train_test_split\n",
+        "\n",
+        "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
+        "\n",
+        "X_train = train_df.drop(\"Exited\", axis=1)\n",
+        "y_train = train_df[\"Exited\"]\n",
+        "X_test = test_df.drop(\"Exited\", axis=1)\n",
+        "y_test = test_df[\"Exited\"]"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Initialize the split datasets\n",
+        "\n",
+        "Next, let's initialize the training and testing datasets so they are available for use:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset_final\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset_final\",\n",
+        "    dataset=test_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this second notebook, you learned how to:\n",
+        "\n",
+        "- [x] Import a sample dataset\n",
+        "- [x] Identify which tests you might want to run with ValidMind\n",
+        "- [x] Initialize ValidMind datasets\n",
+        "- [x] Run individual tests\n",
+        "- [x] Utilize the output from tests you’ve run\n",
+        "- [x] Log test results as evidence to the ValidMind Platform\n",
+        "- [x] Insert test results into your validation report"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "<a id='toc8_1__'></a>\n",
+        "\n",
+        "### Develop potential challenger models\n",
+        "\n",
+        "Now that you're familiar with the basics of using the ValidMind Library, let's use it to develop a challenger model: **[3 — Developing a potential challenger](3-developing_potential_challenger.ipynb)**"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-5715327492f24f8fadeab186aecb10ba",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
+}
diff --git a/site/notebooks/EXECUTED/validation/3-developing_potential_challenger.ipynb b/site/notebooks/EXECUTED/validation/3-developing_potential_challenger.ipynb
new file mode 100644
index 0000000000..2ed29a195f
--- /dev/null
+++ b/site/notebooks/EXECUTED/validation/3-developing_potential_challenger.ipynb
@@ -0,0 +1,889 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# ValidMind for validation 3 — Developing a potential challenger\n",
+        "\n",
+        "Learn how to use ValidMind for your end-to-end validation process with our series of four introductory notebooks. In this third notebook, develop a potential challenger and then pass your challenger and its predictions to ValidMind.\n",
+        "\n",
+        "A *challenger* is an alternate record (model) that attempts to outperform the champion, ensuring that the best performing fit-for-purpose record is always considered for deployment. Challengers also help avoid over-reliance on a single record, and allow testing of new features, algorithms, or data sources without disrupting the production lifecycle.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
+        "<br></br>\n",
+        "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Prerequisites](#toc1__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_1__)    \n",
+        "  - [Import the sample dataset](#toc2_2__)    \n",
+        "    - [Preprocess the dataset](#toc2_2_1__)    \n",
+        "  - [Split the preprocessed dataset](#toc2_3__)    \n",
+        "- [Import the champion model](#toc3__)    \n",
+        "- [Training a potential challenger model](#toc4__)    \n",
+        "  - [Random forest classification model](#toc4_1__)    \n",
+        "  - [Initialize the ValidMind models](#toc4_2__)    \n",
+        "  - [Assign predictions](#toc4_3__)    \n",
+        "- [Running model evaluation tests](#toc5__)    \n",
+        "  - [Run model performance tests](#toc5_1__)    \n",
+        "    - [Evaluate performance of the champion model](#toc5_1_1__)    \n",
+        "    - [Log an artifact](#toc5_1_2__)    \n",
+        "    - [Evaluate performance of challenger model](#toc5_1_3__)    \n",
+        "  - [Run diagnostic tests](#toc5_2__)    \n",
+        "  - [Run feature importance tests](#toc5_3__)    \n",
+        "- [In summary](#toc6__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Finalize validation and reporting](#toc7_1__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Prerequisites\n",
+        "\n",
+        "In order to develop potential challengers with this notebook, you'll need to first have:\n",
+        "\n",
+        "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
+        "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
+        "- [x] Learned how to import and initialize datasets for use with ValidMind\n",
+        "- [x] Understood the basics of how to run and log tests with ValidMind\n",
+        "- [x] Run data quality tests on the datasets used to train the champion, and logged the results of those tests to ValidMind\n",
+        "- [x] Inserted your logged test results into your validation report\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
+        "<br></br>\n",
+        "Refer to the first two notebooks in this series:\n",
+        "\n",
+        "- <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a>\n",
+        "- <a href=\"2-start_validation_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the validation process</b></a>\n",
+        "\n",
+        "</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up\n",
+        "\n",
+        "This section should be quite familiar to you — as we performed the same actions in the previous notebook, **[2 — Start the validation process](2-start_validation_process.ipynb)**."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library\n",
+        "\n",
+        "As usual, let's first connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Make sure the ValidMind Library is installed\n",
+        "\n",
+        "%pip install -q validmind\n",
+        "\n",
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"validation-report\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Import the sample dataset\n",
+        "\n",
+        "Next, we'll load in the sample [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset used to develop the champion that we will independently preprocess:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Load the sample dataset\n",
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = demo_dataset.load_data()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Preprocess the dataset\n",
+        "\n",
+        "We’ll apply a simple rebalancing technique to the dataset before continuing:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
+        "\n",
+        "# Create a balanced dataset with the same number of exited and not exited customers\n",
+        "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
+        "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
+        "\n",
+        "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
+        "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let’s also quickly remove highly correlated features from the dataset using the output from a ValidMind test.\n",
+        "\n",
+        "As you know, before we can run tests you’ll need to initialize a ValidMind dataset object with the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
+        "vm_balanced_raw_dataset = vm.init_dataset(\n",
+        "    dataset=balanced_raw_df,\n",
+        "    input_id=\"balanced_raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "With our balanced dataset initialized, we can then run our test and utilize the output to help us identify the features we want to remove:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Run HighPearsonCorrelation test with our balanced dataset as input and return a result object\n",
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# From result object, extract table from `corr_result.tables`\n",
+        "features_df = corr_result.tables[0].data\n",
+        "features_df"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract list of features that failed the test\n",
+        "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract feature names from the list of strings\n",
+        "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We can then re-initialize the dataset with a different `input_id` and the highly correlated features removed and re-run the test for confirmation:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Remove the highly correlated features from the dataset\n",
+        "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
+        "\n",
+        "# Re-initialize the dataset object\n",
+        "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
+        "    dataset=balanced_raw_no_age_df,\n",
+        "    input_id=\"raw_dataset_preprocessed\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Re-run the test with the reduced feature set\n",
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Split the preprocessed dataset\n",
+        "\n",
+        "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Encode categorical features in the dataset\n",
+        "balanced_raw_no_age_df = pd.get_dummies(\n",
+        "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
+        ")\n",
+        "balanced_raw_no_age_df.head()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from sklearn.model_selection import train_test_split\n",
+        "\n",
+        "# Split the dataset into train and test\n",
+        "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
+        "\n",
+        "X_train = train_df.drop(\"Exited\", axis=1)\n",
+        "y_train = train_df[\"Exited\"]\n",
+        "X_test = test_df.drop(\"Exited\", axis=1)\n",
+        "y_test = test_df[\"Exited\"]"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the split datasets\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset_final\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset_final\",\n",
+        "    dataset=test_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Import the champion model\n",
+        "\n",
+        "With our raw dataset assessed and preprocessed, let's go ahead and import the champion submitted by the development team in the format of a `.pkl` file: **[lr_model_champion.pkl](lr_model_champion.pkl)**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Import the champion model\n",
+        "import pickle as pkl\n",
+        "\n",
+        "with open(\"lr_model_champion.pkl\", \"rb\") as f:\n",
+        "    log_reg = pkl.load(f)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Training a potential challenger model\n",
+        "\n",
+        "We're curious how an alternate model compares to our champion, so let's train a challenger as a basis for our testing.\n",
+        "\n",
+        "Our champion *logistic regression model* is a simpler, parametric model that assumes a linear relationship between the independent variables and the log-odds of the outcome. While logistic regression may not capture complex patterns as effectively, it offers a high degree of interpretability and is easier to explain to stakeholders. However, risk is not calculated in isolation from a single factor, but rather in consideration with trade-offs in predictive performance, ease of interpretability, and overall alignment with business objectives."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Random forest classification model\n",
+        "\n",
+        "A *random forest classification model* is an ensemble machine learning algorithm that uses multiple decision trees to classify data. In ensemble learning, multiple models are combined to improve prediction accuracy and robustness.\n",
+        "\n",
+        "Random forest classification models generally have higher accuracy because they capture complex, non-linear relationships, but as a result they lack transparency in their predictions."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Import the Random Forest Classification model\n",
+        "from sklearn.ensemble import RandomForestClassifier\n",
+        "\n",
+        "# Create the model instance with 50 decision trees\n",
+        "rf_model = RandomForestClassifier(\n",
+        "    n_estimators=50,\n",
+        "    random_state=42,\n",
+        ")\n",
+        "\n",
+        "# Train the model\n",
+        "rf_model.fit(X_train, y_train)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind models\n",
+        "\n",
+        "In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our two models.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model objects with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the champion logistic regression model\n",
+        "vm_log_model = vm.init_model(\n",
+        "    log_reg,\n",
+        "    input_id=\"log_model_champion\",\n",
+        ")\n",
+        "\n",
+        "# Initialize the challenger random forest classification model\n",
+        "vm_rf_model = vm.init_model(\n",
+        "    rf_model,\n",
+        "    input_id=\"rf_model\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Assign predictions\n",
+        "\n",
+        "With our models registered, we'll move on to assigning both the predictive probabilities coming directly from each model's predictions, and the binary prediction after applying the cutoff threshold described in the Compute binary predictions step above.\n",
+        "\n",
+        "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
+        "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
+        "\n",
+        "If no prediction values are passed, the method will compute predictions automatically:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Champion — Logistic regression model\n",
+        "vm_train_ds.assign_predictions(model=vm_log_model)\n",
+        "vm_test_ds.assign_predictions(model=vm_log_model)\n",
+        "\n",
+        "# Challenger — Random forest classification model\n",
+        "vm_train_ds.assign_predictions(model=vm_rf_model)\n",
+        "vm_test_ds.assign_predictions(model=vm_rf_model)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Running model evaluation tests\n",
+        "\n",
+        "With our setup complete, let's run the rest of our validation tests. Since we have already verified the data quality of the dataset used to train our champion, we will now focus on comprehensive performance evaluations of both the champion and challenger models."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Run model performance tests\n",
+        "\n",
+        "Let's run some performance tests, beginning with independent testing of our champion logistic regression model, then moving on to our potential challenger model.\n",
+        "\n",
+        "Use [`vm.tests.list_tests()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to identify all the model performance tests for classification:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "\n",
+        "vm.tests.list_tests(tags=[\"model_performance\"], task=\"classification\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We'll isolate the specific tests we want to run in `mpt`:\n",
+        "\n",
+        "- `model_validation.sklearn.ClassifierPerformance`\n",
+        "- `model_validation.sklearn.ConfusionMatrix`\n",
+        "- `model_validation.sklearn.MinimumAccuracy`\n",
+        "- `model_validation.sklearn.MinimumF1Score`\n",
+        "- `model_validation.sklearn.ROCCurve`\n",
+        "\n",
+        "As we learned in the previous notebook [2 — Start the validation process](2-start_validation_process.ipynb), you can use a custom `result_id` to tag the individual result with a unique identifier by appending this `result_id` to the `test_id` with a `:` separator. We'll append an identifier for our champion model here:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "mpt = [\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:logreg_champion\",\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix:logreg_champion\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy:logreg_champion\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score:logreg_champion\",\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve:logreg_champion\"\n",
+        "]"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_1__'></a>\n",
+        "\n",
+        "#### Evaluate performance of the champion model\n",
+        "\n",
+        "Now, let's run and log our batch of model performance tests using our testing dataset (`vm_test_ds`) for our champion model:\n",
+        "\n",
+        "- The test set serves as a proxy for real-world data, providing an unbiased estimate of model performance since it was not used during training or tuning.\n",
+        "- The test set also acts as protection against selection bias and model tweaking, giving a final, more unbiased checkpoint."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "for test in mpt:\n",
+        "    vm.tests.run_test(\n",
+        "        test,\n",
+        "        inputs={\n",
+        "            \"dataset\": vm_test_ds, \"model\" : vm_log_model,\n",
+        "        },\n",
+        "    ).log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for some test IDs. </b></span>\n",
+        "<br></br>\n",
+        "That's expected, as when we run validation tests the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_2__'></a>\n",
+        "\n",
+        "#### Log an artifact\n",
+        "\n",
+        "As we can observe from the output above, our champion doesn't pass the `MinimumAccuracy` test based on the default thresholds of the out-of-the-box test, so let's log an artifact (finding) in the ValidMind Platform (**Learn more:** [Add and manage artifacts](https://docs.validmind.ai/guide/validation/add-manage-artifacts.html)):\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
+        "\n",
+        "3. Click on **2.2.2. Model Performance** to expand that section.\n",
+        "\n",
+        "4. Under the Model Performance Metrics guideline, click to expand the **Artifacts** panel.\n",
+        "\n",
+        "5. Click **Link Artifact** and select **Validation Issue** as the type of artifact.\n",
+        "\n",
+        "6. Click **+ Add Validation Issue** and enter in the details for your validation issue, for example:\n",
+        "\n",
+        "    - **TITLE** — Champion Logistic Regression Model Fails Minimum Accuracy Threshold\n",
+        "    - **RISK AREA** — Model Performance\n",
+        "    - **DOCUMENTATION SECTION** — 3.2. Model Evaluation\n",
+        "    - **DESCRIPTION** — The logistic regression champion model was subjected to a Minimum Accuracy test to determine whether its predictive accuracy meets the predefined performance threshold of 0.7. The model achieved an accuracy score of 0.6136, which falls below the required minimum. As a result, the test produced a Fail outcome.\n",
+        "\n",
+        "7. Click **Add Validation Issue** to submit the validation issue.\n",
+        "\n",
+        "8. Select the validation issue you just added to link to your validation report.\n",
+        "\n",
+        "9. Click **Update Linked Artifacts** to insert your validation issue.\n",
+        "\n",
+        "10. Confirm that the validation issue you inserted has been correctly inserted into section 2.2.2. Model Performance of the report.\n",
+        "\n",
+        "11. Click on the validation issue to expand the issue, where you can adjust details such as severity, owner, due date, status, etc. as well as include proposed remediation plans or supporting documentation as attachments."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_3__'></a>\n",
+        "\n",
+        "#### Evaluate performance of challenger model\n",
+        "\n",
+        "We've now conducted similar tests as the development team for our champion, with the aim of verifying their test results.\n",
+        "\n",
+        "Next, let's see how our challenger compares. We'll use the same batch of tests here as we did in `mpt`, but append a different `result_id` to indicate that these results should be associated with our challenger:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "mpt_chall = [\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:champion_vs_challenger\",\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix:champion_vs_challenger\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy:champion_vs_challenger\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score:champion_vs_challenger\",\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve:champion_vs_challenger\"\n",
+        "]"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We'll run each test once for each model with the same `vm_test_ds` dataset to compare them:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "for test in mpt_chall:\n",
+        "    vm.tests.run_test(\n",
+        "        test,\n",
+        "        input_grid={\n",
+        "            \"dataset\": [vm_test_ds], \"model\" : [vm_log_model,vm_rf_model]\n",
+        "        }\n",
+        "    ).log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Based on the performance metrics, our challenger random forest classification model passes the <code>MinimumAccuracy</code> where our champion did not.</b></span>\n",
+        "<br></br>\n",
+        "In your validation report, support your recommendation in your validation issue's <b>Proposed Remediation Plan</b> to investigate the usage of our challenger by inserting the performance tests we logged with this notebook into the appropriate section.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Run diagnostic tests\n",
+        "\n",
+        "Next, we want to inspect the robustness and stability testing comparison between our champion and challenger.\n",
+        "\n",
+        "Use `list_tests()` to list all available diagnosis tests applicable to classification tasks:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.tests.list_tests(tags=[\"model_diagnosis\"], task=\"classification\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let’s now assess the models for potential signs of *overfitting* and identify any sub-segments where performance may be inconsistent with the `model_validation.sklearn.OverfitDiagnosis` test.\n",
+        "\n",
+        "Overfitting occurs when a model learns the training data too well, capturing not only the true pattern but also noise and random fluctuations, resulting in excellent performance on the training dataset but poor generalization to new, unseen data:\n",
+        "\n",
+        "- Since the training dataset (`vm_train_ds`) was used to fit the model, we use this set to establish a baseline performance for how well the model performs on data it has already seen.\n",
+        "- The testing dataset (`vm_test_ds`) was never seen during training, and here simulates real-world generalization, or how well the model performs on new, unseen data. "
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.model_validation.sklearn.OverfitDiagnosis:champion_vs_challenger\",\n",
+        "    input_grid={\n",
+        "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
+        "        \"model\" : [vm_log_model,vm_rf_model]\n",
+        "    }\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's also conduct *robustness* and *stability* testing of the two models with the `model_validation.sklearn.RobustnessDiagnosis` test.\n",
+        "\n",
+        "Robustness refers to a model's ability to maintain consistent performance, and stability refers to a model's ability to produce consistent outputs over time across different data subsets.\n",
+        "\n",
+        "Again, we'll use both the training and testing datasets to establish baseline performance and to simulate real-world generalization:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.model_validation.sklearn.RobustnessDiagnosis:Champion_vs_LogRegression\",\n",
+        "    input_grid={\n",
+        "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
+        "        \"model\" : [vm_log_model,vm_rf_model]\n",
+        "    },\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_3__'></a>\n",
+        "\n",
+        "### Run feature importance tests\n",
+        "\n",
+        "We also want to verify the relative influence of different input features on our models' predictions, as well as inspect the differences between our champion and challenger to see if a certain model offers more understandable or logical importance scores for features.\n",
+        "\n",
+        "Use `list_tests()` to identify all the feature importance tests for classification:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Store the feature importance tests\n",
+        "FI = vm.tests.list_tests(tags=[\"feature_importance\"], task=\"classification\",pretty=False)\n",
+        "FI"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We'll only use our testing dataset (`vm_test_ds`) here, to provide a realistic, unseen sample that mimics future or production data, as the training dataset has already influenced our model during learning:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Run and log our feature importance tests for both models for the testing dataset\n",
+        "for test in FI:\n",
+        "    vm.tests.run_test(\n",
+        "        \"\".join((test,':champion_vs_challenger')),\n",
+        "        input_grid={\n",
+        "            \"dataset\": [vm_test_ds], \"model\" : [vm_log_model,vm_rf_model]\n",
+        "        },\n",
+        "    ).log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this third notebook, you learned how to:\n",
+        "\n",
+        "- [x] Initialize ValidMind model objects\n",
+        "- [x] Assign predictions and probabilities to your ValidMind model objects\n",
+        "- [x] Use tests from ValidMind to evaluate the potential of models, including comparative tests between champion and challengers\n",
+        "- [x] Log an artifact in the ValidMind Platform"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Finalize validation and reporting\n",
+        "\n",
+        "Now that you're familiar with the basics of using the ValidMind Library to run and log validation tests, let's learn how to implement some custom tests and wrap up our validation: **[4 — Finalize validation and reporting](4-finalize_validation_reporting.ipynb)**"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-910d55973ae44bb1a1cd609d39ae5ca8",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
+}
diff --git a/site/notebooks/EXECUTED/validation/4-finalize_validation_reporting.ipynb b/site/notebooks/EXECUTED/validation/4-finalize_validation_reporting.ipynb
new file mode 100644
index 0000000000..32d46c6e2d
--- /dev/null
+++ b/site/notebooks/EXECUTED/validation/4-finalize_validation_reporting.ipynb
@@ -0,0 +1,1235 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# ValidMind for validation 4 — Finalize validation and reporting\n",
+        "\n",
+        "Learn how to use ValidMind for your end-to-end validation process with our series of four introductory notebooks. In this last notebook, finalize the compliance assessment process and have a complete validation report ready for review.\n",
+        "\n",
+        "This notebook will walk you through how to supplement ValidMind tests with your own custom tests and include them as additional evidence in your validation report. A custom test is any function that takes a set of inputs and parameters as arguments and returns one or more outputs:\n",
+        "\n",
+        "- The function can be as simple or as complex as you need it to be — it can use external libraries, make API calls, or do anything else that you can do in Python.\n",
+        "- The only requirement is that the function signature and return values can be \"understood\" and handled by the ValidMind Library. As such, custom tests offer added flexibility by extending the default tests provided by ValidMind, enabling you to document any type of record (model) or use case.\n",
+        "\n",
+        "**For a more in-depth introduction to custom tests,** refer to our [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb) notebook.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
+        "<br></br>\n",
+        "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Prerequisites](#toc1__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_1__)    \n",
+        "  - [Import the sample dataset](#toc2_2__)    \n",
+        "  - [Split the preprocessed dataset](#toc2_3__)    \n",
+        "  - [Import the champion model](#toc2_4__)    \n",
+        "  - [Train potential challenger model](#toc2_5__)    \n",
+        "  - [Initialize the ValidMind models](#toc2_6__)    \n",
+        "- [Implementing custom tests](#toc3__)    \n",
+        "  - [Implement a custom inline test](#toc3_1__)    \n",
+        "    - [Create a confusion matrix plot](#toc3_1_1__)    \n",
+        "    - [Add parameters to custom tests](#toc3_1_2__)    \n",
+        "    - [Pass parameters to custom tests](#toc3_1_3__)    \n",
+        "  - [Use external test providers](#toc3_2__)    \n",
+        "    - [Create custom tests folder](#toc3_2_1__)    \n",
+        "    - [Save an inline test](#toc3_2_2__)    \n",
+        "    - [Register a local test provider](#toc3_2_3__)    \n",
+        "- [Verify test runs](#toc4__)    \n",
+        "- [In summary](#toc5__)    \n",
+        "- [Next steps](#toc6__)    \n",
+        "  - [Work with your validation report](#toc6_1__)    \n",
+        "  - [Learn more](#toc6_2__)    \n",
+        "    - [Use cases](#toc6_2_1__)    \n",
+        "    - [Discover more learning resources](#toc6_2_2__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Prerequisites\n",
+        "\n",
+        "In order to finalize validation and reporting, you'll need to first have:\n",
+        "\n",
+        "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
+        "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
+        "- [x] Learned how to import and initialize datasets and models for use with ValidMind\n",
+        "- [x] Understood the basics of how to identify and run validation tests\n",
+        "- [x] Run validation tests for your champion and challengers, and logged the results of those tests to the ValidMind Platform\n",
+        "- [x] Inserted your logged test results into your validation report\n",
+        "- [x] Added some preliminary artifacts (findings) to your validation report\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
+        "<br></br>\n",
+        "Refer to the first three notebooks in this series:\n",
+        "\n",
+        "- <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a>\n",
+        "- <a href=\"2-start_validation_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the validation process</b></a>\n",
+        "- <a href=\"3-developing_potential_challenger.ipynb\" style=\"color: #DE257E;\"><b>3 — Developing a potential challenger</b></a>\n",
+        "\n",
+        "</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up\n",
+        "\n",
+        "This section should be very familiar to you now — as we performed the same actions in the previous two notebooks in this series."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library\n",
+        "\n",
+        "As usual, let's first connect up the ValidMind Library to the model we previously registered in the ValidMind Platform:\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Make sure the ValidMind Library is installed\n",
+        "\n",
+        "%pip install -q validmind\n",
+        "\n",
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"validation-report\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Import the sample dataset\n",
+        "\n",
+        "Next, we'll load in the same sample [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset used to develop the champion that we will independently preprocess:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Load the sample dataset\n",
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = demo_dataset.load_data()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the raw dataset for use in ValidMind tests\n",
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=raw_df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
+        "\n",
+        "# Create a balanced dataset with the same number of exited and not exited customers\n",
+        "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
+        "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
+        "\n",
+        "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
+        "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let’s also quickly remove highly correlated features from the dataset using the output from a ValidMind test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
+        "vm_balanced_raw_dataset = vm.init_dataset(\n",
+        "    dataset=balanced_raw_df,\n",
+        "    input_id=\"balanced_raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Run HighPearsonCorrelation test with our balanced dataset as input and return a result object\n",
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# From result object, extract table from `corr_result.tables`\n",
+        "features_df = corr_result.tables[0].data\n",
+        "features_df"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract list of features that failed the test\n",
+        "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract feature names from the list of strings\n",
+        "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Remove the highly correlated features from the dataset\n",
+        "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
+        "\n",
+        "# Re-initialize the dataset object\n",
+        "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
+        "    dataset=balanced_raw_no_age_df,\n",
+        "    input_id=\"raw_dataset_preprocessed\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Re-run the test with the reduced feature set\n",
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Split the preprocessed dataset\n",
+        "\n",
+        "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Encode categorical features in the dataset\n",
+        "balanced_raw_no_age_df = pd.get_dummies(\n",
+        "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
+        ")\n",
+        "balanced_raw_no_age_df.head()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from sklearn.model_selection import train_test_split\n",
+        "\n",
+        "# Split the dataset into train and test\n",
+        "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
+        "\n",
+        "X_train = train_df.drop(\"Exited\", axis=1)\n",
+        "y_train = train_df[\"Exited\"]\n",
+        "X_test = test_df.drop(\"Exited\", axis=1)\n",
+        "y_test = test_df[\"Exited\"]"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the split datasets\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset_final\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset_final\",\n",
+        "    dataset=test_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Import the champion model\n",
+        "\n",
+        "With our raw dataset assessed and preprocessed, let's go ahead and import the champion submitted by the development team in the format of a `.pkl` file: **[lr_model_champion.pkl](lr_model_champion.pkl)**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Import the champion model\n",
+        "import pickle as pkl\n",
+        "\n",
+        "with open(\"lr_model_champion.pkl\", \"rb\") as f:\n",
+        "    log_reg = pkl.load(f)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_5__'></a>\n",
+        "\n",
+        "### Train potential challenger model\n",
+        "\n",
+        "We'll also train our random forest classification challenger to see how it compares:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Import the Random Forest Classification model\n",
+        "from sklearn.ensemble import RandomForestClassifier\n",
+        "\n",
+        "# Create the model instance with 50 decision trees\n",
+        "rf_model = RandomForestClassifier(\n",
+        "    n_estimators=50,\n",
+        "    random_state=42,\n",
+        ")\n",
+        "\n",
+        "# Train the model\n",
+        "rf_model.fit(X_train, y_train)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_6__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind models\n",
+        "\n",
+        "In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our two models:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the champion logistic regression model\n",
+        "vm_log_model = vm.init_model(\n",
+        "    log_reg,\n",
+        "    input_id=\"log_model_champion\",\n",
+        ")\n",
+        "\n",
+        "# Initialize the challenger random forest classification model\n",
+        "vm_rf_model = vm.init_model(\n",
+        "    rf_model,\n",
+        "    input_id=\"rf_model\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Assign predictions to Champion — Logistic regression model\n",
+        "vm_train_ds.assign_predictions(model=vm_log_model)\n",
+        "vm_test_ds.assign_predictions(model=vm_log_model)\n",
+        "\n",
+        "# Assign predictions to Challenger — Random forest classification model\n",
+        "vm_train_ds.assign_predictions(model=vm_rf_model)\n",
+        "vm_test_ds.assign_predictions(model=vm_rf_model)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Implementing custom tests\n",
+        "\n",
+        "Thanks to the documentation (**Learn more:** [ValidMind for development](https://docs.validmind.ai/developer/validmind-library.html#development)), we know that the development team implemented a custom test to further evaluate the performance of the champion.\n",
+        "\n",
+        "In a usual validation situation, you would load a saved custom test provided by the development team. In the following section, we'll have you implement the same custom test and make it available for reuse, to familiarize you with the processes.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about custom tests?</b></span>\n",
+        "<br></br>\n",
+        "Refer to our in-depth introduction to custom tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/implement_custom_tests.html\" style=\"color: #DE257E;\"><b>Implement custom tests</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Implement a custom inline test\n",
+        "\n",
+        "Let's implement the same custom *inline test* that calculates the confusion matrix for a binary classification model that the development team used in their performance evaluations.\n",
+        "\n",
+        "- An inline test refers to a test written and executed within the same environment as the code being tested — in this case, right in this Jupyter Notebook —  without requiring a separate test file or framework.\n",
+        "- You'll note that the custom test function is just a regular Python function that can include and require any Python library as you see fit."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_1__'></a>\n",
+        "\n",
+        "#### Create a confusion matrix plot\n",
+        "\n",
+        "Let's first create a confusion matrix plot using the `confusion_matrix` function from the `sklearn.metrics` module:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import matplotlib.pyplot as plt\n",
+        "from sklearn import metrics\n",
+        "\n",
+        "# Get the predicted classes\n",
+        "y_pred = log_reg.predict(vm_test_ds.x)\n",
+        "\n",
+        "confusion_matrix = metrics.confusion_matrix(y_test, y_pred)\n",
+        "\n",
+        "cm_display = metrics.ConfusionMatrixDisplay(\n",
+        "    confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
+        ")\n",
+        "cm_display.plot()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Next, create a [`@vm.test` wrapper](https://docs.validmind.ai/validmind/validmind.html#test) that will allow you to create a reusable test. **Note the following changes in the code below:**\n",
+        "\n",
+        "- The function `confusion_matrix` takes two arguments, `dataset` and `model`. These are a `VMDataset` and a `VMModel` object, respectively.\n",
+        "  - `VMDataset` objects allow you to access the dataset's true (target) values by accessing the `.y` attribute.\n",
+        "  - `VMDataset` objects allow you to access the predictions for a given record (model) by accessing the `.y_pred()` method.\n",
+        "- The function docstring provides a description of what the test does. This will be displayed along with the result in this notebook as well as in the ValidMind Platform.\n",
+        "- The function body calculates the confusion matrix using the `sklearn.metrics.confusion_matrix` function as we just did above.\n",
+        "- The function then returns the `ConfusionMatrixDisplay.figure_` object — this is important as the ValidMind Library expects the output of the custom test to be a plot or a table.\n",
+        "- The `@vm.test` decorator is doing the work of creating a wrapper around the function that will allow it to be run by the ValidMind Library. It also registers the test so it can be found by the ID `my_custom_tests.ConfusionMatrix`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
+        "def confusion_matrix(dataset, model):\n",
+        "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
+        "\n",
+        "    The confusion matrix is a 2x2 table that contains 4 values:\n",
+        "\n",
+        "    - True Positive (TP): the number of correct positive predictions\n",
+        "    - True Negative (TN): the number of correct negative predictions\n",
+        "    - False Positive (FP): the number of incorrect positive predictions\n",
+        "    - False Negative (FN): the number of incorrect negative predictions\n",
+        "\n",
+        "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
+        "    \"\"\"\n",
+        "    y_true = dataset.y\n",
+        "    y_pred = dataset.y_pred(model=model)\n",
+        "\n",
+        "    confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
+        "\n",
+        "    cm_display = metrics.ConfusionMatrixDisplay(\n",
+        "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
+        "    )\n",
+        "    cm_display.plot()\n",
+        "\n",
+        "    plt.close()  # close the plot to avoid displaying it\n",
+        "\n",
+        "    return cm_display.figure_  # return the figure object itself"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You can now run the newly created custom test on both the training and test datasets for both models using the [`run_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Champion train and test\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_custom_tests.ConfusionMatrix:champion\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds,vm_test_ds],\n",
+        "        \"model\" : [vm_log_model]\n",
+        "    }\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Challenger train and test\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_custom_tests.ConfusionMatrix:challenger\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds,vm_test_ds],\n",
+        "        \"model\" : [vm_rf_model]\n",
+        "    }\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for some test IDs. </b></span>\n",
+        "<br></br>\n",
+        "That's expected, as when we run validation tests the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_2__'></a>\n",
+        "\n",
+        "#### Add parameters to custom tests\n",
+        "\n",
+        "Custom tests can take parameters just like any other function. To demonstrate, let's modify the `confusion_matrix` function to take an additional parameter `normalize` that will allow you to normalize the confusion matrix:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
+        "def confusion_matrix(dataset, model, normalize=False):\n",
+        "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
+        "\n",
+        "    The confusion matrix is a 2x2 table that contains 4 values:\n",
+        "\n",
+        "    - True Positive (TP): the number of correct positive predictions\n",
+        "    - True Negative (TN): the number of correct negative predictions\n",
+        "    - False Positive (FP): the number of incorrect positive predictions\n",
+        "    - False Negative (FN): the number of incorrect negative predictions\n",
+        "\n",
+        "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
+        "    \"\"\"\n",
+        "    y_true = dataset.y\n",
+        "    y_pred = dataset.y_pred(model=model)\n",
+        "\n",
+        "    if normalize:\n",
+        "        confusion_matrix = metrics.confusion_matrix(y_true, y_pred, normalize=\"all\")\n",
+        "    else:\n",
+        "        confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
+        "\n",
+        "    cm_display = metrics.ConfusionMatrixDisplay(\n",
+        "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
+        "    )\n",
+        "    cm_display.plot()\n",
+        "\n",
+        "    plt.close()  # close the plot to avoid displaying it\n",
+        "\n",
+        "    return cm_display.figure_  # return the figure object itself"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_3__'></a>\n",
+        "\n",
+        "#### Pass parameters to custom tests\n",
+        "\n",
+        "You can pass parameters to custom tests by providing a dictionary of parameters to the `run_test()` function.\n",
+        "\n",
+        "- The parameters will override any default parameters set in the custom test definition. Note that `dataset` and `model` are still passed as `inputs`.\n",
+        "- Since these are `VMDataset` or `VMModel` inputs, they have a special meaning.\n",
+        "\n",
+        "Re-running and logging the custom confusion matrix with `normalize=True` for both models and our testing dataset looks like this:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Champion with test dataset and normalize=True\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_custom_tests.ConfusionMatrix:test_normalized_champion\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\" : [vm_log_model]\n",
+        "    },\n",
+        "    params={\"normalize\": True}\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Challenger with test dataset and normalize=True\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_custom_tests.ConfusionMatrix:test_normalized_challenger\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\" : [vm_rf_model]\n",
+        "    },\n",
+        "    params={\"normalize\": True}\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Use external test providers\n",
+        "\n",
+        "Sometimes you may want to reuse the same set of custom tests across multiple records (models) and share them with others in your organization, as the development team would have done with you in the example workflow featured in this series of notebooks. In this case, you can create an external custom *test provider* that will allow you to load custom tests from a local folder or a Git repository.\n",
+        "\n",
+        "In this section you will learn how to declare a local filesystem test provider that allows loading tests from a local folder following these high level steps:\n",
+        "\n",
+        "1. Create a folder of custom tests from existing inline tests (tests that exist in your active Jupyter Notebook)\n",
+        "2. Save an inline test to a file\n",
+        "3. Define and register a [`LocalTestProvider`](https://docs.validmind.ai/validmind/validmind/tests.html#LocalTestProvider) that points to that folder\n",
+        "4. Run test provider tests\n",
+        "5. Add the test results to your documentation"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_1__'></a>\n",
+        "\n",
+        "#### Create custom tests folder\n",
+        "\n",
+        "Let's start by creating a new folder that will contain reusable custom tests from your existing inline tests.\n",
+        "\n",
+        "The following code snippet will create a new `my_tests` directory in the current working directory if it doesn't exist:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "tests_folder = \"my_tests\"\n",
+        "\n",
+        "import os\n",
+        "\n",
+        "# create tests folder\n",
+        "os.makedirs(tests_folder, exist_ok=True)\n",
+        "\n",
+        "# remove existing tests\n",
+        "for f in os.listdir(tests_folder):\n",
+        "    # remove files and pycache\n",
+        "    if f.endswith(\".py\") or f == \"__pycache__\":\n",
+        "        os.system(f\"rm -rf {tests_folder}/{f}\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "After running the command above, confirm that a new `my_tests` directory was created successfully. For example:\n",
+        "\n",
+        "```\n",
+        "~/notebooks/tutorials/validation/my_tests/\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_2__'></a>\n",
+        "\n",
+        "#### Save an inline test\n",
+        "\n",
+        "The `@vm.test` decorator we used in **Implement a custom inline test** above to register one-off custom tests also includes a convenience method on the function object that allows you to simply call `<func_name>.save()` to save the test to a Python file at a specified path.\n",
+        "\n",
+        "While `save()` will get you started by creating the file and saving the function code with the correct name, it won't automatically include any imports, or other functions or variables, outside of the functions that are needed for the test to run. To solve this, pass in an optional `imports` argument ensuring necessary imports are added to the file.\n",
+        "\n",
+        "The `confusion_matrix` test requires the following additional imports:\n",
+        "\n",
+        "```python\n",
+        "import matplotlib.pyplot as plt\n",
+        "from sklearn import metrics\n",
+        "```\n",
+        "\n",
+        "Let's pass these imports to the `save()` method to ensure they are included in the file with the following command:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "confusion_matrix.save(\n",
+        "    # Save it to the custom tests folder we created\n",
+        "    tests_folder,\n",
+        "    imports=[\"import matplotlib.pyplot as plt\", \"from sklearn import metrics\"],\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "- [x] Confirm that the `save()` method saved the `confusion_matrix` function to a file named `ConfusionMatrix.py` in the `my_tests` folder.\n",
+        "- [x] Note that the new file provides some context on the origin of the test, which is useful for traceability:\n",
+        "\n",
+        "    ```\n",
+        "    # Saved from __main__.confusion_matrix\n",
+        "    # Original Test ID: my_custom_tests.ConfusionMatrix\n",
+        "    # New Test ID: <test_provider_namespace>.ConfusionMatrix\n",
+        "    ```\n",
+        "\n",
+        "- [x] Additionally, the new test function has been stripped of its decorator, as it now resides in a file that will be loaded by the test provider:\n",
+        "\n",
+        "    ```python\n",
+        "    def ConfusionMatrix(dataset, model, normalize=False):\n",
+        "    ```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_3__'></a>\n",
+        "\n",
+        "#### Register a local test provider\n",
+        "\n",
+        "Now that your `my_tests` folder has a sample custom test, let's initialize a test provider that will tell the ValidMind Library where to find your custom tests:\n",
+        "\n",
+        "- ValidMind offers out-of-the-box test providers for local tests (tests in a folder) or a GitHub provider for tests in a GitHub repository.\n",
+        "- You can also create your own test provider by creating a class that has a [`load_test` method](https://docs.validmind.ai/validmind/validmind/tests.html#load_test) that takes a test ID and returns the test function matching that ID.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about test providers?</b></span>\n",
+        "<br></br>\n",
+        "An extended introduction to test providers can be found in: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/integrate_external_test_providers.html\" style=\"color: #DE257E;\"><b>Integrate external test providers</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Initialize a local test provider\n",
+        "\n",
+        "For most use cases, using a `LocalTestProvider` that allows you to load custom tests from a designated directory should be sufficient.\n",
+        "\n",
+        "**The most important attribute for a test provider is its `namespace`.** This is a string that will be used to prefix test IDs in documentation. This allows you to have multiple test providers with tests that can even share the same ID, but are distinguished by their namespace.\n",
+        "\n",
+        "Let's go ahead and load the custom tests from our `my_tests` directory:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from validmind.tests import LocalTestProvider\n",
+        "\n",
+        "# initialize the test provider with the tests folder we created earlier\n",
+        "my_test_provider = LocalTestProvider(tests_folder)\n",
+        "\n",
+        "vm.tests.register_test_provider(\n",
+        "    namespace=\"my_test_provider\",\n",
+        "    test_provider=my_test_provider,\n",
+        ")\n",
+        "# `my_test_provider.load_test()` will be called for any test ID that starts with `my_test_provider`\n",
+        "# e.g. `my_test_provider.ConfusionMatrix` will look for a function named `ConfusionMatrix` in `my_tests/ConfusionMatrix.py` file"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Run test provider tests\n",
+        "\n",
+        "Now that we've set up the test provider, we can run any test that's located in the tests folder by using the `run_test()` method as with any other test:\n",
+        "\n",
+        "- For tests that reside in a test provider directory, the test ID will be the `namespace` specified when registering the provider, followed by the path to the test file relative to the tests folder.\n",
+        "- For example, the Confusion Matrix test we created earlier will have the test ID `my_test_provider.ConfusionMatrix`. You could organize the tests in subfolders, say `classification` and `regression`, and the test ID for the Confusion Matrix test would then be `my_test_provider.classification.ConfusionMatrix`.\n",
+        "\n",
+        "Let's go ahead and re-run the confusion matrix test with our testing dataset for our two models by using the test ID `my_test_provider.ConfusionMatrix`. This should load the test from the test provider and run it as before."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Champion with test dataset and test provider custom test\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_test_provider.ConfusionMatrix:champion\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\" : [vm_log_model]\n",
+        "    }\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Challenger with test dataset and test provider custom test\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_test_provider.ConfusionMatrix:challenger\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\" : [vm_rf_model]\n",
+        "    }\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Verify test runs\n",
+        "\n",
+        "Our final task is to verify that all the tests provided by the development team were run and reported accurately. Note the appended `result_ids` to delineate which dataset we ran the test with for the relevant tests.\n",
+        "\n",
+        "Here, we'll specify all the tests we'd like to independently rerun in a dictionary called `test_config`. **Note here that `inputs` and `input_grid` expect the `input_id` of the dataset or model as the value rather than the variable name we specified**:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "test_config = {\n",
+        "    # Run with the raw dataset\n",
+        "    'validmind.data_validation.DatasetDescription:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.DescriptiveStatistics:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.MissingValues:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percentage_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.ClassImbalance:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percent_threshold': 10}\n",
+        "    },\n",
+        "    'validmind.data_validation.Duplicates:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.HighCardinality:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {\n",
+        "            'num_threshold': 100,\n",
+        "            'percent_threshold': 0.1,\n",
+        "            'threshold_type': 'percent'\n",
+        "        }\n",
+        "    },\n",
+        "    'validmind.data_validation.Skewness:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'max_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.UniqueRows:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percent_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TooManyZeroValues:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'max_percent_threshold': 0.03}\n",
+        "    },\n",
+        "    'validmind.data_validation.IQROutliersTable:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'threshold': 5}\n",
+        "    },\n",
+        "    # Run with the preprocessed dataset\n",
+        "    'validmind.data_validation.DescriptiveStatistics:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularDescriptionTables:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
+        "    },\n",
+        "    'validmind.data_validation.MissingValues:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'},\n",
+        "        'params': {'min_percentage_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularNumericalHistograms:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularCategoricalBarPlots:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TargetRateBarPlots:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'},\n",
+        "        'params': {'default_column': 'loan_status'}\n",
+        "    },\n",
+        "    # Run with the training and test datasets\n",
+        "    'validmind.data_validation.DescriptiveStatistics:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularDescriptionTables:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
+        "    },\n",
+        "    'validmind.data_validation.ClassImbalance:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
+        "        'params': {'min_percent_threshold': 10}\n",
+        "    },\n",
+        "    'validmind.data_validation.UniqueRows:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
+        "        'params': {'min_percent_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularNumericalHistograms:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
+        "    },\n",
+        "    'validmind.data_validation.MutualInformation:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
+        "        'params': {'min_threshold': 0.01}\n",
+        "    },\n",
+        "    'validmind.data_validation.PearsonCorrelationMatrix:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
+        "    },\n",
+        "    'validmind.data_validation.HighPearsonCorrelation:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
+        "        'params': {'max_threshold': 0.3, 'top_n_correlations': 10}\n",
+        "    },\n",
+        "    'validmind.model_validation.ModelMetadata': {\n",
+        "        'input_grid': {'model': ['log_model_champion', 'rf_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ModelParameters': {\n",
+        "        'input_grid': {'model': ['log_model_champion', 'rf_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ROCCurve': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final'], 'model': ['log_model_champion']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.MinimumROCAUCScore': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final'], 'model': ['log_model_champion']},\n",
+        "        'params': {'min_threshold': 0.5}\n",
+        "    }\n",
+        "}"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Then batch run and log our tests in `test_config`:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "for t in test_config:\n",
+        "    print(t)\n",
+        "    try:\n",
+        "        # Check if test has input_grid\n",
+        "        if 'input_grid' in test_config[t]:\n",
+        "            # For tests with input_grid, pass the input_grid configuration\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
+        "        else:\n",
+        "            # Original logic for regular inputs\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
+        "    except Exception as e:\n",
+        "        print(f\"Error running test {t}: {str(e)}\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this final notebook, you learned how to:\n",
+        "\n",
+        "- [x] Implement a custom inline test\n",
+        "- [x] Run and log your custom inline tests\n",
+        "- [x] Use external custom test providers\n",
+        "- [x] Run and log tests from your custom test providers\n",
+        "- [x] Re-run tests provided by your development team to verify that they were run and reported accurately\n",
+        "\n",
+        "With our ValidMind for validation series of notebooks, you learned how to validate a record (model) end-to-end with the ValidMind Library by running through some common scenarios in a typical validation setting:\n",
+        "\n",
+        "- Verifying the data quality steps performed by the development team\n",
+        "- Independently replicating the champion's results and conducting additional tests to assess performance, stability, and robustness\n",
+        "- Setting up test inputs and a challenger for comparative analysis\n",
+        "- Running validation tests, analyzing results, and logging artifacts to ValidMind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Next steps"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Work with your validation report\n",
+        "\n",
+        "Now that you've logged all your test results and verified the work done by the development team, head to the ValidMind Platform to wrap up your validation report. Continue to work on your validation report by:\n",
+        "\n",
+        "- **Inserting additional test results:** Click **Link Evidence** under any Evidence panel of 2. Validation in your validation report. (Learn more: [Link evidence to reports](https://docs.validmind.ai/guide/validation/assess-compliance.html#link-evidence-to-reports))\n",
+        "\n",
+        "- **Making qualitative edits to your test descriptions:** Expand any linked evidence under Validator Evidence and click **See evidence details** to review and edit the ValidMind-generated test descriptions for quality and accuracy. (Learn more: [Preparing validation reports](https://docs.validmind.ai/guide/validation/preparing-validation-reports.html#validation-overview))\n",
+        "\n",
+        "- **Adding more findings:** Click **Link Finding to Report** in any validation report section, then click **+ Create New Finding**. (Learn more: [Add and manage artifacts](https://docs.validmind.ai/guide/validation/add-manage-artifacts.html))\n",
+        "\n",
+        "- **Adding risk assessment notes:** Click under **Risk Assessment Notes** in any validation report section to access the text editor and content editing toolbar, including an option to generate a draft with AI. Once generated, edit your ValidMind-generated test descriptions to adhere to your organization's requirements. (Learn more: [Work with content blocks](https://docs.validmind.ai/guide/documentation/work-with-content-blocks.html#content-editing-toolbar))\n",
+        "\n",
+        "- **Assessing compliance:** Under the Guideline for any validation report section, click **ASSESSMENT** and select the compliance status from the drop-down menu. (Learn more: [Assign compliance assessments](https://docs.validmind.ai/guide/validation/assess-compliance.html#assign-compliance-assessments))\n",
+        "\n",
+        "- **Collaborating with other stakeholders:** Use the ValidMind Platform's real-time collaborative features to work seamlessly together with the rest of your organization, including developers. Propose suggested changes in the documentation, work with versioned history, and use comments to discuss specific portions of the documentation. (Learn more: [Collaborate with others](https://docs.validmind.ai/guide/documentation/collaborate-with-others.html))\n",
+        "\n",
+        "When your validation report is complete and ready for review, submit it for approval from the same ValidMind Platform where you made your edits and collaborated with the rest of your organization, ensuring transparency and a thorough validation history. (Learn more: [Submit documents](https://docs.validmind.ai/guide/documentation/submit-documents.html))"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Learn more\n",
+        "\n",
+        "Now that you're familiar with the basics, you can explore the following notebooks to get a deeper understanding of how the ValidMind Library assists you in streamlining validation:"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2_1__'></a>\n",
+        "\n",
+        "#### Use cases\n",
+        "\n",
+        "- [Validate an application scorecard model](../../use_cases/validation/validate_application_scorecard.ipynb)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2_2__'></a>\n",
+        "\n",
+        "#### Discover more learning resources\n",
+        "\n",
+        "Learn more about the ValidMind Library tools we used in this notebook:\n",
+        "\n",
+        "- [Explore tests](../../how_to/tests/explore_tests/explore_tests.ipynb)\n",
+        "- [Run dataset-based tests](../../how_to/tests/run_tests/1-run_dataset-based_tests.ipynb)\n",
+        "- [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb)\n",
+        "- [Integrate external test providers](../../how_to/tests/custom_tests/integrate_external_test_providers.ipynb)\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-0f5cad51d1144e528b343ccbd8f66d06",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
+}
diff --git a/site/notebooks/EXECUTED/model_validation/class-imbalance-results-detail.png b/site/notebooks/EXECUTED/validation/class-imbalance-results-detail.png
similarity index 100%
rename from site/notebooks/EXECUTED/model_validation/class-imbalance-results-detail.png
rename to site/notebooks/EXECUTED/validation/class-imbalance-results-detail.png
diff --git a/site/notebooks/EXECUTED/model_validation/compliance-summary.png b/site/notebooks/EXECUTED/validation/compliance-summary.png
similarity index 100%
rename from site/notebooks/EXECUTED/model_validation/compliance-summary.png
rename to site/notebooks/EXECUTED/validation/compliance-summary.png
diff --git a/site/notebooks/EXECUTED/model_validation/inserted-minimum-f1-scores.png b/site/notebooks/EXECUTED/validation/inserted-minimum-f1-scores.png
similarity index 100%
rename from site/notebooks/EXECUTED/model_validation/inserted-minimum-f1-scores.png
rename to site/notebooks/EXECUTED/validation/inserted-minimum-f1-scores.png
diff --git a/site/notebooks/EXECUTED/model_validation/lr_model_champion.pkl b/site/notebooks/EXECUTED/validation/lr_model_champion.pkl
similarity index 100%
rename from site/notebooks/EXECUTED/model_validation/lr_model_champion.pkl
rename to site/notebooks/EXECUTED/validation/lr_model_champion.pkl
diff --git a/site/notebooks/EXECUTED/model_validation/selecting-class-imbalance-results.png b/site/notebooks/EXECUTED/validation/selecting-class-imbalance-results.png
similarity index 100%
rename from site/notebooks/EXECUTED/model_validation/selecting-class-imbalance-results.png
rename to site/notebooks/EXECUTED/validation/selecting-class-imbalance-results.png
diff --git a/site/notebooks/EXECUTED/model_validation/selecting-minimum-f1-scores.png b/site/notebooks/EXECUTED/validation/selecting-minimum-f1-scores.png
similarity index 100%
rename from site/notebooks/EXECUTED/model_validation/selecting-minimum-f1-scores.png
rename to site/notebooks/EXECUTED/validation/selecting-minimum-f1-scores.png
diff --git a/site/notebooks/how_to/data_and_datasets/dataset_inputs/configure_dataset_features.ipynb b/site/notebooks/how_to/data_and_datasets/dataset_inputs/configure_dataset_features.ipynb
index d8f086ea96..1b9ab41dab 100644
--- a/site/notebooks/how_to/data_and_datasets/dataset_inputs/configure_dataset_features.ipynb
+++ b/site/notebooks/how_to/data_and_datasets/dataset_inputs/configure_dataset_features.ipynb
@@ -1,472 +1,484 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Configure dataset features\n",
-    "\n",
-    "When initializing a ValidMind dataset object, you can pass in a list of features to use instead of utilizing all dataset columns when running tests.\n",
-    "\n",
-    "This notebook shows how to use custom feature columns with `init_dataset`. The default behavior of `init_dataset` is to utilize all dataset columns when running tests. It is also possible to pass in a list of features to use and thus restrict computations to only those features."
-   ]
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Configure dataset features\n",
+        "\n",
+        "When initializing a ValidMind dataset object, you can pass in a list of features to use instead of utilizing all dataset columns when running tests.\n",
+        "\n",
+        "This notebook shows how to use custom feature columns with `init_dataset`. The default behavior of `init_dataset` is to utilize all dataset columns when running tests. It is also possible to pass in a list of features to use and thus restrict computations to only those features."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "  - [Initialize the training and test datasets](#toc3_1__)    \n",
+        "  - [Defining custom features](#toc3_2__)    \n",
+        "- [Next steps](#toc4__)    \n",
+        "  - [Work with your documentation](#toc4_1__)    \n",
+        "  - [Discover more learning resources](#toc4_2__)    \n",
+        "- [Upgrade ValidMind](#toc5__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "%pip install -q validmind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "%matplotlib inline\n",
+        "\n",
+        "# Import the sample dataset from the library\n",
+        "\n",
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "# You can also try a different dataset with:\n",
+        "# from validmind.datasets.classification import taiwan_credit as demo_dataset\n",
+        "\n",
+        "df = demo_dataset.load_data()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Initialize the training and test datasets\n",
+        "\n",
+        "Before you can run a test suite, which is just a collection of tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset` — the raw dataset that you want to analyze\n",
+        "- `input_id` — a unique identifier that allows tracking what inputs are used when running each individual test\n",
+        "- `target_column` — the name of the target column in the dataset\n",
+        "- `feature_columns` — the names of the feature columns in the dataset"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "feature_columns = [\n",
+        "    \"CreditScore\",\n",
+        "    \"Age\",\n",
+        "    \"Tenure\",\n",
+        "    \"Balance\",\n",
+        "    \"NumOfProducts\",\n",
+        "    \"HasCrCard\",\n",
+        "    \"IsActiveMember\",\n",
+        "    \"EstimatedSalary\",\n",
+        "]\n",
+        "\n",
+        "vm_dataset = vm.init_dataset(\n",
+        "    dataset=df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    feature_columns=feature_columns,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Defining custom features\n",
+        "\n",
+        "This section shows how we can define a subset of features to use when running dataset tests. Any feature that is not included in the `feature_columns` argument is omitted from the computation of the `DescriptiveStatistics` test in the examples below."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "In the following example we use the `DescriptiveStatistics` test to show how the output changes when customizing features."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "1. Running a test with all the features."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm_dataset = vm.init_dataset(\n",
+        "    dataset=df,\n",
+        "    input_id=\"raw_dataset_all_features\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        ")\n",
+        "\n",
+        "test = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.DescriptiveStatistics\",\n",
+        "    inputs={\"dataset\": vm_dataset},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "2. Running a test with a subset of features."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm_dataset = vm.init_dataset(\n",
+        "    dataset=df,\n",
+        "    input_id=\"raw_dataset_subset\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    feature_columns=[\"CreditScore\", \"Age\", \"Balance\", \"Geography\"],\n",
+        ")\n",
+        "\n",
+        "test = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.DescriptiveStatistics\",\n",
+        "    inputs={\"dataset\": vm_dataset},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of these tests right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "%pip show validmind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-32870f8bce7f4ed0903136a69d02b421",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": ".venv",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.8.13"
+    }
   },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "  - [Initialize the training and test datasets](#toc3_1__)    \n",
-    "  - [Defining custom features](#toc3_2__)    \n",
-    "- [Next steps](#toc4__)    \n",
-    "  - [Work with your model documentation](#toc4_1__)    \n",
-    "  - [Discover more learning resources](#toc4_2__)    \n",
-    "- [Upgrade ValidMind](#toc5__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%matplotlib inline\n",
-    "\n",
-    "# Import the sample dataset from the library\n",
-    "\n",
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "# You can also try a different dataset with:\n",
-    "# from validmind.datasets.classification import taiwan_credit as demo_dataset\n",
-    "\n",
-    "df = demo_dataset.load_data()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Initialize the training and test datasets\n",
-    "\n",
-    "Before you can run a test suite, which is just a collection of tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset` — the raw dataset that you want to analyze\n",
-    "- `input_id` - a unique identifier that allows tracking what inputs are used when running each individual test\n",
-    "- `target_column` — the name of the target column in the dataset\n",
-    "- `feature_columns` - the names of the feature columns in the dataset"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "feature_columns = [\n",
-    "    \"CreditScore\",\n",
-    "    \"Age\",\n",
-    "    \"Tenure\",\n",
-    "    \"Balance\",\n",
-    "    \"NumOfProducts\",\n",
-    "    \"HasCrCard\",\n",
-    "    \"IsActiveMember\",\n",
-    "    \"EstimatedSalary\",\n",
-    "]\n",
-    "\n",
-    "vm_dataset = vm.init_dataset(\n",
-    "    dataset=df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    feature_columns=feature_columns,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Defining custom features\n",
-    "\n",
-    "This section shows how we can define a subset of features to use when running dataset tests. Any feature that is not included in the `feature_columns` argument is omitted from the computation of the `DescriptiveStatistics` test in the examples below."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "In the following example we use the `DescriptiveStatistics` test to show how the output changes when customizing features."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "1. Running a test with all the features."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_dataset = vm.init_dataset(\n",
-    "    dataset=df,\n",
-    "    input_id=\"raw_dataset_all_features\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    ")\n",
-    "\n",
-    "test = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.DescriptiveStatistics\",\n",
-    "    inputs={\"dataset\": vm_dataset},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "2. Running a test with a subset of features."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_dataset = vm.init_dataset(\n",
-    "    dataset=df,\n",
-    "    input_id=\"raw_dataset_subset\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    feature_columns=[\"CreditScore\", \"Age\", \"Balance\", \"Geography\"],\n",
-    ")\n",
-    "\n",
-    "test = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.DescriptiveStatistics\",\n",
-    "    inputs={\"dataset\": vm_dataset},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-32870f8bce7f4ed0903136a69d02b421",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": ".venv",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.8.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/how_to/data_and_datasets/dataset_inputs/load_datasets_predictions.ipynb b/site/notebooks/how_to/data_and_datasets/dataset_inputs/load_datasets_predictions.ipynb
index 484648fa75..a98ff348bc 100644
--- a/site/notebooks/how_to/data_and_datasets/dataset_inputs/load_datasets_predictions.ipynb
+++ b/site/notebooks/how_to/data_and_datasets/dataset_inputs/load_datasets_predictions.ipynb
@@ -1,1061 +1,1073 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Load dataset predictions\n",
-    "\n",
-    "To enable tests to make use of predictions, you can load predictions in ValidMind dataset objects in multiple different ways.\n",
-    "\n",
-    "This interactive notebook includes the code required to load the demo dataset, preprocess the raw dataset and train a model for testing, and initialize ValidMind objects. Additionally, it offers options for loading predictions using the `assign_predictions()` function, such as loading predictions from a file, linking an existing prediction column in the dataset with a model, or allowing the ValidMind Library to run and link predictions to a model."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_3__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "- [Preprocess the raw dataset](#toc4__)    \n",
-    "- [Train models for testing](#toc5__)    \n",
-    "- [Initialize ValidMind objects](#toc6__)    \n",
-    "  - [Initialize the ValidMind models](#toc6_1__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc6_2__)    \n",
-    "- [Options to load predictions using the ValidMind Library](#toc7__)    \n",
-    "  - [Load predictions from a file](#toc7_1__)    \n",
-    "  - [Predictions calculated outside of VM](#toc7_2__)    \n",
-    "  - [Assign predictions to the training dataset](#toc7_3__)    \n",
-    "  - [Run an example test](#toc7_4__)    \n",
-    "  - [Link an existing prediction column in the dataset with a model](#toc7_5__)    \n",
-    "    - [Link prediction column to a specific model](#toc7_5_1__)    \n",
-    "  - [Link an existing prediction column in the dataset with a model](#toc7_6__)    \n",
-    "    - [Pass `<vm_model>` in dataset interface](#toc7_6_1__)    \n",
-    "    - [Through `assign_predictions` interface](#toc7_6_2__)    \n",
-    "  - [Run an example test](#toc7_7__)    \n",
-    "  - [Using `predict_fn` to store multiple columns](#toc7_8__)    \n",
-    "    - [Create enhanced predict function](#toc7_8_1__)    \n",
-    "    - [Initialize model with predict function](#toc7_8_2__)    \n",
-    "    - [Assign predictions with multiple columns](#toc7_8_3__)    \n",
-    "    - [Verify multiple columns in dataset](#toc7_8_4__)    \n",
-    "- [Next steps](#toc8__)    \n",
-    "  - [Work with your model documentation](#toc8_1__)    \n",
-    "  - [Discover more learning resources](#toc8_2__)    \n",
-    "- [Upgrade ValidMind](#toc9__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library. To be able to use it, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the sample dataset from the library\n",
-    "\n",
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = demo_dataset.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Preprocess the raw dataset\n",
-    "\n",
-    "Preprocessing performs a number of operations to get ready for the subsequent steps:\n",
-    "\n",
-    "- Preprocess the data: Splits the DataFrame (`raw_df`) into multiple datasets (`train_df`, `validation_df`, and `test_df`) using `demo_dataset.preprocess` to simplify preprocessing.\n",
-    "- Separate features and targets: Drops the target column to create feature sets (`x_train`, `x_val`) and target sets (`y_train`, `y_val`)."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df, validation_df, test_df = demo_dataset.preprocess(raw_df)\n",
-    "x_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_train = train_df[demo_dataset.target_column]\n",
-    "x_val = validation_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_val = validation_df[demo_dataset.target_column]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Train models for testing\n",
-    "\n",
-    "- Initialize XGBoost and Logistic Regression Classifiers"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.linear_model import LogisticRegression\n",
-    "import xgboost\n",
-    "\n",
-    "%matplotlib inline\n",
-    "\n",
-    "xgb = xgboost.XGBClassifier(early_stopping_rounds=10)\n",
-    "xgb.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "xgb.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    "    eval_set=[(x_val, y_val)],\n",
-    "    verbose=False,\n",
-    ")\n",
-    "\n",
-    "lr = LogisticRegression(random_state=0)\n",
-    "lr.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    ")\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Initialize ValidMind objects\n",
-    "\n",
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind models"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_model_xgb = vm.init_model(\n",
-    "    xgb,\n",
-    "    input_id=\"xgb\",\n",
-    ")\n",
-    "vm_model_lr = vm.init_model(\n",
-    "    lr,\n",
-    "    input_id=\"lr\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset` — the raw dataset that you want to provide as input to tests\n",
-    "- `input_id` - a unique identifier that allows tracking what inputs are used when running each individual test\n",
-    "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
-    "- `class_labels` — an optional value to map predicted classes to class labels\n",
-    "\n",
-    "With all datasets ready, you can now initialize the raw, training and test datasets (`raw_df`, `train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_ds = vm.init_dataset(\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    dataset=raw_df,\n",
-    "    target_column=demo_dataset.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=demo_dataset.target_column,\n",
-    ")\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset\", dataset=test_df, target_column=demo_dataset.target_column\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Options to load predictions using the ValidMind Library\n",
-    "\n",
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Load predictions from a file\n",
-    "\n",
-    "This creates a new column called `<model_id>_prediction` in the dataset and assigns metadata to track that the `<model_id>_prediction` column is linked to the model `<model_id>`."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_2__'></a>\n",
-    "\n",
-    "### Predictions calculated outside of VM"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "train_xgb_prediction = pd.DataFrame(xgb.predict(x_train), columns=[\"xgb_prediction\"])\n",
-    "test__xgb_prediction = pd.DataFrame(xgb.predict(x_val), columns=[\"xgb_prediction\"])\n",
-    "\n",
-    "train_lr_prediction = pd.DataFrame(lr.predict(x_train), columns=[\"lr_prediction\"])\n",
-    "test_lr_prediction = pd.DataFrame(lr.predict(x_val), columns=[\"lr_prediction\"])"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_3__'></a>\n",
-    "\n",
-    "### Assign predictions to the training dataset\n",
-    "\n",
-    "We can now use the `assign_predictions()` method from the `Dataset` object to link existing predictions to any model:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model_xgb, prediction_values=train_xgb_prediction.xgb_prediction.values\n",
-    ")\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model_lr, prediction_values=train_lr_prediction.lr_prediction.values\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_4__'></a>\n",
-    "\n",
-    "### Run an example test\n",
-    "\n",
-    "Now, let's run an example test such as `MinimumAccuracy` twice to show how we're able to load the correct model predictions by using the `model` input parameter, even though we're passing the same `train_ds` dataset instance to the test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
-    "    inputs={\"dataset\": vm_train_ds, \"model\": vm_model_xgb},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_train_ds,\n",
-    "        \"model\": vm_model_lr,\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_5__'></a>\n",
-    "\n",
-    "### Link an existing prediction column in the dataset with a model\n",
-    "\n",
-    "This approach allows loading datasets that already have prediction columns in addition to feature and target columns. The ValidMind Library assigns metadata to track the predictions column that are linked to a given `<vm_model>` model."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df2 = train_df.copy()\n",
-    "train_df2[\"xgb_prediction\"] = train_xgb_prediction.xgb_prediction.values\n",
-    "train_df2[\"lr_prediction\"] = train_lr_prediction.lr_prediction.values\n",
-    "train_df2.head(5)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "feature_columns = [\n",
-    "    \"CreditScore\",\n",
-    "    \"Gender\",\n",
-    "    \"Age\",\n",
-    "    \"Tenure\",\n",
-    "    \"Balance\",\n",
-    "    \"NumOfProducts\",\n",
-    "    \"HasCrCard\",\n",
-    "    \"IsActiveMember\",\n",
-    "    \"EstimatedSalary\",\n",
-    "    \"Geography_France\",\n",
-    "    \"Geography_Germany\",\n",
-    "    \"Geography_Spain\",\n",
-    "]\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df2,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    feature_columns=feature_columns,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_5_1__'></a>\n",
-    "\n",
-    "#### Link prediction column to a specific model\n",
-    "\n",
-    "The `prediction_column` parameter informs the `Dataset` object about the model that should be linked to that column."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(model=vm_model_xgb, prediction_column=\"xgb_prediction\")\n",
-    "vm_train_ds.assign_predictions(model=vm_model_lr, prediction_column=\"lr_prediction\")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {
-    "id": "wE0OckXjSPc7"
-   },
-   "outputs": [],
-   "source": [
-    "full_suite = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
-    "    inputs={\"dataset\": vm_train_ds, \"model\": vm_model_xgb},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
-    "    inputs={\"dataset\": vm_train_ds, \"model\": vm_model_lr},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_6__'></a>\n",
-    "\n",
-    "### Link an existing prediction column in the dataset with a model\n",
-    "\n",
-    "This lets the ValidMind Library run model predictions, creates a new column called `<model_id>_prediction`, and assign metadata to track that the `<model_id>_prediction` column is linked to the `<vm_model>` model.\n",
-    "\n",
-    "There are two ways run and assign model predictions with the ValidMind Library:\n",
-    "\n",
-    "- When initializing a `Dataset` with `init_dataset()`. This is the most straightforward method to assign predictions for a single model.\n",
-    "- Using `dataset.assign_predictions()`. This allows assigning predictions to a dataset for one or more models."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_6_1__'></a>\n",
-    "\n",
-    "#### Pass `<vm_model>` in dataset interface"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "feature_columns = [\n",
-    "    \"CreditScore\",\n",
-    "    \"Gender\",\n",
-    "    \"Age\",\n",
-    "    \"Tenure\",\n",
-    "    \"Balance\",\n",
-    "    \"NumOfProducts\",\n",
-    "    \"HasCrCard\",\n",
-    "    \"IsActiveMember\",\n",
-    "    \"EstimatedSalary\",\n",
-    "    \"Geography_France\",\n",
-    "    \"Geography_Germany\",\n",
-    "    \"Geography_Spain\",\n",
-    "]\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    model=vm_model_xgb,\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    feature_columns=feature_columns,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_6_2__'></a>\n",
-    "\n",
-    "#### Through `assign_predictions` interface"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    feature_columns=feature_columns,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "##### Perform predictions using the same `assign_predictions` interface"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(model=vm_model_xgb)\n",
-    "vm_train_ds.assign_predictions(model=vm_model_lr)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_7__'></a>\n",
-    "\n",
-    "### Run an example test\n",
-    "\n",
-    "Now, let's run an example test such as `MinimumAccuracy` twice to show how we're able to load the correct model predictions by using the `model` input parameter, even though we're passing the same `train_ds` dataset instance to the test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
-    "    inputs={\"dataset\": vm_train_ds, \"model\": vm_model_xgb},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_train_ds,\n",
-    "        \"model\": vm_model_lr,\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_8__'></a>\n",
-    "\n",
-    "### Using `predict_fn` to store multiple columns\n",
-    "\n",
-    "The `predict_fn` parameter in `vm.init_model()` allows you to create models that return multiple pieces of information when making predictions. This is particularly useful when you want to capture additional metadata, confidence scores, feature importance, or any other model-related information alongside the main prediction.\n",
-    "\n",
-    "By returning a dictionary from your predict function, ValidMind automatically creates separate columns for each key when you run `assign_predictions()`."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_8_1__'></a>\n",
-    "\n",
-    "#### Create enhanced predict function\n",
-    "\n",
-    "Let's create a predict function that wraps our XGBoost model and returns multiple pieces of information:\n",
-    "- **prediction**: The main class prediction\n",
-    "- **prediction_proba**: The prediction probabilities for both classes\n",
-    "- **confidence**: The maximum probability as a confidence score\n",
-    "- **model_info**: Metadata about the model used"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import numpy as np\n",
-    "import pandas as pd\n",
-    "\n",
-    "def enhanced_xgb_predict_fn(input_data):\n",
-    "    \"\"\"\n",
-    "    Enhanced predict function that returns multiple pieces of information.\n",
-    "    \n",
-    "    Args:\n",
-    "        input_data: Input features for prediction (single row as dictionary when called by ValidMind)\n",
-    "    \n",
-    "    Returns:\n",
-    "        dict: Dictionary containing prediction, probabilities, confidence, and model info\n",
-    "    \"\"\"\n",
-    "    # Define the feature columns that the model was trained on\n",
-    "    # These are the same columns from x_train (excluding the target column 'Exited')\n",
-    "    training_features = [\n",
-    "        'CreditScore', 'Gender', 'Age', 'Tenure', 'Balance', 'NumOfProducts',\n",
-    "        'HasCrCard', 'IsActiveMember', 'EstimatedSalary', 'Geography_France',\n",
-    "        'Geography_Germany', 'Geography_Spain'\n",
-    "    ]\n",
-    "    \n",
-    "    # Convert dictionary input to DataFrame for model prediction\n",
-    "    # When called by ValidMind, input_data is a single row dictionary\n",
-    "    if isinstance(input_data, dict):\n",
-    "        # Filter to only include training features and convert to DataFrame\n",
-    "        filtered_data = {key: value for key, value in input_data.items() if key in training_features}\n",
-    "        input_df = pd.DataFrame([filtered_data])\n",
-    "        \n",
-    "        # Ensure all training features are present (in case some are missing)\n",
-    "        for feature in training_features:\n",
-    "            if feature not in input_df.columns:\n",
-    "                input_df[feature] = 0  # Default value for missing features\n",
-    "        \n",
-    "        # Reorder columns to match training order\n",
-    "        input_df = input_df[training_features]\n",
-    "    else:\n",
-    "        # Handle other input types (DataFrame, array, etc.)\n",
-    "        input_df = pd.DataFrame(input_data) if not isinstance(input_data, pd.DataFrame) else input_data\n",
-    "        # Filter to training features if it's a DataFrame\n",
-    "        if isinstance(input_df, pd.DataFrame):\n",
-    "            input_df = input_df[training_features]\n",
-    "    \n",
-    "    # Make predictions\n",
-    "    prediction = xgb.predict(input_df)\n",
-    "    prediction_proba = xgb.predict_proba(input_df)\n",
-    "    \n",
-    "    # Since we're processing one row at a time, extract the single values\n",
-    "    single_prediction = prediction[0] if len(prediction) > 0 else None\n",
-    "    single_proba = prediction_proba[0] if len(prediction_proba) > 0 else None\n",
-    "    \n",
-    "    # Calculate confidence as the maximum probability for this prediction\n",
-    "    confidence = np.max(single_proba) if single_proba is not None else None\n",
-    "    \n",
-    "    # Create model metadata\n",
-    "    model_info = {\n",
-    "        \"model_type\": \"XGBClassifier\",\n",
-    "        \"n_estimators\": xgb.n_estimators,\n",
-    "        \"max_depth\": xgb.max_depth,\n",
-    "        \"feature_count\": len(training_features),\n",
-    "        \"features_used\": training_features\n",
-    "    }\n",
-    "    \n",
-    "    return {\n",
-    "        \"prediction\": single_prediction,\n",
-    "        \"prediction_proba\": single_proba.tolist() if single_proba is not None else None,\n",
-    "        \"confidence\": confidence,\n",
-    "        \"model_info\": model_info\n",
-    "    }\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_8_2__'></a>\n",
-    "\n",
-    "#### Initialize model with predict function\n",
-    "\n",
-    "Now we'll create a ValidMind model using the `predict_fn` parameter. This tells ValidMind to use our enhanced function instead of the model's default `predict()` method:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize ValidMind model with the enhanced predict function\n",
-    "vm_model_enhanced_xgb = vm.init_model(\n",
-    "    model=xgb,\n",
-    "    input_id=\"enhanced_xgb\",\n",
-    "    predict_fn=enhanced_xgb_predict_fn \n",
-    ")\n",
-    "\n",
-    "print(f\"Enhanced XGBoost model initialized with input_id: {vm_model_enhanced_xgb.input_id}\")\n",
-    "print(\"This model now uses the predict function that handles dictionary inputs correctly\")\n",
-    "print(\"It will return multiple columns when predictions are assigned to datasets\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_8_3__'></a>\n",
-    "\n",
-    "#### Assign predictions with multiple columns\n",
-    "\n",
-    "When we use `assign_predictions()` with our enhanced model, ValidMind will automatically create separate columns for each key returned by our predict function. Let's assign predictions to our test dataset:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Create a fresh dataset for this demonstration\n",
-    "vm_test_ds_enhanced = vm.init_dataset(\n",
-    "    input_id=\"test_dataset_enhanced\",\n",
-    "    dataset=test_df,\n",
-    "    target_column=demo_dataset.target_column\n",
-    ")\n",
-    "\n",
-    "# This will create multiple columns based on the keys returned by our predict function\n",
-    "vm_test_ds_enhanced.assign_predictions(model=vm_model_enhanced_xgb)\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_8_4__'></a>\n",
-    "\n",
-    "#### Verify multiple columns in dataset\n",
-    "\n",
-    "Let's examine the dataset to see all the columns that were created by our enhanced predict function. Each key from the returned dictionary becomes a separate column with the model's `input_id` as a prefix:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_test_ds_enhanced._df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc8_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc8_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-76fcd2c215674068b812492b7c639056",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "colab": {
-   "provenance": []
-  },
-  "gpuClass": "standard",
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.11.9"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 0
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Load dataset predictions\n",
+        "\n",
+        "To enable tests to make use of predictions, you can load predictions into ValidMind dataset objects in several ways.\n",
+        "\n",
+        "This interactive notebook includes the code required to load the demo dataset, preprocess the raw dataset and train a model for testing, and initialize ValidMind objects. Additionally, it offers options for loading predictions using the `assign_predictions()` function, such as loading predictions from a file, linking an existing prediction column in the dataset with a model, or allowing the ValidMind Library to run and link predictions to a model."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_3__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "- [Preprocess the raw dataset](#toc4__)    \n",
+        "- [Train models for testing](#toc5__)    \n",
+        "- [Initialize ValidMind objects](#toc6__)    \n",
+        "  - [Initialize the ValidMind models](#toc6_1__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc6_2__)    \n",
+        "- [Options to load predictions using the ValidMind Library](#toc7__)    \n",
+        "  - [Load predictions from a file](#toc7_1__)    \n",
+        "  - [Predictions calculated outside of VM](#toc7_2__)    \n",
+        "  - [Assign predictions to the training dataset](#toc7_3__)    \n",
+        "  - [Run an example test](#toc7_4__)    \n",
+        "  - [Link an existing prediction column in the dataset with a model](#toc7_5__)    \n",
+        "    - [Link prediction column to a specific model](#toc7_5_1__)    \n",
+        "  - [Link an existing prediction column in the dataset with a model](#toc7_6__)    \n",
+        "    - [Pass `<vm_model>` in dataset interface](#toc7_6_1__)    \n",
+        "    - [Through `assign_predictions` interface](#toc7_6_2__)    \n",
+        "  - [Run an example test](#toc7_7__)    \n",
+        "  - [Using `predict_fn` to store multiple columns](#toc7_8__)    \n",
+        "    - [Create enhanced predict function](#toc7_8_1__)    \n",
+        "    - [Initialize model with predict function](#toc7_8_2__)    \n",
+        "    - [Assign predictions with multiple columns](#toc7_8_3__)    \n",
+        "    - [Verify multiple columns in dataset](#toc7_8_4__)    \n",
+        "- [Next steps](#toc8__)    \n",
+        "  - [Work with your model documentation](#toc8_1__)    \n",
+        "  - [Discover more learning resources](#toc8_2__)    \n",
+        "- [Upgrade ValidMind](#toc9__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind Library. To be able to use it, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Import the sample dataset from the library\n",
+        "\n",
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = demo_dataset.load_data()\n",
+        "raw_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Preprocess the raw dataset\n",
+        "\n",
+        "Preprocessing performs a number of operations to get ready for the subsequent steps:\n",
+        "\n",
+        "- Preprocess the data: Splits the DataFrame (`raw_df`) into multiple datasets (`train_df`, `validation_df`, and `test_df`) using `demo_dataset.preprocess` to simplify preprocessing.\n",
+        "- Separate features and targets: Drops the target column to create feature sets (`x_train`, `x_val`) and target sets (`y_train`, `y_val`)."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df, validation_df, test_df = demo_dataset.preprocess(raw_df)\n",
+        "x_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_train = train_df[demo_dataset.target_column]\n",
+        "x_val = validation_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_val = validation_df[demo_dataset.target_column]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Train models for testing\n",
+        "\n",
+        "- Initialize XGBoost and Logistic Regression Classifiers"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from sklearn.linear_model import LogisticRegression\n",
+        "import xgboost\n",
+        "\n",
+        "%matplotlib inline\n",
+        "\n",
+        "xgb = xgboost.XGBClassifier(early_stopping_rounds=10)\n",
+        "xgb.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "xgb.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        "    eval_set=[(x_val, y_val)],\n",
+        "    verbose=False,\n",
+        ")\n",
+        "\n",
+        "lr = LogisticRegression(random_state=0)\n",
+        "lr.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        ")\n"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Initialize ValidMind objects\n",
+        "\n",
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind models"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_model_xgb = vm.init_model(\n",
+        "    xgb,\n",
+        "    input_id=\"xgb\",\n",
+        ")\n",
+        "vm_model_lr = vm.init_model(\n",
+        "    lr,\n",
+        "    input_id=\"lr\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset` — the raw dataset that you want to provide as input to tests\n",
+        "- `input_id` — a unique identifier that allows tracking what inputs are used when running each individual test\n",
+        "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
+        "- `class_labels` — an optional value to map predicted classes to class labels\n",
+        "\n",
+        "With all datasets ready, you can now initialize the raw, training and test datasets (`raw_df`, `train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_ds = vm.init_dataset(\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    dataset=raw_df,\n",
+        "    target_column=demo_dataset.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=demo_dataset.target_column,\n",
+        ")\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset\", dataset=test_df, target_column=demo_dataset.target_column\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Options to load predictions using the ValidMind Library\n",
+        "\n",
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Load predictions from a file\n",
+        "\n",
+        "This creates a new column called `<model_id>_prediction` in the dataset and assigns metadata to track that the `<model_id>_prediction` column is linked to the model `<model_id>`."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_2__'></a>\n",
+        "\n",
+        "### Predictions calculated outside of VM"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "train_xgb_prediction = pd.DataFrame(xgb.predict(x_train), columns=[\"xgb_prediction\"])\n",
+        "test__xgb_prediction = pd.DataFrame(xgb.predict(x_val), columns=[\"xgb_prediction\"])\n",
+        "\n",
+        "train_lr_prediction = pd.DataFrame(lr.predict(x_train), columns=[\"lr_prediction\"])\n",
+        "test_lr_prediction = pd.DataFrame(lr.predict(x_val), columns=[\"lr_prediction\"])"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_3__'></a>\n",
+        "\n",
+        "### Assign predictions to the training dataset\n",
+        "\n",
+        "We can now use the `assign_predictions()` method from the `Dataset` object to link existing predictions to any model:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model_xgb, prediction_values=train_xgb_prediction.xgb_prediction.values\n",
+        ")\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model_lr, prediction_values=train_lr_prediction.lr_prediction.values\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_4__'></a>\n",
+        "\n",
+        "### Run an example test\n",
+        "\n",
+        "Now, let's run an example test such as `MinimumAccuracy` twice to show how we're able to load the correct model predictions by using the `model` input parameter, even though we're passing the same `vm_train_ds` dataset instance to the test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "full_suite = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
+        "    inputs={\"dataset\": vm_train_ds, \"model\": vm_model_xgb},\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "full_suite = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_train_ds,\n",
+        "        \"model\": vm_model_lr,\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_5__'></a>\n",
+        "\n",
+        "### Link an existing prediction column in the dataset with a model\n",
+        "\n",
+        "This approach allows loading datasets that already have prediction columns in addition to feature and target columns. The ValidMind Library assigns metadata to track the prediction columns that are linked to a given `<vm_model>` model."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df2 = train_df.copy()\n",
+        "train_df2[\"xgb_prediction\"] = train_xgb_prediction.xgb_prediction.values\n",
+        "train_df2[\"lr_prediction\"] = train_lr_prediction.lr_prediction.values\n",
+        "train_df2.head(5)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "feature_columns = [\n",
+        "    \"CreditScore\",\n",
+        "    \"Gender\",\n",
+        "    \"Age\",\n",
+        "    \"Tenure\",\n",
+        "    \"Balance\",\n",
+        "    \"NumOfProducts\",\n",
+        "    \"HasCrCard\",\n",
+        "    \"IsActiveMember\",\n",
+        "    \"EstimatedSalary\",\n",
+        "    \"Geography_France\",\n",
+        "    \"Geography_Germany\",\n",
+        "    \"Geography_Spain\",\n",
+        "]\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df2,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    feature_columns=feature_columns,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_5_1__'></a>\n",
+        "\n",
+        "#### Link prediction column to a specific model\n",
+        "\n",
+        "The `prediction_column` parameter informs the `Dataset` object about the model that should be linked to that column."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(model=vm_model_xgb, prediction_column=\"xgb_prediction\")\n",
+        "vm_train_ds.assign_predictions(model=vm_model_lr, prediction_column=\"lr_prediction\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "wE0OckXjSPc7"
+      },
+      "source": [
+        "full_suite = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
+        "    inputs={\"dataset\": vm_train_ds, \"model\": vm_model_xgb},\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "full_suite = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
+        "    inputs={\"dataset\": vm_train_ds, \"model\": vm_model_lr},\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_6__'></a>\n",
+        "\n",
+        "### Link an existing prediction column in the dataset with a model\n",
+        "\n",
+        "This lets the ValidMind Library run model predictions, create a new column called `<model_id>_prediction`, and assign metadata to track that the `<model_id>_prediction` column is linked to the `<vm_model>` model.\n",
+        "\n",
+        "There are two ways to run and assign model predictions with the ValidMind Library:\n",
+        "\n",
+        "- When initializing a `Dataset` with `init_dataset()`. This is the most straightforward method to assign predictions for a single model.\n",
+        "- Using `dataset.assign_predictions()`. This allows assigning predictions to a dataset for one or more models."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_6_1__'></a>\n",
+        "\n",
+        "#### Pass `<vm_model>` in dataset interface"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "feature_columns = [\n",
+        "    \"CreditScore\",\n",
+        "    \"Gender\",\n",
+        "    \"Age\",\n",
+        "    \"Tenure\",\n",
+        "    \"Balance\",\n",
+        "    \"NumOfProducts\",\n",
+        "    \"HasCrCard\",\n",
+        "    \"IsActiveMember\",\n",
+        "    \"EstimatedSalary\",\n",
+        "    \"Geography_France\",\n",
+        "    \"Geography_Germany\",\n",
+        "    \"Geography_Spain\",\n",
+        "]\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    model=vm_model_xgb,\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    feature_columns=feature_columns,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_6_2__'></a>\n",
+        "\n",
+        "#### Through `assign_predictions` interface"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    feature_columns=feature_columns,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Perform predictions using the same `assign_predictions` interface"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(model=vm_model_xgb)\n",
+        "vm_train_ds.assign_predictions(model=vm_model_lr)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_7__'></a>\n",
+        "\n",
+        "### Run an example test\n",
+        "\n",
+        "Now, let's run an example test such as `MinimumAccuracy` twice to show how we're able to load the correct model predictions by using the `model` input parameter, even though we're passing the same `vm_train_ds` dataset instance to the test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "full_suite = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
+        "    inputs={\"dataset\": vm_train_ds, \"model\": vm_model_xgb},\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "full_suite = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_train_ds,\n",
+        "        \"model\": vm_model_lr,\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_8__'></a>\n",
+        "\n",
+        "### Using `predict_fn` to store multiple columns\n",
+        "\n",
+        "The `predict_fn` parameter in `vm.init_model()` allows you to create models that return multiple pieces of information when making predictions. This is particularly useful when you want to capture additional metadata, confidence scores, feature importance, or any other model-related information alongside the main prediction.\n",
+        "\n",
+        "By returning a dictionary from your predict function, ValidMind automatically creates separate columns for each key when you run `assign_predictions()`."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_8_1__'></a>\n",
+        "\n",
+        "#### Create enhanced predict function\n",
+        "\n",
+        "Let's create a predict function that wraps our XGBoost model and returns multiple pieces of information:\n",
+        "- **prediction**: The main class prediction\n",
+        "- **prediction_proba**: The prediction probabilities for both classes\n",
+        "- **confidence**: The maximum probability as a confidence score\n",
+        "- **model_info**: Metadata about the model used"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import numpy as np\n",
+        "import pandas as pd\n",
+        "\n",
+        "def enhanced_xgb_predict_fn(input_data):\n",
+        "    \"\"\"\n",
+        "    Enhanced predict function that returns multiple pieces of information.\n",
+        "    \n",
+        "    Args:\n",
+        "        input_data: Input features for prediction (single row as dictionary when called by ValidMind)\n",
+        "    \n",
+        "    Returns:\n",
+        "        dict: Dictionary containing prediction, probabilities, confidence, and model info\n",
+        "    \"\"\"\n",
+        "    # Define the feature columns that the model was trained on\n",
+        "    # These are the same columns from x_train (excluding the target column 'Exited')\n",
+        "    training_features = [\n",
+        "        'CreditScore', 'Gender', 'Age', 'Tenure', 'Balance', 'NumOfProducts',\n",
+        "        'HasCrCard', 'IsActiveMember', 'EstimatedSalary', 'Geography_France',\n",
+        "        'Geography_Germany', 'Geography_Spain'\n",
+        "    ]\n",
+        "    \n",
+        "    # Convert dictionary input to DataFrame for model prediction\n",
+        "    # When called by ValidMind, input_data is a single row dictionary\n",
+        "    if isinstance(input_data, dict):\n",
+        "        # Filter to only include training features and convert to DataFrame\n",
+        "        filtered_data = {key: value for key, value in input_data.items() if key in training_features}\n",
+        "        input_df = pd.DataFrame([filtered_data])\n",
+        "        \n",
+        "        # Ensure all training features are present (in case some are missing)\n",
+        "        for feature in training_features:\n",
+        "            if feature not in input_df.columns:\n",
+        "                input_df[feature] = 0  # Default value for missing features\n",
+        "        \n",
+        "        # Reorder columns to match training order\n",
+        "        input_df = input_df[training_features]\n",
+        "    else:\n",
+        "        # Handle other input types (DataFrame, array, etc.)\n",
+        "        input_df = pd.DataFrame(input_data) if not isinstance(input_data, pd.DataFrame) else input_data\n",
+        "        # Filter to training features if it's a DataFrame\n",
+        "        if isinstance(input_df, pd.DataFrame):\n",
+        "            input_df = input_df[training_features]\n",
+        "    \n",
+        "    # Make predictions\n",
+        "    prediction = xgb.predict(input_df)\n",
+        "    prediction_proba = xgb.predict_proba(input_df)\n",
+        "    \n",
+        "    # Since we're processing one row at a time, extract the single values\n",
+        "    single_prediction = prediction[0] if len(prediction) > 0 else None\n",
+        "    single_proba = prediction_proba[0] if len(prediction_proba) > 0 else None\n",
+        "    \n",
+        "    # Calculate confidence as the maximum probability for this prediction\n",
+        "    confidence = np.max(single_proba) if single_proba is not None else None\n",
+        "    \n",
+        "    # Create model metadata\n",
+        "    model_info = {\n",
+        "        \"model_type\": \"XGBClassifier\",\n",
+        "        \"n_estimators\": xgb.n_estimators,\n",
+        "        \"max_depth\": xgb.max_depth,\n",
+        "        \"feature_count\": len(training_features),\n",
+        "        \"features_used\": training_features\n",
+        "    }\n",
+        "    \n",
+        "    return {\n",
+        "        \"prediction\": single_prediction,\n",
+        "        \"prediction_proba\": single_proba.tolist() if single_proba is not None else None,\n",
+        "        \"confidence\": confidence,\n",
+        "        \"model_info\": model_info\n",
+        "    }\n"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_8_2__'></a>\n",
+        "\n",
+        "#### Initialize model with predict function\n",
+        "\n",
+        "Now we'll create a ValidMind model using the `predict_fn` parameter. This tells ValidMind to use our enhanced function instead of the model's default `predict()` method:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Initialize ValidMind model with the enhanced predict function\n",
+        "vm_model_enhanced_xgb = vm.init_model(\n",
+        "    model=xgb,\n",
+        "    input_id=\"enhanced_xgb\",\n",
+        "    predict_fn=enhanced_xgb_predict_fn \n",
+        ")\n",
+        "\n",
+        "print(f\"Enhanced XGBoost model initialized with input_id: {vm_model_enhanced_xgb.input_id}\")\n",
+        "print(\"This model now uses the predict function that handles dictionary inputs correctly\")\n",
+        "print(\"It will return multiple columns when predictions are assigned to datasets\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_8_3__'></a>\n",
+        "\n",
+        "#### Assign predictions with multiple columns\n",
+        "\n",
+        "When we use `assign_predictions()` with our enhanced model, ValidMind will automatically create separate columns for each key returned by our predict function. Let's assign predictions to our test dataset:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Create a fresh dataset for this demonstration\n",
+        "vm_test_ds_enhanced = vm.init_dataset(\n",
+        "    input_id=\"test_dataset_enhanced\",\n",
+        "    dataset=test_df,\n",
+        "    target_column=demo_dataset.target_column\n",
+        ")\n",
+        "\n",
+        "# This will create multiple columns based on the keys returned by our predict function\n",
+        "vm_test_ds_enhanced.assign_predictions(model=vm_model_enhanced_xgb)\n"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_8_4__'></a>\n",
+        "\n",
+        "#### Verify multiple columns in dataset\n",
+        "\n",
+        "Let's examine the dataset to see all the columns that were created by our enhanced predict function. Each key from the returned dictionary becomes a separate column with the model's `input_id` as a prefix:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_test_ds_enhanced._df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc8_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc8_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-76fcd2c215674068b812492b7c639056"
+    }
+  ],
+  "metadata": {
+    "colab": {
+      "provenance": []
+    },
+    "gpuClass": "standard",
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.11.9"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 0
 }
diff --git a/site/notebooks/how_to/data_and_datasets/use_dataset_model_objects.ipynb b/site/notebooks/how_to/data_and_datasets/use_dataset_model_objects.ipynb
index 1929fb3acb..7102ad6de1 100644
--- a/site/notebooks/how_to/data_and_datasets/use_dataset_model_objects.ipynb
+++ b/site/notebooks/how_to/data_and_datasets/use_dataset_model_objects.ipynb
@@ -1,991 +1,999 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Introduction to ValidMind Dataset and Model Objects\n",
-    "\n",
-    "When writing custom tests, it is essential to be aware of the interfaces of the ValidMind Dataset and ValidMind Model, which are used as input arguments.\n",
-    "\n",
-    "As a model developer, writing custom tests is beneficial when the ValidMind library lacks a built-in test for your specific needs. For example, a model might require new tests to evaluate specific aspects of the model or dataset based on a particular use case.\n",
-    "\n",
-    "This interactive notebook offers a detailed understanding of ValidMind objects and their use in writing custom tests. It introduces various interfaces provided by these objects and demonstrates how they can be leveraged to implement tests effortlessly."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "- [Load the demo dataset](#toc3__)    \n",
-    "  - [Prepocess the raw dataset](#toc3_1__)    \n",
-    "- [Train a model for testing](#toc4__)    \n",
-    "- [Explore basic components of the ValidMind library](#toc5__)    \n",
-    "  - [VMDataset Object](#toc5_1__)    \n",
-    "    - [Initialize the ValidMind datasets](#toc5_1_1__)    \n",
-    "    - [ Interfaces of the dataset object](#toc5_1_2__)    \n",
-    "  - [Using VM Dataset object as arguments in custom tests](#toc5_2__)    \n",
-    "    - [Run the test](#toc5_2_1__)    \n",
-    "  - [Using VM Dataset object and parameters as arguments in custom tests](#toc5_3__)    \n",
-    "  - [VMModel Object](#toc5_4__)    \n",
-    "  - [Initialize ValidMind model object](#toc5_5__)    \n",
-    "  - [Assign predictions to the datasets](#toc5_6__)    \n",
-    "  - [Using VM Model and Dataset objects as arguments in Custom tests](#toc5_7__)    \n",
-    "  - [Log the test results](#toc5_8__)    \n",
-    "- [In summary](#toc6__)    \n",
-    "- [Discover more learning resources](#toc7__)    \n",
-    "- [Upgrade ValidMind](#toc8__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models. You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "Here, we will focus on ValidMind dataset, ValidMind model and tests to use these objects to generate artefacts for the documentation.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "- **model**: A single ValidMind model object that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "- **dataset**: Single ValidMind dataset object that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "- **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "- **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Dataset based Test**\n",
-    "\n",
-    "![Dataset based test architecture](./dataset_image.png)\n",
-    "The dataset based tests take VM dataset object(s) as inputs, test configuration as test parameters to produce `Outputs` as mentioned above.\n",
-    "\n",
-    "**Model based Test**\n",
-    "\n",
-    "![Model based test architecture](./model_image.png)\n",
-    "Similar to datasest based tests, the model based tests as an additional input that is VM model object. It allows to identify prediction values of a specific model in the dataset object. "
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "Please note the following recommended Python versions to use:\n",
-    "\n",
-    "- Python 3.7 > x <= 3.11\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {
-    "metadata": {}
-   },
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%matplotlib inline\n",
-    "\n",
-    "import xgboost as xgb"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the demo dataset"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "raw_df = demo_dataset.load_data()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Prepocess the raw dataset"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df, validation_df, test_df = demo_dataset.preprocess(raw_df)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Train a model for testing\n",
-    "\n",
-    "We train a simple customer churn model for our test."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "x_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_train = train_df[demo_dataset.target_column]\n",
-    "x_val = validation_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_val = validation_df[demo_dataset.target_column]\n",
-    "\n",
-    "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
-    "model.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "model.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    "    eval_set=[(x_val, y_val)],\n",
-    "    verbose=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Explore basic components of the ValidMind library\n",
-    "\n",
-    "In this section, you will learn about the basic objects of the ValidMind library that are necessary to implement both custom and built-in tests. As explained above, these objects are:\n",
-    "* VMDataset: [The high level APIs can be found here](https://docs.validmind.ai/validmind/validmind/vm_models.html#VMDataset)\n",
-    "* VMModel: [The high level APIs can be found here](https://docs.validmind.ai/validmind/validmind/vm_models.html#VMModel)\n",
-    "\n",
-    "Let's understand these objects and their interfaces step by step: "
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### VMDataset Object"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1_1__'></a>\n",
-    "\n",
-    "#### Initialize the ValidMind datasets\n",
-    "\n",
-    "You can initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "The function wraps the dataset to create a ValidMind `Dataset` object so that you can write tests effectively using the common interface provided by the VM objects. This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind. You only need to do it one time per dataset.\n",
-    "\n",
-    "This function takes a number of arguments. Some of the arguments are:\n",
-    "\n",
-    "- `dataset` — the raw dataset that you want to provide as input to tests\n",
-    "- `input_id` - a unique identifier that allows tracking what inputs are used when running each individual test\n",
-    "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
-    "\n",
-    "The detailed list of the arguments can be found [here](https://docs.validmind.ai/validmind/validmind.html#init_dataset) "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# vm_raw_dataset is now a VMDataset object that you can pass to any ValidMind test\n",
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=raw_df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Once you have a ValidMind dataset object (VMDataset), you can inspect its attributes and methods using the inspect_obj utility module. This module provides a list of available attributes and interfaces for use in tests. Understanding how to use VMDatasets is crucial for comprehending how a custom test functions."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.utils import inspect_obj\n",
-    "inspect_obj(vm_raw_dataset)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1_2__'></a>\n",
-    "\n",
-    "####  Interfaces of the dataset object\n",
-    "\n",
-    "**DataFrame**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset.df"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "**Feature columns**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset.feature_columns"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "**Target column**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset.target_column"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "**Features values**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset.x_df()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "**Target value**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset.y_df()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "**Numeric feature columns** "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset.feature_columns_numeric"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "**Categorical feature columns** "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset.feature_columns_categorical"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Similarly, you can use all other interfaces of the [VMDataset objects](https://docs.validmind.ai/validmind/validmind/vm_models.html#VMDataset) "
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Using VM Dataset object as arguments in custom tests\n",
-    "\n",
-    "A custom test is simply a Python function that takes two types of arguments: `inputs` and `params`. The `inputs` are ValidMind objects (`VMDataset`, `VMModel`), and the `params` are additional parameters required for the underlying computation of the test. We will discuss both types of arguments in the following sections.\n",
-    "\n",
-    "Let's start with a custom test that requires only a ValidMind dataset object. In this example, we will check the balance of classes in the target column of the dataset:\n",
-    "\n",
-    "- The custom test below requires a single argument of type `VMDataset` (dataset).\n",
-    "- The `my_custom_tests.ClassImbalance` is a unique test identifier that can be assigned using the `vm.test` decorator functionality. This unique test ID will be used in the platform to load test results in the documentation.\n",
-    "- The `dataset.target_column` and `dataset.df` attributes of the `VMDataset` object are used in the test.\n",
-    "\n",
-    "Other high-level APIs (attributes and methods) of the dataset object are listed [here](https://docs.validmind.ai/validmind/validmind/vm_models.html#VMDataset).\n",
-    "\n",
-    "If you've gone through the [Implement custom tests notebook](../tests/custom_tests/implement_custom_tests.ipynb), you should have a good understanding of how custom tests are implemented in details. If you haven't, we recommend going through that notebook first."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.vm_models.dataset.dataset import VMDataset\n",
-    "import pandas as pd\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.ClassImbalance\")\n",
-    "def class_imbalance(dataset):\n",
-    "    # Can only run this test if we have a Dataset object\n",
-    "    if not isinstance(dataset, VMDataset):\n",
-    "        raise ValueError(\"ClassImbalance requires a validmind Dataset object\")\n",
-    "\n",
-    "    if dataset.target_column is None:\n",
-    "        print(\"Skipping class_imbalance test because no target column is defined\")\n",
-    "        return\n",
-    "\n",
-    "    # VMDataset object provides target_column attribute\n",
-    "    target_column = dataset.target_column\n",
-    "    # we can access pandas DataFrame using df attribute\n",
-    "    imbalance_percentages = dataset.df[target_column].value_counts(\n",
-    "        normalize=True\n",
-    "    )\n",
-    "    classes = list(imbalance_percentages.index) \n",
-    "    percentages = list(imbalance_percentages.values * 100)\n",
-    "\n",
-    "    return pd.DataFrame({\"Classes\":classes, \"Percentage\": percentages})"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2_1__'></a>\n",
-    "\n",
-    "#### Run the test\n",
-    "\n",
-    "Let's run the test using the `run_test` method, which is part of the `validmind.tests` module. Here, we pass the `dataset` through the `inputs`. Similarly, you can pass `datasets`, `model`, or `models` as inputs if your custom test requires them. In this example below, we run the custom test `my_custom_tests.ClassImbalance` by passing the `dataset` through the `inputs`. "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.tests import run_test\n",
-    "result = run_test(\n",
-    "    test_id=\"my_custom_tests.ClassImbalance\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset\n",
-    "    }\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You can move custom tests into separate modules in a folder. It allows you to take one-off tests and move them into an organized structure that makes it easier to manage, maintain and share them. We have provided a seperate notebook with detailed explaination [here](../tests/custom_tests/integrate_external_test_providers.ipynb) "
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_3__'></a>\n",
-    "\n",
-    "### Using VM Dataset object and parameters as arguments in custom tests\n",
-    "\n",
-    "Simlilar to `inputs`, you can pass `params` to a custom test by providing a dictionary of parameters to the `run_test()` function. The parameters will override any default parameters set in the custom test definition. Note that the `dataset` is still passed as `inputs`. \n",
-    "Let's modify the class imbalance test so that it provides flexibility to `normalize` the results."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.vm_models.dataset.dataset import VMDataset\n",
-    "import pandas as pd\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.ClassImbalance\")\n",
-    "def class_imbalance(dataset, normalize=True):\n",
-    "    # Can only run this test if we have a Dataset object\n",
-    "    if not isinstance(dataset, VMDataset):\n",
-    "        raise ValueError(\"ClassImbalance requires a validmind Dataset object\")\n",
-    "\n",
-    "    if dataset.target_column is None:\n",
-    "        print(\"Skipping class_imbalance test because no target column is defined\")\n",
-    "        return\n",
-    "\n",
-    "    # VMDataset object provides target_column attribute\n",
-    "    target_column = dataset.target_column\n",
-    "    # we can access pandas DataFrame using df attribute\n",
-    "    imbalance_percentages = dataset.df[target_column].value_counts(\n",
-    "        normalize=normalize\n",
-    "    )\n",
-    "    classes = list(imbalance_percentages.index) \n",
-    "    if normalize:  \n",
-    "        result = pd.DataFrame({\"Classes\":classes, \"Percentage\": list(imbalance_percentages.values*100)})\n",
-    "    else:\n",
-    "        result = pd.DataFrame({\"Classes\":classes, \"Count\": list(imbalance_percentages.values)})\n",
-    "    return result"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "In this example, the `normalize` parameter is set to `False`, so the class counts will not be normalized. You can change the value to `True` if you want the counts to be normalized. The results of the test will reflect this flexibility, allowing for different outputs based on the parameter passed.\n",
-    "\n",
-    "Here, we have passed the `dataset` through the `inputs` and the `normalize` parameter using the `params`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.tests import run_test\n",
-    "result = run_test(\n",
-    "    test_id = \"my_custom_tests.ClassImbalance\",\n",
-    "    inputs={\"dataset\": vm_raw_dataset},\n",
-    "    params={\"normalize\": True},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_4__'></a>\n",
-    "\n",
-    "### VMModel Object"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_5__'></a>\n",
-    "\n",
-    "### Initialize ValidMind model object\n",
-    "\n",
-    "Similar to ValidMind `Dataset` object, you can initialize a ValidMind Model object using the [`init_model`](https://docs.validmind.ai/validmind/validmind.html#init_model) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments. Some of the arguments are:\n",
-    "\n",
-    "- `model` — the raw model that you want evaluate\n",
-    "- `input_id` - a unique identifier that allows tracking what inputs are used when running each individual test\n",
-    "\n",
-    "The detailed list of the arguments can be found [here](https://docs.validmind.ai/validmind/validmind.html#init_model) "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "vm_model = vm.init_model(\n",
-    "    model=model,\n",
-    "    input_id=\"xgb_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let's inspect the methods and attributes of the model now:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "inspect_obj(vm_model)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_6__'></a>\n",
-    "\n",
-    "### Assign predictions to the datasets\n",
-    "\n",
-    "We can now use the `assign_predictions()` method from the `Dataset` object to link existing predictions to any model. If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset\",\n",
-    "    dataset=train_df,\n",
-    "    type=\"generic\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds.assign_predictions(model=vm_model)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You can see below, the extra prediction column (`xgb_model_prediction`) for the model (`xgb_model`) has been added in the dataset."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(vm_train_ds)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_7__'></a>\n",
-    "\n",
-    "### Using VM Model and Dataset objects as arguments in Custom tests\n",
-    "\n",
-    "We will now create a `@vm.test` wrapper that will allow you to create a reusable test. Note the following changes in the code below:\n",
-    "\n",
-    "- The function `confusion_matrix` takes two arguments `dataset` and `model`. This is a `VMDataset` and `VMModel` object respectively.\n",
-    "  - `VMDataset` objects allow you to access the dataset's true (target) values by accessing the `.y` attribute.\n",
-    "  - `VMDataset` objects allow you to access the predictions for a given model by accessing the `.y_pred()` method.\n",
-    "- The function docstring provides a description of what the test does. This will be displayed along with the result in this notebook as well as in the ValidMind Platform.\n",
-    "- The function body calculates the confusion matrix using the `sklearn.tests.confusion_matrix` function as we just did above.\n",
-    "- The function then returns the `ConfusionMatrixDisplay.figure_` object - this is important as the ValidMind Library expects the output of the custom test to be a plot or a table.\n",
-    "- The `@vm.test` decorator is doing the work of creating a wrapper around the function that will allow it to be run by the ValidMind Library. It also registers the test so it can be found by the ID `my_custom_tests.ConfusionMatrix` (see the section below on how test IDs work in ValidMind and why this format is important)\n",
-    "\n",
-    "Similarly, you can use the functinality provided by `VMDataset` and `VMModel` objects. You can refer our documentation page for all the avalialble APIs [here](https://docs.validmind.ai/validmind/validmind.html#init_dataset)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn import metrics\n",
-    "import matplotlib.pyplot as plt\n",
-    "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
-    "def confusion_matrix(dataset, model):\n",
-    "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
-    "\n",
-    "    The confusion matrix is a 2x2 table that contains 4 values:\n",
-    "\n",
-    "    - True Positive (TP): the number of correct positive predictions\n",
-    "    - True Negative (TN): the number of correct negative predictions\n",
-    "    - False Positive (FP): the number of incorrect positive predictions\n",
-    "    - False Negative (FN): the number of incorrect negative predictions\n",
-    "\n",
-    "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
-    "    \"\"\"\n",
-    "    # we can retrieve traget value from dataset which is y attribute\n",
-    "    y_true = dataset.y\n",
-    "    # The prediction value of a specific model using y_pred method \n",
-    "    y_pred = dataset.y_pred(model=model)\n",
-    "\n",
-    "    confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
-    "\n",
-    "    cm_display = metrics.ConfusionMatrixDisplay(\n",
-    "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
-    "    )\n",
-    "    cm_display.plot()\n",
-    "    plt.close()\n",
-    "\n",
-    "    return cm_display.figure_  # return the figure object itself"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Here, we run test using two inputs; `dataset` and `model`. "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.tests import run_test\n",
-    "result = run_test(\n",
-    "    test_id = \"my_custom_tests.ConfusionMatrix\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_train_ds,\n",
-    "        \"model\": vm_model,\n",
-    "    }\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_8__'></a>\n",
-    "\n",
-    "### Log the test results\n",
-    "\n",
-    "You can log any test result to the ValidMind Platform with the `.log()` method of the result object. This will allow you to add the result to the documentation.\n",
-    "\n",
-    "You can now do the same for the confusion matrix results."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this notebook you have learned the end-to-end process to document a model with the ValidMind Library, running through some very common scenarios in a typical model development setting:\n",
-    "\n",
-    "- Running out-of-the-box tests\n",
-    "- Documenting your model by adding evidence to model documentation\n",
-    "- Extending the capabilities of the ValidMind Library by implementing custom tests\n",
-    "- Ensuring that the documentation is complete by running all tests in the documentation template"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-9be1890525a54c10be782f80fe33833f",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "Python 3",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.14"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Introduction to ValidMind Dataset and Model Objects\n",
+        "\n",
+        "When writing custom tests, it is essential to be aware of the interfaces of the ValidMind Dataset and ValidMind Model, which are used as input arguments.\n",
+        "\n",
+        "As a model developer, writing custom tests is beneficial when the ValidMind library lacks a built-in test for your specific needs. For example, a model might require new tests to evaluate specific aspects of the model or dataset based on a particular use case.\n",
+        "\n",
+        "This interactive notebook offers a detailed understanding of ValidMind objects and their use in writing custom tests. It introduces various interfaces provided by these objects and demonstrates how they can be leveraged to implement tests effortlessly."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "- [Load the demo dataset](#toc3__)    \n",
+        "  - [Preprocess the raw dataset](#toc3_1__)    \n",
+        "- [Train a model for testing](#toc4__)    \n",
+        "- [Explore basic components of the ValidMind library](#toc5__)    \n",
+        "  - [VMDataset Object](#toc5_1__)    \n",
+        "    - [Initialize the ValidMind datasets](#toc5_1_1__)    \n",
+        "    - [ Interfaces of the dataset object](#toc5_1_2__)    \n",
+        "  - [Using VM Dataset object as arguments in custom tests](#toc5_2__)    \n",
+        "    - [Run the test](#toc5_2_1__)    \n",
+        "  - [Using VM Dataset object and parameters as arguments in custom tests](#toc5_3__)    \n",
+        "  - [VMModel Object](#toc5_4__)    \n",
+        "  - [Initialize ValidMind model object](#toc5_5__)    \n",
+        "  - [Assign predictions to the datasets](#toc5_6__)    \n",
+        "  - [Using VM Model and Dataset objects as arguments in Custom tests](#toc5_7__)    \n",
+        "  - [Log the test results](#toc5_8__)    \n",
+        "- [In summary](#toc6__)    \n",
+        "- [Discover more learning resources](#toc7__)    \n",
+        "- [Upgrade ValidMind](#toc8__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models. You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        " - **dataset-based test**\n",
+        "\n",
+        "    ![Dataset based test architecture](./dataset_image.png)\n",
+        "    Dataset-based tests take VM dataset objects as inputs, can be configured with values passed in as parameters, and return outputs such as tables, plots, or images.\n",
+        "\n",
+        " - **model-based test**:\n",
+        "\n",
+        "    ![Model based test architecture](./model_image.png)\n",
+        "    Similar to dataset-based tests, model-based tests take additional VM model objects as inputs alongside VM dataset objects. The VM model object can wrap any type of record and is used to obtain prediction values for entries in the dataset.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [test_suites](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "Please note the following recommended Python versions to use:\n",
+        "\n",
+        "- Python 3.7 < x <= 3.11\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "metadata": {}
+      },
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%matplotlib inline\n",
+        "\n",
+        "import xgboost as xgb"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the demo dataset"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "raw_df = demo_dataset.load_data()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Preprocess the raw dataset"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df, validation_df, test_df = demo_dataset.preprocess(raw_df)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Train a model for testing\n",
+        "\n",
+        "We train a simple customer churn model for our test."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "x_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_train = train_df[demo_dataset.target_column]\n",
+        "x_val = validation_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_val = validation_df[demo_dataset.target_column]\n",
+        "\n",
+        "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
+        "model.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "model.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        "    eval_set=[(x_val, y_val)],\n",
+        "    verbose=False,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Explore basic components of the ValidMind library\n",
+        "\n",
+        "In this section, you will learn about the basic objects of the ValidMind library that are necessary to implement both custom and built-in tests. As explained above, these objects are:\n",
+        "* VMDataset: [The high level APIs can be found here](https://docs.validmind.ai/validmind/validmind/vm_models.html#VMDataset)\n",
+        "* VMModel: [The high level APIs can be found here](https://docs.validmind.ai/validmind/validmind/vm_models.html#VMModel)\n",
+        "\n",
+        "Let's understand these objects and their interfaces step by step: "
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### VMDataset Object"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_1__'></a>\n",
+        "\n",
+        "#### Initialize the ValidMind datasets\n",
+        "\n",
+        "You can initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "The function wraps the dataset to create a ValidMind `Dataset` object so that you can write tests effectively using the common interface provided by the VM objects. This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind. You only need to do it one time per dataset.\n",
+        "\n",
+        "This function takes a number of arguments. Some of the arguments are:\n",
+        "\n",
+        "- `dataset` — the raw dataset that you want to provide as input to tests\n",
+        "- `input_id` - a unique identifier that allows tracking what inputs are used when running each individual test\n",
+        "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
+        "\n",
+        "The detailed list of the arguments can be found [here](https://docs.validmind.ai/validmind/validmind.html#init_dataset) "
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# vm_raw_dataset is now a VMDataset object that you can pass to any ValidMind test\n",
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=raw_df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Once you have a ValidMind dataset object (`VMDataset`), you can inspect its attributes and methods using the `inspect_obj` utility function from `validmind.utils`. This function provides a list of available attributes and interfaces for use in tests. Understanding how to use `VMDataset` objects is crucial for comprehending how a custom test functions."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.utils import inspect_obj\n",
+        "inspect_obj(vm_raw_dataset)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_2__'></a>\n",
+        "\n",
+        "####  Interfaces of the dataset object\n",
+        "\n",
+        "**DataFrame**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset.df"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "**Feature columns**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset.feature_columns"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "**Target column**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset.target_column"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "**Feature values**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset.x_df()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "**Target value**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset.y_df()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "**Numeric feature columns** "
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset.feature_columns_numeric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "**Categorical feature columns** "
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset.feature_columns_categorical"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Similarly, you can use all other interfaces of the [VMDataset objects](https://docs.validmind.ai/validmind/validmind/vm_models.html#VMDataset) "
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Using VM Dataset object as arguments in custom tests\n",
+        "\n",
+        "A custom test is simply a Python function that takes two types of arguments: `inputs` and `params`. The `inputs` are ValidMind objects (`VMDataset`, `VMModel`), and the `params` are additional parameters required for the underlying computation of the test. We will discuss both types of arguments in the following sections.\n",
+        "\n",
+        "Let's start with a custom test that requires only a ValidMind dataset object. In this example, we will check the balance of classes in the target column of the dataset:\n",
+        "\n",
+        "- The custom test below requires a single argument of type `VMDataset` (dataset).\n",
+        "- The `my_custom_tests.ClassImbalance` is a unique test identifier that can be assigned using the `vm.test` decorator functionality. This unique test ID will be used in the platform to load test results in the documentation.\n",
+        "- The `dataset.target_column` and `dataset.df` attributes of the `VMDataset` object are used in the test.\n",
+        "\n",
+        "Other high-level APIs (attributes and methods) of the dataset object are listed [here](https://docs.validmind.ai/validmind/validmind/vm_models.html#VMDataset).\n",
+        "\n",
+        "If you've gone through the [Implement custom tests notebook](../tests/custom_tests/implement_custom_tests.ipynb), you should have a good understanding of how custom tests are implemented in detail. If you haven't, we recommend going through that notebook first."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.vm_models.dataset.dataset import VMDataset\n",
+        "import pandas as pd\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.ClassImbalance\")\n",
+        "def class_imbalance(dataset):\n",
+        "    # Can only run this test if we have a Dataset object\n",
+        "    if not isinstance(dataset, VMDataset):\n",
+        "        raise ValueError(\"ClassImbalance requires a validmind Dataset object\")\n",
+        "\n",
+        "    if dataset.target_column is None:\n",
+        "        print(\"Skipping class_imbalance test because no target column is defined\")\n",
+        "        return\n",
+        "\n",
+        "    # VMDataset object provides target_column attribute\n",
+        "    target_column = dataset.target_column\n",
+        "    # we can access pandas DataFrame using df attribute\n",
+        "    imbalance_percentages = dataset.df[target_column].value_counts(\n",
+        "        normalize=True\n",
+        "    )\n",
+        "    classes = list(imbalance_percentages.index) \n",
+        "    percentages = list(imbalance_percentages.values * 100)\n",
+        "\n",
+        "    return pd.DataFrame({\"Classes\":classes, \"Percentage\": percentages})"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2_1__'></a>\n",
+        "\n",
+        "#### Run the test\n",
+        "\n",
+        "Let's run the test using the `run_test` method, which is part of the `validmind.tests` module. Here, we pass the `dataset` through the `inputs`. Similarly, you can pass `datasets`, `model`, or `models` as inputs if your custom test requires them. In this example below, we run the custom test `my_custom_tests.ClassImbalance` by passing the `dataset` through the `inputs`. "
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.tests import run_test\n",
+        "result = run_test(\n",
+        "    test_id=\"my_custom_tests.ClassImbalance\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset\n",
+        "    }\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You can move custom tests into separate modules in a folder. This allows you to take one-off tests and move them into an organized structure that makes it easier to manage, maintain and share them. We have provided a separate notebook with a detailed explanation [here](../tests/custom_tests/integrate_external_test_providers.ipynb) "
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_3__'></a>\n",
+        "\n",
+        "### Using VM Dataset object and parameters as arguments in custom tests\n",
+        "\n",
+        "Similar to `inputs`, you can pass `params` to a custom test by providing a dictionary of parameters to the `run_test()` function. The parameters will override any default parameters set in the custom test definition. Note that the `dataset` is still passed as `inputs`. \n",
+        "Let's modify the class imbalance test so that it provides flexibility to `normalize` the results."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.vm_models.dataset.dataset import VMDataset\n",
+        "import pandas as pd\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.ClassImbalance\")\n",
+        "def class_imbalance(dataset, normalize=True):\n",
+        "    # Can only run this test if we have a Dataset object\n",
+        "    if not isinstance(dataset, VMDataset):\n",
+        "        raise ValueError(\"ClassImbalance requires a validmind Dataset object\")\n",
+        "\n",
+        "    if dataset.target_column is None:\n",
+        "        print(\"Skipping class_imbalance test because no target column is defined\")\n",
+        "        return\n",
+        "\n",
+        "    # VMDataset object provides target_column attribute\n",
+        "    target_column = dataset.target_column\n",
+        "    # we can access pandas DataFrame using df attribute\n",
+        "    imbalance_percentages = dataset.df[target_column].value_counts(\n",
+        "        normalize=normalize\n",
+        "    )\n",
+        "    classes = list(imbalance_percentages.index) \n",
+        "    if normalize:  \n",
+        "        result = pd.DataFrame({\"Classes\":classes, \"Percentage\": list(imbalance_percentages.values*100)})\n",
+        "    else:\n",
+        "        result = pd.DataFrame({\"Classes\":classes, \"Count\": list(imbalance_percentages.values)})\n",
+        "    return result"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "In this example, the `normalize` parameter is set to `True`, so the class counts are normalized and reported as percentages. You can change the value to `False` if you want the raw class counts instead. The results of the test will reflect this flexibility, allowing for different outputs based on the parameter passed.\n",
+        "\n",
+        "Here, we have passed the `dataset` through the `inputs` and the `normalize` parameter using the `params`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.tests import run_test\n",
+        "result = run_test(\n",
+        "    test_id = \"my_custom_tests.ClassImbalance\",\n",
+        "    inputs={\"dataset\": vm_raw_dataset},\n",
+        "    params={\"normalize\": True},\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_4__'></a>\n",
+        "\n",
+        "### VMModel Object"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_5__'></a>\n",
+        "\n",
+        "### Initialize ValidMind model object\n",
+        "\n",
+        "Similar to the ValidMind `Dataset` object, you can initialize a ValidMind Model object using the [`init_model`](https://docs.validmind.ai/validmind/validmind.html#init_model) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments. Some of the arguments are:\n",
+        "\n",
+        "- `model` — the raw model that you want to evaluate\n",
+        "- `input_id` — a unique identifier that allows tracking what inputs are used when running each individual test\n",
+        "\n",
+        "The detailed list of the arguments can be found [here](https://docs.validmind.ai/validmind/validmind.html#init_model) "
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "vm_model = vm.init_model(\n",
+        "    model=model,\n",
+        "    input_id=\"xgb_model\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's inspect the methods and attributes of the model now:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "inspect_obj(vm_model)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_6__'></a>\n",
+        "\n",
+        "### Assign predictions to the datasets\n",
+        "\n",
+        "We can now use the `assign_predictions()` method from the `Dataset` object to link existing predictions to any model. If no prediction values are passed, the method will compute predictions automatically:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset\",\n",
+        "    dataset=train_df,\n",
+        "    type=\"generic\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds.assign_predictions(model=vm_model)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "As you can see below, the extra prediction column (`xgb_model_prediction`) for the model (`xgb_model`) has been added to the dataset."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "print(vm_train_ds)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_7__'></a>\n",
+        "\n",
+        "### Using VM Model and Dataset objects as arguments in Custom tests\n",
+        "\n",
+        "We will now create a `@vm.test` wrapper that will allow you to create a reusable test. Note the following changes in the code below:\n",
+        "\n",
+        "- The function `confusion_matrix` takes two arguments, `dataset` and `model`. These are a `VMDataset` and a `VMModel` object, respectively.\n",
+        "  - `VMDataset` objects allow you to access the dataset's true (target) values by accessing the `.y` attribute.\n",
+        "  - `VMDataset` objects allow you to access the predictions for a given model by calling the `.y_pred()` method.\n",
+        "- The function docstring provides a description of what the test does. This will be displayed along with the result in this notebook as well as in the ValidMind Platform.\n",
+        "- The function body calculates the confusion matrix using the `sklearn.metrics.confusion_matrix` function as we just did above.\n",
+        "- The function then returns the `ConfusionMatrixDisplay.figure_` object - this is important as the ValidMind Library expects the output of the custom test to be a plot or a table.\n",
+        "- The `@vm.test` decorator is doing the work of creating a wrapper around the function that will allow it to be run by the ValidMind Library. It also registers the test so it can be found by the ID `my_custom_tests.ConfusionMatrix` (see the section below on how test IDs work in ValidMind and why this format is important)\n",
+        "\n",
+        "Similarly, you can use the functionality provided by `VMDataset` and `VMModel` objects. You can refer to our documentation page for all the available APIs [here](https://docs.validmind.ai/validmind/validmind.html#init_dataset)"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from sklearn import metrics\n",
+        "import matplotlib.pyplot as plt\n",
+        "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
+        "def confusion_matrix(dataset, model):\n",
+        "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
+        "\n",
+        "    The confusion matrix is a 2x2 table that contains 4 values:\n",
+        "\n",
+        "    - True Positive (TP): the number of correct positive predictions\n",
+        "    - True Negative (TN): the number of correct negative predictions\n",
+        "    - False Positive (FP): the number of incorrect positive predictions\n",
+        "    - False Negative (FN): the number of incorrect negative predictions\n",
+        "\n",
+        "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
+        "    \"\"\"\n",
+        "    # we can retrieve the target values from the dataset using the y attribute\n",
+        "    y_true = dataset.y\n",
+        "    # The prediction value of a specific model using y_pred method \n",
+        "    y_pred = dataset.y_pred(model=model)\n",
+        "\n",
+        "    confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
+        "\n",
+        "    cm_display = metrics.ConfusionMatrixDisplay(\n",
+        "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
+        "    )\n",
+        "    cm_display.plot()\n",
+        "    plt.close()\n",
+        "\n",
+        "    return cm_display.figure_  # return the figure object itself"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Here, we run the test using two inputs: `dataset` and `model`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.tests import run_test\n",
+        "result = run_test(\n",
+        "    test_id = \"my_custom_tests.ConfusionMatrix\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_train_ds,\n",
+        "        \"model\": vm_model,\n",
+        "    }\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_8__'></a>\n",
+        "\n",
+        "### Log the test results\n",
+        "\n",
+        "You can log any test result to the ValidMind Platform with the `.log()` method of the result object. This will allow you to add the result to the documentation.\n",
+        "\n",
+        "You can now do the same for the confusion matrix results."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this notebook you have learned the end-to-end process to document a model with the ValidMind Library, running through some very common scenarios in a typical model development setting:\n",
+        "\n",
+        "- Running out-of-the-box tests\n",
+        "- Documenting your model by adding evidence to model documentation\n",
+        "- Extending the capabilities of the ValidMind Library by implementing custom tests\n",
+        "- Ensuring that the documentation is complete by running all tests in the documentation template"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-9be1890525a54c10be782f80fe33833f"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "Python 3",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.14"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/how_to/metrics/log_metrics_over_time.ipynb b/site/notebooks/how_to/metrics/log_metrics_over_time.ipynb
index 4722eeed69..7e8d1faef8 100644
--- a/site/notebooks/how_to/metrics/log_metrics_over_time.ipynb
+++ b/site/notebooks/how_to/metrics/log_metrics_over_time.ipynb
@@ -1,959 +1,975 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Log metrics over time\n",
-    "\n",
-    "Learn how to track and visualize the temporal evolution of key model performance metrics with ValidMind.\n",
-    "\n",
-    "- Key model performance metrics such as AUC, F1 score, precision, recall, and accuracy, are useful for analyzing the stability and trends in model performance indicators, helping to identify potential degradation or unexpected fluctuations in model behavior over time.\n",
-    "- By monitoring these metrics systematically, teams can detect early warning signs of model drift and take proactive measures to maintain model reliability.\n",
-    "- Unit metrics in ValidMind provide a standardized way to compute and track individual performance measures, making it easy to monitor specific aspects of model behavior.\n",
-    "\n",
-    "Log metrics over time with the ValidMind Library's [`log_metric()`](https://docs.validmind.ai/validmind/validmind.html#log_metric) function and visualize them in your documentation using the *Metric Over Time* block within the ValidMind Platform. This integration enables seamless tracking of model performance, supporting custom thresholds and facilitating the automation of alerts based on logged metrics.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Metrics over time are most commonly associated with the continued monitoring of a model's performance once it is deployed.</b></span>\n",
-    "<br></br>\n",
-    "While you are able to add Metric Over Time blocks to model documentation, we recommend first <a href=\"https://docs.validmind.ai/guide/monitoring/enable-monitoring.html\" style=\"color: #DE257E;\"><b>enabling ongoing monitoring</b></a> for your model to maximize the potential of your performance data.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_3__)    \n",
-    "- [Load demo model](#toc3__)    \n",
-    "- [Log metrics](#toc4__)    \n",
-    "  - [Run unit metrics](#toc4_1__)    \n",
-    "  - [Log unit metrics over time](#toc4_2__)    \n",
-    "  - [Pass thresholds](#toc4_3__)    \n",
-    "  - [Log multiple metrics with custom thresholds](#toc4_4__)    \n",
-    "  - [Add acceptable performance flag](#toc4_5__)    \n",
-    "- [Next steps](#toc5__)    \n",
-    "  - [Work with your model documentation](#toc5_1__)    \n",
-    "  - [Discover more learning resources](#toc5_2__)    \n",
-    "- [Upgrade ValidMind](#toc6__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "- **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "- **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "- **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "- **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: The [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 3,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost as xgb\n",
-    "import numpy as np\n",
-    "\n",
-    "from datetime import datetime, timedelta\n",
-    "\n",
-    "from validmind.unit_metrics import list_metrics, describe_metric, run_metric\n",
-    "from validmind.api_client import log_metric\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load demo model\n",
-    "\n",
-    "We'll use a classification model trained on customer churn data to demonstrate ValidMind's metric logging capabilities.\n",
-    "\n",
-    "- We'll employ a built-in classification dataset, process it through train-validation-test splits, and train an XGBoost classifier.\n",
-    "- The trained model and datasets are then initialized in ValidMind's framework, enabling us to track and monitor various performance metrics in the following sections."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the sample dataset from the library\n",
-    "\n",
-    "from validmind.datasets.classification import customer_churn\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{customer_churn.target_column}' \\n\\t• Class labels: {customer_churn.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = customer_churn.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)\n",
-    "\n",
-    "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_train = train_df[customer_churn.target_column]\n",
-    "x_val = validation_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_val = validation_df[customer_churn.target_column]\n",
-    "\n",
-    "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
-    "model.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "model.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    "    eval_set=[(x_val, y_val)],\n",
-    "    verbose=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Once the datasets and model are prepared for validation, let's initialize the ValidMind `dataset` and `model`, specifying features and targets columns.\n",
-    "\n",
-    "- The property `input_id` allows users to uniquely identify each dataset and model.\n",
-    "- This allows for the creation of multiple versions of datasets and models, enabling us to compute metrics by specifying which versions we want to use as inputs."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 9,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=raw_df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    "    class_labels=customer_churn.class_labels,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df, input_id=\"test_dataset\", target_column=customer_churn.target_column\n",
-    ")\n",
-    "\n",
-    "vm_model = vm.init_model(\n",
-    "    model,\n",
-    "    input_id=\"model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "We can now use the `assign_predictions()` method from the Dataset object to link existing predictions to any model. \n",
-    "\n",
-    "If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Log metrics\n",
-    "\n",
-    "Next, we'll use ValidMind to track the temporal evolution of key model performance metrics.\n",
-    "\n",
-    "We'll set appropriate thresholds for each metric, enable automated alerting when performance drifts beyond acceptable boundaries, and demonstrate how these thresholds can be customized based on business requirements and risk tolerance levels."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "metrics = [metric for metric in list_metrics() if \"classification\" in metric]\n",
-    "\n",
-    "for metric_id in metrics:\n",
-    "    describe_metric(metric_id)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Run unit metrics\n",
-    "\n",
-    "Compute individual metrics using ValidMind's *unit metrics* — single-value metrics that can be computed on a dataset and model. Use the `run_metric()` function from the `validmind.unit_metrics` module to calculate these metrics.\n",
-    "\n",
-    "The `run_metric()` function has a signature similar to `run_test()` from the `validmind.tests` module, but is specifically designed for unit metrics and takes the following arguments:\n",
-    "\n",
-    "- **`metric_id`:** The unique identifier for the metric (for example, `validmind.unit_metrics.classification.ROC_AUC`)\n",
-    "- **`inputs`:** A dictionary containing the input dataset and model or their respective input IDs\n",
-    "- **`params`:** A dictionary containing keyword arguments for the unit metric (optional, accepts any `kwargs` from the underlying sklearn implementation)\n",
-    "\n",
-    "`run_metric()` returns and displays a result object similar to a regular ValidMind test, but only shows the unit metric value. While this result object has a `.log()` method for logging to the ValidMind Platform, in this use case we'll use unit metrics to compute performance metrics and then log them over time using the `log_metric()` function from the `validmind.api_client` module."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_metric(\n",
-    "    \"validmind.unit_metrics.classification.ROC_AUC\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_model,\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "    },\n",
-    ")\n",
-    "auc = result.metric"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_metric(\n",
-    "    \"validmind.unit_metrics.classification.Accuracy\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_model,\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "    },\n",
-    ")\n",
-    "accuracy = result.metric"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_metric(\n",
-    "    \"validmind.unit_metrics.classification.Recall\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_model,\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "    },\n",
-    ")\n",
-    "recall = result.metric"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "f1 = run_metric(\n",
-    "    \"validmind.unit_metrics.classification.F1\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_model,\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "    },\n",
-    ")\n",
-    "f1 = result.metric"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "precision = run_metric(\n",
-    "    \"validmind.unit_metrics.classification.Precision\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_model,\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "    },\n",
-    ")\n",
-    "precision = result.metric"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Log unit metrics over time\n",
-    "\n",
-    "Using the `log_metric()` function from the `validmind.api_client` module, let's log the unit metrics over time. This function takes the following arguments:\n",
-    "\n",
-    "- **`key`:** The name of the metric to log\n",
-    "- **`value`:** The value of the metric to log\n",
-    "- **`recorded_at`:** The timestamp of the metric to log — useful for logging historic predictions\n",
-    "- **`thresholds`:** A dictionary containing the thresholds for the metric to log\n",
-    "- **`params`:** A dictionary containing the keyword arguments for the unit metric (in this case, none are required, but we can pass any `kwargs` that the underlying sklearn implementation accepts)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "log_metric(\n",
-    "    key=\"AUC Score\",\n",
-    "    value=auc,\n",
-    "    # If `recorded_at` is not included, the time at function run is logged\n",
-    "    recorded_at=datetime(2024, 1, 1), \n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "To visualize the logged metric, we'll use the **[Metrics Over Time block](https://docs.validmind.ai/guide/monitoring/work-with-metrics-over-time.html)** in the ValidMind Platform:\n",
-    "\n",
-    "- After adding this visualization block to your documentation or ongoing monitoring report (as shown in the image below), you'll be able to review your logged metrics plotted over time.\n",
-    "- In this example, since we've only logged a single data point, the visualization shows just one measurement.\n",
-    "- As you continue logging metrics, the graph will populate with more points, enabling you to track trends and patterns.\n",
-    "\n",
-    "![Metric Over Time block](./add_metric_over_time_block.png)\n",
-    "![AUC Score](./log_metric_auc_1.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3__'></a>\n",
-    "\n",
-    "### Pass thresholds\n",
-    "\n",
-    "We can pass *thresholds* to the `log_metric()` function to enhance the metric over time: \n",
-    "\n",
-    "- This is useful for visualizing the metric over time and identifying potential issues. \n",
-    "- The metric visualization component provides a dynamic way to monitor and contextualize metric values through customizable thresholds. \n",
-    "- These thresholds appear as horizontal reference lines on the chart. \n",
-    "- The system always displays the most recent threshold configuration, meaning that if you update threshold values in your client application, the visualization will reflect these changes immediately. \n",
-    "\n",
-    "When a metric is logged without thresholds or with an empty threshold dictionary, the reference lines gracefully disappear from the chart, though the metric line itself remains visible. \n",
-    "\n",
-    "Thresholds are highly flexible in their implementation. You can define them with any meaningful key names (such as `low_risk`, `maximum`, `target`, or `acceptable_range`) in your metric data, and the visualization will adapt accordingly. "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "log_metric(\n",
-    "    key=\"AUC Score\",\n",
-    "    value=auc,\n",
-    "    recorded_at=datetime(2024, 1, 1),\n",
-    "    thresholds={\n",
-    "        \"min_auc\": 0.7,\n",
-    "    }\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "![AUC Score](./log_metric_auc_2.png)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "log_metric(\n",
-    "    key=\"AUC Score\",\n",
-    "    value=auc,\n",
-    "    recorded_at=datetime(2024, 1, 1),\n",
-    "    thresholds={\n",
-    "        \"high_risk\": 0.6,\n",
-    "        \"medium_risk\": 0.7,\n",
-    "        \"low_risk\": 0.8,\n",
-    "    }\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "![AUC Score](./log_metric_auc_3.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4__'></a>\n",
-    "\n",
-    "### Log multiple metrics with custom thresholds\n",
-    "\n",
-    "The following code snippet shows an example of how to set up and log multiple performance metrics with custom thresholds for each metric:\n",
-    "\n",
-    "- Using AUC, F1, Precision, Recall, and Accuracy scores as examples, it demonstrates how to define different risk levels (high, medium, low) appropriate for each metric's expected range.\n",
-    "- The code simulates 10 days of metric history by applying a gradual decay and random noise to help visualize how metrics might drift over time in a production environment."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "NUM_DAYS = 10\n",
-    "REFERENCE_DATE = datetime(2024, 1, 1)  # Fixed date: January 1st, 2024\n",
-    "base_date = REFERENCE_DATE - timedelta(days=NUM_DAYS)\n",
-    "\n",
-    "# Initial values with their specific thresholds\n",
-    "performance_metrics = {\n",
-    "    \"AUC Score\": {\n",
-    "        \"value\": auc,\n",
-    "        \"thresholds\": {\n",
-    "            \"high_risk\": 0.7,\n",
-    "            \"medium_risk\": 0.8,\n",
-    "            \"low_risk\": 0.9,\n",
-    "        }\n",
-    "    },\n",
-    "    \"F1 Score\": {\n",
-    "        \"value\": f1,\n",
-    "        \"thresholds\": {\n",
-    "            \"high_risk\": 0.5,\n",
-    "            \"medium_risk\": 0.6,\n",
-    "            \"low_risk\": 0.7,\n",
-    "        }\n",
-    "    },\n",
-    "    \"Precision Score\": {\n",
-    "        \"value\": precision,\n",
-    "        \"thresholds\": {\n",
-    "            \"high_risk\": 0.6,\n",
-    "            \"medium_risk\": 0.7,\n",
-    "            \"low_risk\": 0.8,\n",
-    "        }\n",
-    "    },\n",
-    "    \"Recall Score\": {\n",
-    "        \"value\": recall,\n",
-    "        \"thresholds\": {\n",
-    "            \"high_risk\": 0.4,\n",
-    "            \"medium_risk\": 0.5,\n",
-    "            \"low_risk\": 0.6,\n",
-    "        }\n",
-    "    },\n",
-    "    \"Accuracy Score\": {\n",
-    "        \"value\": accuracy,\n",
-    "        \"thresholds\": {\n",
-    "            \"high_risk\": 0.75,\n",
-    "            \"medium_risk\": 0.8,\n",
-    "            \"low_risk\": 0.85,\n",
-    "        }\n",
-    "    }\n",
-    "}\n",
-    "\n",
-    "# Trend parameters\n",
-    "trend_factor = 0.98  # Slight downward trend\n",
-    "noise_scale = 0.02   # Random fluctuation of ±2%\n",
-    "\n",
-    "for i in range(NUM_DAYS):\n",
-    "    recorded_at = base_date + timedelta(days=i)\n",
-    "    print(f\"\\nrecorded_at: {recorded_at}\")\n",
-    "\n",
-    "    # Log each metric with trend and noise\n",
-    "    for metric_name, metric_info in performance_metrics.items():\n",
-    "        base_value = metric_info[\"value\"]\n",
-    "        thresholds = metric_info[\"thresholds\"]\n",
-    "        \n",
-    "        # Apply trend and add random noise\n",
-    "        trend = base_value * (trend_factor ** i)\n",
-    "        noise = np.random.normal(0, noise_scale * base_value)\n",
-    "        value = max(0, min(1, trend + noise))  # Ensure value stays between 0 and 1\n",
-    "        \n",
-    "        log_metric(\n",
-    "            key=metric_name,\n",
-    "            value=value,\n",
-    "            recorded_at=recorded_at.isoformat(),\n",
-    "            thresholds=thresholds\n",
-    "        )\n",
-    "        \n",
-    "        print(f\"{metric_name:<15}: {value:.4f} (Thresholds: {thresholds})\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "![AUC Score](./log_metric_auc_4.png)\n",
-    "![Accuracy Score](./log_metric_accuracy.png)\n",
-    "![Precision Score](./log_metric_precision.png)\n",
-    "![Recall Score](./log_metric_recall.png)\n",
-    "![F1 Score](./log_metric_f1.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_5__'></a>\n",
-    "\n",
-    "### Add acceptable performance flag\n",
-    "\n",
-    "The `passed` parameter in the `log_metric()` function allows you to explicitly mark whether a specific metric value should be considered \"Satisfactory\" or \"Requires Attention\":\n",
-    "   - When `passed=True`: A green \"Satisfactory\" badge appears on the chart, indicating the metric value meets your acceptance criteria.\n",
-    "   - When `passed=False`: A yellow \"Requires Attention\" badge appears, highlighting potential concerns that may require investigation."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "In the example below, the `passed=True` parameter adds a green \"Satisfactory\" badge to the GINI Score metric visualization, instantly indicating that the 0.75 value meets acceptable performance standards by being above the `medium_risk` threshold of 0.6:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "log_metric(\n",
-    "    key=\"GINI Score\",\n",
-    "    value=0.75,\n",
-    "    recorded_at=datetime(2025, 6, 7),\n",
-    "    thresholds = {\n",
-    "        \"high_risk\": 0.5,\n",
-    "        \"medium_risk\": 0.6,\n",
-    "        \"low_risk\": 0.8,\n",
-    "    },\n",
-    "    passed=True\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "![GINI Score](./log_metric_satisfactory.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "In this example, the `passed=False` parameter adds a yellow \"Requires Attention\" badge to the GINI Score metric visualization, immediately highlighting that the value of 0.5 fails to meet acceptable performance standards by not exceeding the `medium_risk` threshold of 0.6:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "log_metric(\n",
-    "    key=\"GINI Score\",\n",
-    "    value=0.5,\n",
-    "    recorded_at=datetime(2025, 6, 9),\n",
-    "    thresholds = {\n",
-    "        \"high_risk\": 0.5,\n",
-    "        \"medium_risk\": 0.6,\n",
-    "        \"low_risk\": 0.8,\n",
-    "    },\n",
-    "    passed=False\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "![GINI Score](./log_metric_attention.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Here, a custom function `passed_fn` determines the badge status automatically, displaying a green \"Satisfactory\" badge for the 0.65 GINI Score because it exceeds the `medium_risk` threshold of 0.6, enabling programmatic evaluation of metric performance based on predefined business rules:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "gini = 0.65\n",
-    "\n",
-    "thresholds = {\n",
-    "    \"high_risk\": 0.5,\n",
-    "    \"medium_risk\": 0.6,\n",
-    "    \"low_risk\": 0.8,\n",
-    "}\n",
-    "\n",
-    "def passed_fn(value):\n",
-    "    return value > thresholds[\"medium_risk\"]\n",
-    "\n",
-    "log_metric(\n",
-    "    key=\"GINI Score\",\n",
-    "    value=gini, \n",
-    "    recorded_at=datetime(2025, 6, 10),\n",
-    "    thresholds=thresholds,\n",
-    "    passed=passed_fn(gini)\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "![GINI Score](./log_metric_satisfactory_2.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-584966fafc334aec9585d8f880ddba0c",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Log metrics over time\n",
+        "\n",
+        "Learn how to track and visualize the temporal evolution of key record (model) performance metrics with ValidMind.\n",
+        "\n",
+        "While this notebook uses a traditional binary classification model to demonstrate, the same principles apply to logging performance metrics over time for any record (model) type registered with ValidMind — including agentic AI systems, generative LLM applications, and beyond. For example:\n",
+        "\n",
+        "- Key model performance metrics such as AUC, F1 score, precision, recall, and accuracy are useful for analyzing the stability and trends in model performance indicators, helping to identify potential degradation or unexpected fluctuations in model behavior over time.\n",
+        "- By monitoring these metrics systematically, teams can detect early warning signs of model drift and take proactive measures to maintain model reliability.\n",
+        "- Unit metrics in ValidMind provide a standardized way to compute and track individual performance measures, making it easy to monitor specific aspects of model behavior.\n",
+        "\n",
+        "Log metrics over time with the ValidMind Library's [`log_metric()`](https://docs.validmind.ai/validmind/validmind.html#log_metric) function and visualize them in your documentation using the *Metric Over Time* block within the ValidMind Platform. This integration enables seamless tracking of record performance, supporting custom thresholds and facilitating the automation of alerts based on logged metrics.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Metrics over time are most commonly associated with the continued monitoring of a record's performance once it is deployed.</b></span>\n",
+        "<br></br>\n",
+        "While you are able to add Metric Over Time blocks to documentation, we recommend first <a href=\"https://docs.validmind.ai/guide/monitoring/enable-monitoring.html\" style=\"color: #DE257E;\"><b>enabling ongoing monitoring</b></a> for your record to maximize the potential of your performance data.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_3__)    \n",
+        "- [Load demo model](#toc3__)    \n",
+        "- [Logging metrics](#toc4__)    \n",
+        "  - [Run unit metrics](#toc4_1__)    \n",
+        "  - [Log unit metrics over time](#toc4_2__)    \n",
+        "  - [Pass thresholds](#toc4_3__)    \n",
+        "  - [Log multiple metrics with custom thresholds](#toc4_4__)    \n",
+        "  - [Add acceptable performance flag](#toc4_5__)    \n",
+        "- [Next steps](#toc5__)    \n",
+        "  - [Work with your model documentation](#toc5_1__)    \n",
+        "  - [Discover more learning resources](#toc5_2__)    \n",
+        "- [Upgrade ValidMind](#toc6__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import xgboost as xgb\n",
+        "import numpy as np\n",
+        "\n",
+        "from datetime import datetime, timedelta\n",
+        "\n",
+        "from validmind.unit_metrics import list_metrics, describe_metric, run_metric\n",
+        "from validmind.api_client import log_metric\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": 3,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load demo model\n",
+        "\n",
+        "We'll use a classification model trained on customer churn data to demonstrate ValidMind's metric logging capabilities.\n",
+        "\n",
+        "- We'll employ a built-in classification dataset, process it through train-validation-test splits, and train an XGBoost classifier.\n",
+        "- The trained model and datasets are then initialized in ValidMind's framework, enabling us to track and monitor various performance metrics in the following sections."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Import the sample dataset from the library\n",
+        "\n",
+        "from validmind.datasets.classification import customer_churn\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{customer_churn.target_column}' \\n\\t• Class labels: {customer_churn.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = customer_churn.load_data()\n",
+        "raw_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)\n",
+        "\n",
+        "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_train = train_df[customer_churn.target_column]\n",
+        "x_val = validation_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_val = validation_df[customer_churn.target_column]\n",
+        "\n",
+        "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
+        "model.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "model.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        "    eval_set=[(x_val, y_val)],\n",
+        "    verbose=False,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Once the datasets and model are prepared for validation, let's initialize the ValidMind `dataset` and `model`, specifying feature and target columns.\n",
+        "\n",
+        "- The property `input_id` allows users to uniquely identify each dataset and model.\n",
+        "- This allows for the creation of multiple versions of datasets and models, enabling us to compute metrics by specifying which versions we want to use as inputs."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=raw_df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        "    class_labels=customer_churn.class_labels,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df, input_id=\"test_dataset\", target_column=customer_churn.target_column\n",
+        ")\n",
+        "\n",
+        "# Initialize the ValidMind model object wrapper so that it can be passed as input to tests or test suites\n",
+        "# ValidMind model objects can be any type of record you want to test, document, validate, or monitor\n",
+        "vm_model = vm.init_model(\n",
+        "    model,\n",
+        "    input_id=\"model\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We can now use the `assign_predictions()` method from the Dataset object to link existing predictions to any model. \n",
+        "\n",
+        "If no prediction values are passed, the method will compute predictions automatically:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Logging metrics\n",
+        "\n",
+        "Next, we'll use ValidMind to track the temporal evolution of key model performance metrics.\n",
+        "\n",
+        "We'll set appropriate thresholds for each metric, enable automated alerting when performance drifts beyond acceptable boundaries, and demonstrate how these thresholds can be customized based on business requirements and risk tolerance levels."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "metrics = [metric for metric in list_metrics() if \"classification\" in metric]\n",
+        "\n",
+        "for metric_id in metrics:\n",
+        "    describe_metric(metric_id)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Run unit metrics\n",
+        "\n",
+        "Compute individual metrics using ValidMind's *unit metrics* — single-value metrics that can be computed on a dataset and model. Use the `run_metric()` function from the `validmind.unit_metrics` module to calculate these metrics.\n",
+        "\n",
+        "The `run_metric()` function has a signature similar to `run_test()` from the `validmind.tests` module, but is specifically designed for unit metrics and takes the following arguments:\n",
+        "\n",
+        "- **`metric_id`:** The unique identifier for the metric (for example, `validmind.unit_metrics.classification.ROC_AUC`)\n",
+        "- **`inputs`:** A dictionary containing the input dataset and model or their respective input IDs\n",
+        "- **`params`:** A dictionary containing keyword arguments for the unit metric (optional, accepts any `kwargs` from the underlying sklearn implementation)\n",
+        "\n",
+        "`run_metric()` returns and displays a result object similar to a regular ValidMind test, but only shows the unit metric value. While this result object has a `.log()` method for logging to the ValidMind Platform, in this use case we'll use unit metrics to compute performance metrics and then log them over time using the `log_metric()` function from the `validmind.api_client` module."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_metric(\n",
+        "    \"validmind.unit_metrics.classification.ROC_AUC\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_model,\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "    },\n",
+        ")\n",
+        "auc = result.metric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_metric(\n",
+        "    \"validmind.unit_metrics.classification.Accuracy\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_model,\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "    },\n",
+        ")\n",
+        "accuracy = result.metric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_metric(\n",
+        "    \"validmind.unit_metrics.classification.Recall\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_model,\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "    },\n",
+        ")\n",
+        "recall = result.metric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_metric(\n",
+        "    \"validmind.unit_metrics.classification.F1\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_model,\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "    },\n",
+        ")\n",
+        "f1 = result.metric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_metric(\n",
+        "    \"validmind.unit_metrics.classification.Precision\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_model,\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "    },\n",
+        ")\n",
+        "precision = result.metric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Log unit metrics over time\n",
+        "\n",
+        "Using the `log_metric()` function from the `validmind.api_client` module, let's log the unit metrics over time. This function takes the following arguments:\n",
+        "\n",
+        "- **`key`:** The name of the metric to log\n",
+        "- **`value`:** The value of the metric to log\n",
+        "- **`recorded_at`:** The timestamp of the metric to log — useful for logging historic predictions\n",
+        "- **`thresholds`:** A dictionary containing the thresholds for the metric to log\n",
+        "- **`params`:** A dictionary containing the keyword arguments for the unit metric (in this case, none are required, but we can pass any `kwargs` that the underlying sklearn implementation accepts)"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "log_metric(\n",
+        "    key=\"AUC Score\",\n",
+        "    value=auc,\n",
+        "    # If `recorded_at` is not included, the time at function run is logged\n",
+        "    recorded_at=datetime(2024, 1, 1), \n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "To visualize the logged metric, we'll use the **[Metrics Over Time block](https://docs.validmind.ai/guide/monitoring/work-with-metrics-over-time.html)** in the ValidMind Platform:\n",
+        "\n",
+        "- After adding this visualization block to your documentation or ongoing monitoring report (as shown in the image below), you'll be able to review your logged metrics plotted over time.\n",
+        "- In this example, since we've only logged a single data point, the visualization shows just one measurement.\n",
+        "- As you continue logging metrics, the graph will populate with more points, enabling you to track trends and patterns.\n",
+        "\n",
+        "![Metric Over Time block](./add_metric_over_time_block.png)\n",
+        "![AUC Score](./log_metric_auc_1.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Pass thresholds\n",
+        "\n",
+        "We can pass *thresholds* to the `log_metric()` function to enhance the metric-over-time visualization: \n",
+        "\n",
+        "- This is useful for visualizing the metric over time and identifying potential issues. \n",
+        "- The metric visualization component provides a dynamic way to monitor and contextualize metric values through customizable thresholds. \n",
+        "- These thresholds appear as horizontal reference lines on the chart. \n",
+        "- The system always displays the most recent threshold configuration, meaning that if you update threshold values in your client application, the visualization will reflect these changes immediately. \n",
+        "\n",
+        "When a metric is logged without thresholds or with an empty threshold dictionary, the reference lines gracefully disappear from the chart, though the metric line itself remains visible. \n",
+        "\n",
+        "Thresholds are highly flexible in their implementation. You can define them with any meaningful key names (such as `low_risk`, `maximum`, `target`, or `acceptable_range`) in your metric data, and the visualization will adapt accordingly. "
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "log_metric(\n",
+        "    key=\"AUC Score\",\n",
+        "    value=auc,\n",
+        "    recorded_at=datetime(2024, 1, 1),\n",
+        "    thresholds={\n",
+        "        \"min_auc\": 0.7,\n",
+        "    }\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "![AUC Score](./log_metric_auc_2.png)"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "log_metric(\n",
+        "    key=\"AUC Score\",\n",
+        "    value=auc,\n",
+        "    recorded_at=datetime(2024, 1, 1),\n",
+        "    thresholds={\n",
+        "        \"high_risk\": 0.6,\n",
+        "        \"medium_risk\": 0.7,\n",
+        "        \"low_risk\": 0.8,\n",
+        "    }\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "![AUC Score](./log_metric_auc_3.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4__'></a>\n",
+        "\n",
+        "### Log multiple metrics with custom thresholds\n",
+        "\n",
+        "The following code snippet shows an example of how to set up and log multiple performance metrics with custom thresholds for each metric:\n",
+        "\n",
+        "- Using AUC, F1, Precision, Recall, and Accuracy scores as examples, it demonstrates how to define different risk levels (high, medium, low) appropriate for each metric's expected range.\n",
+        "- The code simulates 10 days of metric history by applying a gradual decay and random noise to help visualize how metrics might drift over time in a production environment."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "NUM_DAYS = 10\n",
+        "REFERENCE_DATE = datetime(2024, 1, 1)  # Fixed date: January 1st, 2024\n",
+        "base_date = REFERENCE_DATE - timedelta(days=NUM_DAYS)\n",
+        "\n",
+        "# Initial values with their specific thresholds\n",
+        "performance_metrics = {\n",
+        "    \"AUC Score\": {\n",
+        "        \"value\": auc,\n",
+        "        \"thresholds\": {\n",
+        "            \"high_risk\": 0.7,\n",
+        "            \"medium_risk\": 0.8,\n",
+        "            \"low_risk\": 0.9,\n",
+        "        }\n",
+        "    },\n",
+        "    \"F1 Score\": {\n",
+        "        \"value\": f1,\n",
+        "        \"thresholds\": {\n",
+        "            \"high_risk\": 0.5,\n",
+        "            \"medium_risk\": 0.6,\n",
+        "            \"low_risk\": 0.7,\n",
+        "        }\n",
+        "    },\n",
+        "    \"Precision Score\": {\n",
+        "        \"value\": precision,\n",
+        "        \"thresholds\": {\n",
+        "            \"high_risk\": 0.6,\n",
+        "            \"medium_risk\": 0.7,\n",
+        "            \"low_risk\": 0.8,\n",
+        "        }\n",
+        "    },\n",
+        "    \"Recall Score\": {\n",
+        "        \"value\": recall,\n",
+        "        \"thresholds\": {\n",
+        "            \"high_risk\": 0.4,\n",
+        "            \"medium_risk\": 0.5,\n",
+        "            \"low_risk\": 0.6,\n",
+        "        }\n",
+        "    },\n",
+        "    \"Accuracy Score\": {\n",
+        "        \"value\": accuracy,\n",
+        "        \"thresholds\": {\n",
+        "            \"high_risk\": 0.75,\n",
+        "            \"medium_risk\": 0.8,\n",
+        "            \"low_risk\": 0.85,\n",
+        "        }\n",
+        "    }\n",
+        "}\n",
+        "\n",
+        "# Trend parameters\n",
+        "trend_factor = 0.98  # Slight downward trend\n",
+        "noise_scale = 0.02   # Std. dev. of the random noise, as a fraction (2%) of the base value\n",
+        "\n",
+        "for i in range(NUM_DAYS):\n",
+        "    recorded_at = base_date + timedelta(days=i)\n",
+        "    print(f\"\\nrecorded_at: {recorded_at}\")\n",
+        "\n",
+        "    # Log each metric with trend and noise\n",
+        "    for metric_name, metric_info in performance_metrics.items():\n",
+        "        base_value = metric_info[\"value\"]\n",
+        "        thresholds = metric_info[\"thresholds\"]\n",
+        "        \n",
+        "        # Apply trend and add random noise\n",
+        "        trend = base_value * (trend_factor ** i)\n",
+        "        noise = np.random.normal(0, noise_scale * base_value)\n",
+        "        value = max(0, min(1, trend + noise))  # Ensure value stays between 0 and 1\n",
+        "        \n",
+        "        log_metric(\n",
+        "            key=metric_name,\n",
+        "            value=value,\n",
+        "            recorded_at=recorded_at.isoformat(),\n",
+        "            thresholds=thresholds\n",
+        "        )\n",
+        "        \n",
+        "        print(f\"{metric_name:<15}: {value:.4f} (Thresholds: {thresholds})\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "![AUC Score](./log_metric_auc_4.png)\n",
+        "![Accuracy Score](./log_metric_accuracy.png)\n",
+        "![Precision Score](./log_metric_precision.png)\n",
+        "![Recall Score](./log_metric_recall.png)\n",
+        "![F1 Score](./log_metric_f1.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_5__'></a>\n",
+        "\n",
+        "### Add acceptable performance flag\n",
+        "\n",
+        "The `passed` parameter in the `log_metric()` function allows you to explicitly mark whether a specific metric value should be considered \"Satisfactory\" or \"Requires Attention\":\n",
+        "   - When `passed=True`: A green \"Satisfactory\" badge appears on the chart, indicating the metric value meets your acceptance criteria.\n",
+        "   - When `passed=False`: A yellow \"Requires Attention\" badge appears, highlighting potential concerns that may require investigation."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "In the example below, the `passed=True` parameter adds a green \"Satisfactory\" badge to the GINI Score metric visualization, instantly indicating that the 0.75 value meets acceptable performance standards by being above the `medium_risk` threshold of 0.6:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "log_metric(\n",
+        "    key=\"GINI Score\",\n",
+        "    value=0.75,\n",
+        "    recorded_at=datetime(2025, 6, 7),\n",
+        "    thresholds = {\n",
+        "        \"high_risk\": 0.5,\n",
+        "        \"medium_risk\": 0.6,\n",
+        "        \"low_risk\": 0.8,\n",
+        "    },\n",
+        "    passed=True\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "![GINI Score](./log_metric_satisfactory.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "In this example, the `passed=False` parameter adds a yellow \"Requires Attention\" badge to the GINI Score metric visualization, immediately highlighting that the value of 0.5 fails to meet acceptable performance standards by not exceeding the `medium_risk` threshold of 0.6:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "log_metric(\n",
+        "    key=\"GINI Score\",\n",
+        "    value=0.5,\n",
+        "    recorded_at=datetime(2025, 6, 9),\n",
+        "    thresholds = {\n",
+        "        \"high_risk\": 0.5,\n",
+        "        \"medium_risk\": 0.6,\n",
+        "        \"low_risk\": 0.8,\n",
+        "    },\n",
+        "    passed=False\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "![GINI Score](./log_metric_attention.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Here, a custom function `passed_fn` determines the badge status automatically, displaying a green \"Satisfactory\" badge for the 0.65 GINI Score because it exceeds the `medium_risk` threshold of 0.6, enabling programmatic evaluation of metric performance based on predefined business rules:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "gini = 0.65\n",
+        "\n",
+        "thresholds = {\n",
+        "    \"high_risk\": 0.5,\n",
+        "    \"medium_risk\": 0.6,\n",
+        "    \"low_risk\": 0.8,\n",
+        "}\n",
+        "\n",
+        "def passed_fn(value):\n",
+        "    return value > thresholds[\"medium_risk\"]\n",
+        "\n",
+        "log_metric(\n",
+        "    key=\"GINI Score\",\n",
+        "    value=gini, \n",
+        "    recorded_at=datetime(2025, 6, 10),\n",
+        "    thresholds=thresholds,\n",
+        "    passed=passed_fn(gini)\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "![GINI Score](./log_metric_satisfactory_2.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your documentation.\n",
+        "\n",
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-584966fafc334aec9585d8f880ddba0c"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/how_to/metrics/run_unit_metrics.ipynb b/site/notebooks/how_to/metrics/run_unit_metrics.ipynb
index 1b8dc8ce69..bc562eba99 100644
--- a/site/notebooks/how_to/metrics/run_unit_metrics.ipynb
+++ b/site/notebooks/how_to/metrics/run_unit_metrics.ipynb
@@ -89,9 +89,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
     "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "<a id='toc1_1__'></a>\n",
     "\n",
@@ -105,11 +105,11 @@
     "\n",
     "### New to ValidMind?\n",
     "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
+    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
    ]
   },
   {
@@ -158,17 +158,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+    "\n",
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -179,10 +181,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development-type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `Binary classification`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -196,11 +200,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -690,27 +696,27 @@
     "\n",
     "## Next steps\n",
     "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your documentation.\n",
     "\n",
     "<a id='toc10_1__'></a>\n",
     "\n",
-    "### Work with your model documentation\n",
+    "### Work with your documentation\n",
     "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
+    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
     "\n",
     "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
     "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
+    "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
     "\n",
     "<a id='toc10_2__'></a>\n",
     "\n",
     "### Discover more learning resources\n",
     "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
+    "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
     "\n",
     "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
     "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
+    "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
     "\n",
     "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
    ]
diff --git a/site/notebooks/how_to/qualitative_text/qualitative_text_generation.ipynb b/site/notebooks/how_to/qualitative_text/qualitative_text_generation.ipynb
index d85879f94a..f2c72ce7b3 100644
--- a/site/notebooks/how_to/qualitative_text/qualitative_text_generation.ipynb
+++ b/site/notebooks/how_to/qualitative_text/qualitative_text_generation.ipynb
@@ -71,9 +71,9 @@
         "\n",
         "## About ValidMind\n",
         "\n",
-        "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models. \n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models. \n",
         "\n",
-        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators."
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators."
       ]
     },
     {
@@ -99,11 +99,11 @@
         "\n",
         "### New to ValidMind?\n",
         "\n",
-        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
         "\n",
         "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
         "<br></br>\n",
-        "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
       ]
     },
     {
@@ -115,26 +115,34 @@
         "\n",
         "### Key concepts\n",
         "\n",
-        "**Validation report**: A comprehensive and structured assessment of a model’s development and performance, focusing on verifying its integrity, appropriateness, and alignment with its intended use. It includes analyses of model assumptions, data quality, performance metrics, outcomes of testing procedures, and risk considerations. The validation report supports transparency, regulatory compliance, and informed decision-making by documenting the validator’s independent review and conclusions.\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
         "\n",
-        "**Validation report template**: Serves as a standardized framework for conducting and documenting model validation activities. It outlines the required sections, recommended analyses, and expected validation tests, ensuring consistency and completeness across validation reports. The template helps guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
         "\n",
-        "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets.\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
         "\n",
-        "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
         "\n",
-        "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
         "\n",
-        "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
         "\n",
-        "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-        "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-        "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
         "\n",
-        "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
+        "**metric**: A test that does not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
         "\n",
-        "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+        "**custom test**: A function that you define to evaluate your record or dataset. Custom tests can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
       ]
     },
     {
@@ -192,17 +200,19 @@
         "\n",
         "#### Register sample model\n",
         "\n",
-        "Let's first register a sample model for use with this notebook:\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
         "\n",
-        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+        "2. In the left sidebar, select **Inventory**.\n",
         "\n",
-        "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
         "\n",
-        "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
         "\n",
-        "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
         "\n",
-        "5. Click **Register Model** to add the model to your inventory."
+        "6. Click **Register Model** to add the model to your inventory."
       ]
     },
     {
@@ -214,10 +224,12 @@
         "\n",
         "#### Apply documentation template\n",
         "\n",
-        "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
         "\n",
         "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
         "\n",
+        "    If you cannot locate your Development document, make sure Development-type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
         "2. Under **TEMPLATE**, select `Binary classification`.\n",
         "\n",
         "3. Click **Use Template** to apply the template."
@@ -232,11 +244,13 @@
         "\n",
         "#### Get your code snippet\n",
         "\n",
-        "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
         "\n",
         "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
         "2. Click **Copy snippet to clipboard**.\n",
-        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
       ]
     },
     {
@@ -336,7 +350,7 @@
         "\n",
         "Next, let's head to the ValidMind Platform to see the template in action:\n",
         "\n",
-        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
         "\n",
         "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this notebook.\n",
         "\n",
@@ -494,7 +508,12 @@
       "id": "1ebfda19",
       "metadata": {},
       "source": [
-        "Next, we initialize a ValidMind model object with `vm.init_model()`. This creates a standardized representation of the trained model that can be passed into ValidMind tests and other library functions, making it possible to evaluate the model and connect its results to the documentation."
+        "You'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for our model.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
       ]
     },
     {
@@ -824,7 +843,7 @@
         "\n",
         "## Next steps\n",
         "\n",
-        "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation."
+        "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your documentation."
       ]
     },
     {
@@ -834,13 +853,13 @@
       "source": [
         "<a id='toc9_1__'></a>\n",
         "\n",
-        "### Work with your model documentation\n",
+        "### Work with your documentation\n",
         "\n",
-        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
         "\n",
         "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
         "\n",
-        "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)"
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))"
       ]
     },
     {
@@ -854,14 +873,14 @@
         "\n",
         "For a more in-depth introduction to using the ValidMind Library for development, check out our introductory development series and the accompanying interactive training:\n",
         "\n",
-        "- **[ValidMind for model development](https://docs.validmind.ai/developer/validmind-library.html#for-model-development)**\n",
+        "- **[ValidMind for development](https://docs.validmind.ai/developer/validmind-library.html#development)**\n",
         "- **[Developer Fundamentals](https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html)**\n",
         "\n",
-        "We also offer many interactive notebooks to help you document models:\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
         "\n",
         "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
         "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-        "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
         "\n",
         "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
       ]
diff --git a/site/notebooks/how_to/scoring/assign_scores_complete_tutorial.ipynb b/site/notebooks/how_to/scoring/assign_scores_complete_tutorial.ipynb
index 586817850d..599024f471 100644
--- a/site/notebooks/how_to/scoring/assign_scores_complete_tutorial.ipynb
+++ b/site/notebooks/how_to/scoring/assign_scores_complete_tutorial.ipynb
@@ -91,9 +91,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
     "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "<a id='toc1_1__'></a>\n",
     "\n",
@@ -107,11 +107,11 @@
     "\n",
     "### New to ValidMind?\n",
     "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
+    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
    ]
   },
   {
@@ -160,17 +160,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+    "\n",
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -181,10 +183,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `Binary classification`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -198,11 +202,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -713,13 +719,13 @@
     "\n",
     "<a id='toc8_1__'></a>\n",
     "\n",
-    "### Work with your model documentation\n",
+    "### Work with your documentation\n",
     "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
+    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
     "\n",
     "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
     "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
+    "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
     "\n",
     "<a id='toc8_2__'></a>\n",
     "\n",
diff --git a/site/notebooks/how_to/tests/custom_tests/implement_custom_tests.ipynb b/site/notebooks/how_to/tests/custom_tests/implement_custom_tests.ipynb
index 8e4be82ac0..38ad4a3086 100644
--- a/site/notebooks/how_to/tests/custom_tests/implement_custom_tests.ipynb
+++ b/site/notebooks/how_to/tests/custom_tests/implement_custom_tests.ipynb
@@ -1,1096 +1,1113 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Implement custom tests\n",
-    "\n",
-    "Custom tests extend the functionality of ValidMind, allowing you to document any model or use case with added flexibility.\n",
-    "\n",
-    "ValidMind provides a comprehensive set of tests out-of-the-box to evaluate and document your models and datasets. We recognize there will be cases where the default tests do not support a model or dataset, or specific documentation is needed. In these cases, you can create and use your own custom code to accomplish what you need. To streamline custom code integration, we support the creation of custom test functions.\n",
-    "\n",
-    "This interactive notebook provides a step-by-step guide for implementing and registering custom tests with ValidMind, running them individually, viewing the results on the ValidMind Platform, and incorporating them into your model documentation template."
-   ]
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Implement custom tests\n",
+        "\n",
+        "Custom tests extend the functionality of ValidMind, allowing you to document any model or use case with added flexibility.\n",
+        "\n",
+        "ValidMind provides a comprehensive set of tests out-of-the-box to evaluate and document your models and datasets. We recognize there will be cases where the default tests do not support a model or dataset, or specific documentation is needed. In these cases, you can create and use your own custom code to accomplish what you need. To streamline custom code integration, we support the creation of custom test functions.\n",
+        "\n",
+        "This interactive notebook provides a step-by-step guide for implementing and registering custom tests with ValidMind, running them individually, viewing the results on the ValidMind Platform, and incorporating them into your model documentation template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "- [Implement a Custom Test](#toc3__)    \n",
+        "- [Run the Custom Test](#toc4__)    \n",
+        "  - [Setup the Model and Dataset](#toc4_1__)    \n",
+        "  - [Run the Custom Test](#toc4_2__)    \n",
+        "- [Adding Custom Test to Model Documentation](#toc5__)    \n",
+        "- [Some More Custom Tests](#toc6__)    \n",
+        "  - [Custom Test: Table of Model Hyperparameters](#toc6_1__)    \n",
+        "  - [Custom Test: External API Call](#toc6_2__)    \n",
+        "  - [Custom Test: Passing Parameters](#toc6_3__)    \n",
+        "  - [Custom Test: Multiple Tables and Plots in a Single Test](#toc6_4__)    \n",
+        "  - [Custom Test: Images](#toc6_5__)    \n",
+        "  - [Custom Test: Description](#toc6_6__)    \n",
+        "- [Conclusion](#toc7__)    \n",
+        "- [Next steps](#toc8__)    \n",
+        "  - [Work with your model documentation](#toc8_1__)    \n",
+        "  - [Discover more learning resources](#toc8_2__)    \n",
+        "- [Upgrade ValidMind](#toc9__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Implement a Custom Test\n",
+        "\n",
+        "Let's start off by creating a simple custom test that creates a Confusion Matrix for a binary classification model. We will use the `sklearn.metrics.confusion_matrix` function to calculate the confusion matrix and then display it as a heatmap using `matplotlib`. (This is already a built-in test in ValidMind, but we will use it as an example to demonstrate how to create custom tests.)"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import matplotlib.pyplot as plt\n",
+        "from sklearn import metrics\n",
+        "\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
+        "def confusion_matrix(dataset, model):\n",
+        "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
+        "\n",
+        "    The confusion matrix is a 2x2 table that contains 4 values:\n",
+        "\n",
+        "    - True Positive (TP): the number of correct positive predictions\n",
+        "    - True Negative (TN): the number of correct negative predictions\n",
+        "    - False Positive (FP): the number of incorrect positive predictions\n",
+        "    - False Negative (FN): the number of incorrect negative predictions\n",
+        "\n",
+        "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
+        "    \"\"\"\n",
+        "    y_true = dataset.y\n",
+        "    y_pred = dataset.y_pred(model)\n",
+        "\n",
+        "    confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
+        "\n",
+        "    cm_display = metrics.ConfusionMatrixDisplay(\n",
+        "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
+        "    )\n",
+        "    cm_display.plot()\n",
+        "\n",
+        "    plt.close()  # close the plot to avoid displaying it\n",
+        "\n",
+        "    return cm_display.figure_  # return the figure object itself"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "That's our custom test defined and ready to go... Let's take a look at what's going on here:\n",
+        "\n",
+        "- The function `confusion_matrix` takes two arguments `dataset` and `model`. This is a VMDataset and VMModel object respectively.\n",
+        "- The function docstring provides a description of what the test does. This will be displayed along with the result in this notebook as well as in the ValidMind Platform.\n",
+        "- The function body calculates the confusion matrix using the `sklearn.metrics.confusion_matrix` function and then plots it using `sklearn.metrics.ConfusionMatrixDisplay`.\n",
+        "- The function then returns the `ConfusionMatrixDisplay.figure_` object - this is important as the ValidMind Library expects the output of the custom test to be a plot or a table.\n",
+        "- The `@vm.test` decorator is doing the work of creating a wrapper around the function that will allow it to be run by the ValidMind Library. It also registers the test so it can be found by the ID `my_custom_tests.ConfusionMatrix` (see the section below on how test IDs work in ValidMind and why this format is important)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Run the Custom Test\n",
+        "\n",
+        "Now that we have defined and registered our custom test, let's see how we can run it and properly use it in the ValidMind Platform."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Setup the Model and Dataset\n",
+        "\n",
+        "First let's set up an example model and dataset to run our custom metric against. Since this is a Confusion Matrix, we will use the Customer Churn dataset that ValidMind provides and train a simple XGBoost model."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import xgboost as xgb\n",
+        "from validmind.datasets.classification import customer_churn\n",
+        "\n",
+        "raw_df = customer_churn.load_data()\n",
+        "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)\n",
+        "\n",
+        "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_train = train_df[customer_churn.target_column]\n",
+        "x_val = validation_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_val = validation_df[customer_churn.target_column]\n",
+        "\n",
+        "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
+        "model.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "model.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        "    eval_set=[(x_val, y_val)],\n",
+        "    verbose=False,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Easy enough! Now we have a model and dataset set up and trained. One last thing to do is bring the dataset and model into the ValidMind Library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# for now, we'll just use the test dataset\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    target_column=customer_churn.target_column,\n",
+        "    input_id=\"test_dataset\",\n",
+        ")\n",
+        "\n",
+        "vm_model = vm.init_model(model, input_id=\"model\")\n",
+        "\n",
+        "# link the model to the dataset\n",
+        "vm_test_ds.assign_predictions(model=vm_model)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Run the Custom Test\n",
+        "\n",
+        "Now that we have our model and dataset setup, we have everything we need to run our custom test. We can do this by importing the `run_test` function from the `validmind.tests` module and passing in the test ID of our custom test along with the model and dataset we want to run it against.\n",
+        "\n",
+        ">Notice how the `inputs` dictionary is used to map an `input_id` which we set above to the `model` and `dataset` keys that are expected by our custom test function. This is how the ValidMind Library knows which inputs to pass to different tests and is key when using many different datasets and models."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.tests import run_test\n",
+        "\n",
+        "result = run_test(\n",
+        "    \"my_custom_tests.ConfusionMatrix\",\n",
+        "    inputs={\"model\": \"model\", \"dataset\": \"test_dataset\"},\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You'll notice that the docstring becomes a markdown description of the test. The figure is then displayed as the test result. What you see above is how it will look in the ValidMind Platform as well. Let's go ahead and log the result to see how that works."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Adding Custom Test to Model Documentation\n",
+        "\n",
+        "To do this, go to the documentation page of the model you registered above and navigate to the `Model Development` -> `Model Evaluation` section. Then hover between any existing content block to reveal the `+` button as shown in the screenshot below.\n",
+        "\n",
+        "![screenshot showing insert button for test-driven blocks](./insert-test-driven-block.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now click on the `+` button and select the `Test-Driven Block` option. This will open a dialog where you can select `My Custom Tests Confusion Matrix` from the list of available tests. You can preview the result and then click `Insert Block` to add it to the documentation.\n",
+        "\n",
+        "![screenshot showing how to insert a test-driven block](./insert-test-driven-block-custom.png)\n",
+        "\n",
+        "The test should match the result you see above. It is now part of your documentation and will be run every time you run `vm.run_documentation_tests()` for your model. Let's do that now."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.reload()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If you preview the template, it should show the custom test in the `Model Development`->`Model Evaluation` section:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Just so we can run all of the tests in the template, let's initialize the train and raw dataset.\n",
+        "\n",
+        "(Refer to [**Quickstart for documentation**](../../../quickstart/quickstart_documentation.ipynb) and the ValidMind docs for more information on what we are doing here)"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=raw_df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        "    class_labels=customer_churn.class_labels,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        ")\n",
+        "vm_train_ds.assign_predictions(model=vm_model)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "To run all the tests in the template, you can use the `vm.run_documentation_tests()` and pass the inputs we initialized above and the demo config from our customer_churn module. We will have to add a section to the config for our new test to tell it which inputs it should receive. This is done by simply adding a new element in the config dictionary where the key is the ID of the test and the value is a dictionary with the following structure:\n",
+        "```python\n",
+        "{\n",
+        "    \"inputs\": {\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "        \"model\": \"model\",\n",
+        "    }\n",
+        "}\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.utils import preview_test_config\n",
+        "\n",
+        "test_config = customer_churn.get_demo_test_config()\n",
+        "test_config[\"my_custom_tests.ConfusionMatrix\"] = {\n",
+        "    \"inputs\": {\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "        \"model\": \"model\",\n",
+        "    }\n",
+        "}\n",
+        "preview_test_config(test_config)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "full_suite = vm.run_documentation_tests(config=test_config)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Some More Custom Tests\n",
+        "\n",
+        "Now that you understand the entire process of creating custom tests and using them in your documentation, let's create a few more to see different ways you can utilize custom tests."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Custom Test: Table of Model Hyperparameters\n",
+        "\n",
+        "This custom test will display a table of the hyperparameters used in the model:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.Hyperparameters\")\n",
+        "def hyperparameters(model):\n",
+        "    \"\"\"The hyperparameters of a machine learning model are the settings that control the learning process.\n",
+        "    These settings are specified before the learning process begins and can have a significant impact on the\n",
+        "    performance of the model.\n",
+        "\n",
+        "    The hyperparameters of a model can be used to tune the model to achieve the best possible performance\n",
+        "    on a given dataset. By examining the hyperparameters of a model, you can gain insight into how the model\n",
+        "    was trained and how it might be improved.\n",
+        "    \"\"\"\n",
+        "    hyperparameters = model.model.get_xgb_params()  # dictionary of hyperparameters\n",
+        "\n",
+        "    # turn the dictionary into a table where each row contains a hyperparameter and its value\n",
+        "    return [{\"Hyperparam\": k, \"Value\": v} for k, v in hyperparameters.items() if v]\n",
+        "\n",
+        "\n",
+        "result = run_test(\"my_custom_tests.Hyperparameters\", inputs={\"model\": \"model\"})\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Since the test has been run and logged, you can add it to your documentation using the same process as above. It should look like this:\n",
+        "\n",
+        "![screenshot showing hyperparameters test](./hyperparameters-custom-metric.png)\n",
+        "\n",
+        "For our simple toy model, there aren't really any proper hyperparameters but you can see how this could be useful for more complex models that have gone through hyperparameter tuning."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Custom Test: External API Call\n",
+        "\n",
+        "This custom test will make an external API call to get a list of fake users and display them as a set of tables. This demonstrates how you might integrate external data sources into your model documentation in a programmatic way. You could, for instance, set up a pipeline that runs a test like this every day to keep your model documentation in sync with an external system."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import requests\n",
+        "import random\n",
+        "\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.ExternalAPI\")\n",
+        "def external_api():\n",
+        "    \"\"\"This test calls an external API to get a list of fake users. It then creates\n",
+        "    a table with the relevant data so it can be displayed in the documentation.\n",
+        "\n",
+        "    The purpose of this test is to demonstrate how to call an external API and use the\n",
+        "    data in a test. A test like this could even be setup to run in a scheduled\n",
+        "    pipeline to keep your documentation in-sync with an external data source.\n",
+        "    \"\"\"\n",
+        "    url = \"https://jsonplaceholder.typicode.com/users\"\n",
+        "    response = requests.get(url)\n",
+        "    data = response.json()\n",
+        "\n",
+        "    # group the returned users into one table per role (owners/stakeholders, developers, validators)\n",
+        "    return {\n",
+        "        \"Model Owners/Stakeholders\": [\n",
+        "            {\n",
+        "                \"Name\": user[\"name\"],\n",
+        "                \"Role\": random.choice([\"Owner\", \"Stakeholder\"]),\n",
+        "                \"Email\": user[\"email\"],\n",
+        "                \"Phone\": user[\"phone\"],\n",
+        "                \"Slack Handle\": f\"@{user['name'].lower().replace(' ', '.')}\",\n",
+        "            }\n",
+        "            for user in data[:3]\n",
+        "        ],\n",
+        "        \"Model Developers\": [\n",
+        "            {\n",
+        "                \"Name\": user[\"name\"],\n",
+        "                \"Role\": \"Developer\",\n",
+        "                \"Email\": user[\"email\"],\n",
+        "            }\n",
+        "            for user in data[3:7]\n",
+        "        ],\n",
+        "        \"Model Validators\": [\n",
+        "            {\n",
+        "                \"Name\": user[\"name\"],\n",
+        "                \"Role\": \"Validator\",\n",
+        "                \"Email\": user[\"email\"],\n",
+        "            }\n",
+        "            for user in data[7:]\n",
+        "        ],\n",
+        "    }\n",
+        "\n",
+        "\n",
+        "result = run_test(\"my_custom_tests.ExternalAPI\")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Again, you can add this to your documentation to see how it looks:\n",
+        "\n",
+        "![screenshot showing external API custom test](./external-data-custom-test.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_3__'></a>\n",
+        "\n",
+        "### Custom Test: Passing Parameters\n",
+        "\n",
+        "Custom test functions, as stated earlier, can take both inputs and params. When you define your function there is no need to distinguish between the two, the ValidMind Library will handle that for you. You simply need to add both to the function as arguments and the library will pass in the correct values.\n",
+        "\n",
+        "So for instance, if you wanted to parameterize the first custom test we created, the confusion matrix, you could do so like this:\n",
+        "\n",
+        "```python\n",
+        "def confusion_matrix(dataset: VMDataset, model: VMModel, my_param: str = \"Default Value\"):\n",
+        "    pass\n",
+        "```\n",
+        "\n",
+        "And then when you run the test, you can pass in the parameter like this:\n",
+        "\n",
+        "```python\n",
+        "run_test(\n",
+        "    \"my_custom_tests.ConfusionMatrix\",\n",
+        "    inputs={\"model\": \"model\", \"dataset\": \"test_dataset\"},\n",
+        "    params={\"my_param\": \"My Value\"},\n",
+        ")\n",
+        "```\n",
+        "\n",
+        "Or if you are running the entire documentation template, you would update the config like this:\n",
+        "\n",
+        "```python\n",
+        "test_config[\"my_custom_tests.ConfusionMatrix\"] = {\n",
+        "    \"inputs\": {\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "        \"model\": \"model\",\n",
+        "    },\n",
+        "    \"params\": {\n",
+        "        \"my_param\": \"My Value\",\n",
+        "    },\n",
+        "}\n",
+        "```\n",
+        "\n",
+        "Let's go ahead and create a toy test that takes a parameter and uses it in the result:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import plotly.express as px\n",
+        "\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.ParameterExample\")\n",
+        "def parameter_example(\n",
+        "    plot_title=\"Default Plot Title\", x_col=\"sepal_width\", y_col=\"sepal_length\"\n",
+        "):\n",
+        "    \"\"\"This test takes two parameters and creates a scatter plot based on them.\n",
+        "\n",
+        "    The purpose of this test is to demonstrate how to create a test that takes\n",
+        "    parameters and uses them to generate a plot. This can be useful for creating\n",
+        "    tests that are more flexible and can be used in a variety of scenarios.\n",
+        "    \"\"\"\n",
+        "    # return px.scatter(px.data.iris(), x=x_col, y=y_col, color=\"species\")\n",
+        "    return px.scatter(\n",
+        "        px.data.iris(), x=x_col, y=y_col, color=\"species\", title=plot_title\n",
+        "    )\n",
+        "\n",
+        "\n",
+        "result = run_test(\n",
+        "    \"my_custom_tests.ParameterExample\",\n",
+        "    params={\n",
+        "        \"plot_title\": \"My Cool Plot\",\n",
+        "        \"x_col\": \"sepal_width\",\n",
+        "        \"y_col\": \"sepal_length\",\n",
+        "    },\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Play around with this and see how you can use parameters, default values and other features to make your custom tests more flexible and useful.\n",
+        "\n",
+        "Here's how this one looks in the documentation:\n",
+        "![screenshot showing parameterized test](./parameterized-custom-metric.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4__'></a>\n",
+        "\n",
+        "### Custom Test: Multiple Tables and Plots in a Single Test\n",
+        "\n",
+        "Custom test functions, as stated earlier, can return more than just one table or plot. In fact, any number of tables and plots can be returned. Let's see an example of this:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import numpy as np\n",
+        "import plotly.express as px\n",
+        "\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.ComplexOutput\")\n",
+        "def complex_output():\n",
+        "    \"\"\"This test demonstrates how to return many tables and figures in a single test\"\"\"\n",
+        "    # create a couple tables\n",
+        "    table = [{\"A\": 1, \"B\": 2}, {\"A\": 3, \"B\": 4}]\n",
+        "    table2 = [{\"C\": 5, \"D\": 6}, {\"C\": 7, \"D\": 8}]\n",
+        "\n",
+        "    # create a few figures showing some random data\n",
+        "    fig1 = px.line(x=np.arange(10), y=np.random.rand(10), title=\"Random Line Plot\")\n",
+        "    fig2 = px.bar(x=[\"A\", \"B\", \"C\"], y=np.random.rand(3), title=\"Random Bar Plot\")\n",
+        "    fig3 = px.scatter(\n",
+        "        x=np.random.rand(10), y=np.random.rand(10), title=\"Random Scatter Plot\"\n",
+        "    )\n",
+        "\n",
+        "    return (\n",
+        "        {\n",
+        "            \"My Cool Table\": table,\n",
+        "            \"Another Table\": table2,\n",
+        "        },\n",
+        "        {\n",
+        "            # Figures support the same dict-of-titles convention as tables.\n",
+        "            # These titles flow into the document media registry as\n",
+        "            # \"Figure N. <title>\" alongside table captions.\n",
+        "            \"Random Line Plot\": fig1,\n",
+        "            \"Random Bar Plot\": fig2,\n",
+        "            \"Random Scatter Plot\": fig3,\n",
+        "        },\n",
+        "    )\n",
+        "\n",
+        "\n",
+        "result = run_test(\"my_custom_tests.ComplexOutput\")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Notice how you can return the tables as a dictionary where the key is the title of the table and the value is the table itself. The same convention works for **figures** — wrap them in a dict whose keys are the titles you want shown in the document media registry (e.g. *Figure 7. Random Line Plot*). You could also just return the figures by themselves but this way you can give them a title to more easily identify them in the result.\n",
+        "\n",
+        "![screenshot showing multiple tables and plots](./multiple-tables-plots-custom-metric.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_5__'></a>\n",
+        "\n",
+        "### Custom Test: Images\n",
+        "\n",
+        "If you are using a plotting library that isn't supported by ValidMind (i.e. not `matplotlib` or `plotly`), you can still return the image directly as a bytes-like object. This could also be used to bring any type of image into your documentation in a programmatic way. For instance, you may want to include a diagram of your model architecture or a screenshot of a dashboard that your model is integrated with. As long as you can produce the image with Python or open it from a file, you can include it in your documentation."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import io\n",
+        "import matplotlib.pyplot as plt\n",
+        "\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.Image\")\n",
+        "def image():\n",
+        "    \"\"\"This test demonstrates how to return an image in a test\"\"\"\n",
+        "\n",
+        "    # create a simple plot\n",
+        "    fig, ax = plt.subplots()\n",
+        "    ax.plot([1, 2, 3, 4])\n",
+        "    ax.set_title(\"Simple Line Plot\")\n",
+        "\n",
+        "    # save the plot as a PNG image (in-memory buffer)\n",
+        "    img_data = io.BytesIO()\n",
+        "    fig.savefig(img_data, format=\"png\")\n",
+        "    img_data.seek(0)\n",
+        "\n",
+        "    plt.close()  # close the plot to avoid displaying it\n",
+        "\n",
+        "    return img_data.read()\n",
+        "\n",
+        "\n",
+        "result = run_test(\"my_custom_tests.Image\")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Adding this custom test to your documentation will display the image:\n",
+        "\n",
+        "![screenshot showing image custom test](./image-in-custom-metric.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If you want to log an image as a test result, you can do so by passing the path to the image as a parameter to the custom test and then opening the file in the test function. Here's an example:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.MyPNGCorrelationMatrix\")\n",
+        "def Image(path: str):\n",
+        "    \"\"\"Opens a png image file and logs it as a test result to ValidMind\"\"\"\n",
+        "    if not path.endswith(\".png\"):\n",
+        "        raise ValueError(\"Image must be a PNG file\")\n",
+        "\n",
+        "    # return raw image bytes\n",
+        "    with open(path, \"rb\") as f:\n",
+        "        return f.read()\n",
+        "    \n",
+        "run_test(\n",
+        "    \"my_custom_tests.MyPNGCorrelationMatrix\",\n",
+        "    params={\"path\": \"./pearson-correlation-matrix.png\"},\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "The image is displayed in the test result:\n",
+        "\n",
+        "![screenshot showing image from file](./pearson-correlation-matrix-test-output.png)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_6__'></a>\n",
+        "\n",
+        "### Custom Test: Description\n",
+        "\n",
+        "If you want to write your own description for a custom test instead of having it generated by an LLM, you can do so by returning a string from your test."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.MyCustomTest\")\n",
+        "def my_custom_test(dataset, model):\n",
+        "    \"\"\"\n",
+        "    This is a custom computed test that computes confusion matrix for a binary classification model and return  a string as a test description.\n",
+        "    \"\"\"\n",
+        "    y_true = dataset.y\n",
+        "    y_pred = dataset.y_pred(model)\n",
+        "\n",
+        "    confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
+        "\n",
+        "    cm_display = metrics.ConfusionMatrixDisplay(\n",
+        "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
+        "    )\n",
+        "    cm_display.plot()\n",
+        "\n",
+        "    plt.close()  # close the plot to avoid displaying it\n",
+        "\n",
+        "    return cm_display.figure_, \"Test Description - Confusion Matrix\", pd.DataFrame({\"Value\": [1, 2, 3]})  # return the figure object itself\n",
+        "\n"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You can see here that the test result description has been customized. The same result description will be displayed in the UI."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.MyCustomTest\",\n",
+        "    inputs={\"model\": \"model\", \"dataset\": \"test_dataset\"},\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Conclusion\n",
+        "\n",
+        "In this notebook, we have demonstrated how to create custom tests in ValidMind. We have shown how to define custom test functions, register them with the ValidMind Library, run them against models and datasets, and add them to model documentation templates. We have also shown how to return tables and plots from custom tests and how to use them in the ValidMind Platform. We hope this tutorial has been helpful in understanding how to create and use custom tests in ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc8_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc8_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-bcdac57ebb8d440f86ba120ee6511db3"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "Python 3 (ipykernel)",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.11.5"
+    }
   },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "- [Implement a Custom Test](#toc3__)    \n",
-    "- [Run the Custom Test](#toc4__)    \n",
-    "  - [Setup the Model and Dataset](#toc4_1__)    \n",
-    "  - [Run the Custom Test](#toc4_2__)    \n",
-    "- [Adding Custom Test to Model Documentation](#toc5__)    \n",
-    "- [Some More Custom Tests](#toc6__)    \n",
-    "  - [Custom Test: Table of Model Hyperparameters](#toc6_1__)    \n",
-    "  - [Custom Test: External API Call](#toc6_2__)    \n",
-    "  - [Custom Test: Passing Parameters](#toc6_3__)    \n",
-    "  - [Custom Test: Multiple Tables and Plots in a Single Test](#toc6_4__)    \n",
-    "  - [Custom Test: Images](#toc6_5__)    \n",
-    "  - [Custom Test: Description](#toc6_6__)    \n",
-    "- [Conclusion](#toc7__)    \n",
-    "- [Next steps](#toc8__)    \n",
-    "  - [Work with your model documentation](#toc8_1__)    \n",
-    "  - [Discover more learning resources](#toc8_2__)    \n",
-    "- [Upgrade ValidMind](#toc9__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Implement a Custom Test\n",
-    "\n",
-    "Let's start off by creating a simple custom test that creates a Confusion Matrix for a binary classification model. We will use the `sklearn.metrics.confusion_matrix` function to calculate the confusion matrix and then display it using `sklearn.metrics.ConfusionMatrixDisplay`, which renders the plot with `matplotlib`. (This is already a built-in test in ValidMind, but we will use it as an example to demonstrate how to create custom tests.)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import matplotlib.pyplot as plt\n",
-    "from sklearn import metrics\n",
-    "\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
-    "def confusion_matrix(dataset, model):\n",
-    "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
-    "\n",
-    "    The confusion matrix is a 2x2 table that contains 4 values:\n",
-    "\n",
-    "    - True Positive (TP): the number of correct positive predictions\n",
-    "    - True Negative (TN): the number of correct negative predictions\n",
-    "    - False Positive (FP): the number of incorrect positive predictions\n",
-    "    - False Negative (FN): the number of incorrect negative predictions\n",
-    "\n",
-    "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
-    "    \"\"\"\n",
-    "    y_true = dataset.y\n",
-    "    y_pred = dataset.y_pred(model)\n",
-    "\n",
-    "    confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
-    "\n",
-    "    cm_display = metrics.ConfusionMatrixDisplay(\n",
-    "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
-    "    )\n",
-    "    cm_display.plot()\n",
-    "\n",
-    "    plt.close()  # close the plot to avoid displaying it\n",
-    "\n",
-    "    return cm_display.figure_  # return the figure object itself"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "That's our custom test defined and ready to go... Let's take a look at what's going on here:\n",
-    "\n",
-    "- The function `confusion_matrix` takes two arguments `dataset` and `model`. This is a VMDataset and VMModel object respectively.\n",
-    "- The function docstring provides a description of what the test does. This will be displayed along with the result in this notebook as well as in the ValidMind Platform.\n",
-    "- The function body calculates the confusion matrix using the `sklearn.metrics.confusion_matrix` function and then plots it using `sklearn.metrics.ConfusionMatrixDisplay`.\n",
-    "- The function then returns the `ConfusionMatrixDisplay.figure_` object - this is important as the ValidMind Library expects the output of the custom test to be a plot or a table.\n",
-    "- The `@vm.test` decorator is doing the work of creating a wrapper around the function that will allow it to be run by the ValidMind Library. It also registers the test so it can be found by the ID `my_custom_tests.ConfusionMatrix` (see the section below on how test IDs work in ValidMind and why this format is important)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Run the Custom Test\n",
-    "\n",
-    "Now that we have defined and registered our custom test, let's see how we can run it and properly use it in the ValidMind Platform."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Setup the Model and Dataset\n",
-    "\n",
-    "First, let's set up an example model and dataset to run our custom metric against. Since this is a Confusion Matrix, we will use the Customer Churn dataset that ValidMind provides and train a simple XGBoost model."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost as xgb\n",
-    "from validmind.datasets.classification import customer_churn\n",
-    "\n",
-    "raw_df = customer_churn.load_data()\n",
-    "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)\n",
-    "\n",
-    "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_train = train_df[customer_churn.target_column]\n",
-    "x_val = validation_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_val = validation_df[customer_churn.target_column]\n",
-    "\n",
-    "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
-    "model.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "model.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    "    eval_set=[(x_val, y_val)],\n",
-    "    verbose=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Easy enough! Now we have a model and dataset setup and trained. One last thing to do is bring the dataset and model into the ValidMind Library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# for now, we'll just use the test dataset\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    target_column=customer_churn.target_column,\n",
-    "    input_id=\"test_dataset\",\n",
-    ")\n",
-    "\n",
-    "vm_model = vm.init_model(model, input_id=\"model\")\n",
-    "\n",
-    "# link the model to the dataset\n",
-    "vm_test_ds.assign_predictions(model=vm_model)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Run the Custom Test\n",
-    "\n",
-    "Now that we have our model and dataset setup, we have everything we need to run our custom test. We can do this by importing the `run_test` function from the `validmind.tests` module and passing in the test ID of our custom test along with the model and dataset we want to run it against.\n",
-    "\n",
-    ">Notice how the `inputs` dictionary is used to map an `input_id` which we set above to the `model` and `dataset` keys that are expected by our custom test function. This is how the ValidMind Library knows which inputs to pass to different tests and is key when using many different datasets and models."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.tests import run_test\n",
-    "\n",
-    "result = run_test(\n",
-    "    \"my_custom_tests.ConfusionMatrix\",\n",
-    "    inputs={\"model\": \"model\", \"dataset\": \"test_dataset\"},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You'll notice that the docstring becomes a markdown description of the test. The figure is then displayed as the test result. What you see above is how it will look in the ValidMind Platform as well. Let's go ahead and log the result to see how that works."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Adding Custom Test to Model Documentation\n",
-    "\n",
-    "To do this, go to the documentation page of the model you registered above and navigate to the `Model Development` -> `Model Evaluation` section. Then hover between any existing content block to reveal the `+` button as shown in the screenshot below.\n",
-    "\n",
-    "![screenshot showing insert button for test-driven blocks](./insert-test-driven-block.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now click on the `+` button and select the `Test-Driven Block` option. This will open a dialog where you can select `My Custom Tests Confusion Matrix` from the list of available tests. You can preview the result and then click `Insert Block` to add it to the documentation.\n",
-    "\n",
-    "![screenshot showing how to insert a test-driven block](./insert-test-driven-block-custom.png)\n",
-    "\n",
-    "The test should match the result you see above. It is now part of your documentation and will now be run every time you run `vm.run_documentation_tests()` for your model. Let's do that now."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.reload()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If you preview the template, it should show the custom test in the `Model Development`->`Model Evaluation` section:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Just so we can run all of the tests in the template, let's initialize the train and raw dataset.\n",
-    "\n",
-    "(Refer to [**Quickstart for model documentation**](../../../quickstart/quickstart_model_documentation.ipynb) and the ValidMind docs for more information on what we are doing here)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=raw_df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    "    class_labels=customer_churn.class_labels,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    ")\n",
-    "vm_train_ds.assign_predictions(model=vm_model)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "To run all the tests in the template, you can use the `vm.run_documentation_tests()` and pass the inputs we initialized above and the demo config from our customer_churn module. We will have to add a section to the config for our new test to tell it which inputs it should receive. This is done by simply adding a new element in the config dictionary where the key is the ID of the test and the value is a dictionary with the following structure:\n",
-    "```python\n",
-    "{\n",
-    "    \"inputs\": {\n",
-    "        \"model\": \"model\",\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "    }\n",
-    "}\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.utils import preview_test_config\n",
-    "\n",
-    "test_config = customer_churn.get_demo_test_config()\n",
-    "test_config[\"my_custom_tests.ConfusionMatrix\"] = {\n",
-    "    \"inputs\": {\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "        \"model\": \"model\",\n",
-    "    }\n",
-    "}\n",
-    "preview_test_config(test_config)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = vm.run_documentation_tests(config=test_config)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Some More Custom Tests\n",
-    "\n",
-    "Now that you understand the entire process of creating custom tests and using them in your documentation, let's create a few more to see different ways you can utilize custom tests."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Custom Test: Table of Model Hyperparameters\n",
-    "\n",
-    "This custom test will display a table of the hyperparameters used in the model:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.Hyperparameters\")\n",
-    "def hyperparameters(model):\n",
-    "    \"\"\"The hyperparameters of a machine learning model are the settings that control the learning process.\n",
-    "    These settings are specified before the learning process begins and can have a significant impact on the\n",
-    "    performance of the model.\n",
-    "\n",
-    "    The hyperparameters of a model can be used to tune the model to achieve the best possible performance\n",
-    "    on a given dataset. By examining the hyperparameters of a model, you can gain insight into how the model\n",
-    "    was trained and how it might be improved.\n",
-    "    \"\"\"\n",
-    "    hyperparameters = model.model.get_xgb_params()  # dictionary of hyperparameters\n",
-    "\n",
-    "    # turn the dictionary into a table where each row contains a hyperparameter and its value\n",
-    "    return [{\"Hyperparam\": k, \"Value\": v} for k, v in hyperparameters.items() if v]\n",
-    "\n",
-    "\n",
-    "result = run_test(\"my_custom_tests.Hyperparameters\", inputs={\"model\": \"model\"})\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Since the test has been run and logged, you can add it to your documentation using the same process as above. It should look like this:\n",
-    "\n",
-    "![screenshot showing hyperparameters test](./hyperparameters-custom-metric.png)\n",
-    "\n",
-    "For our simple toy model, there aren't really any proper hyperparameters but you can see how this could be useful for more complex models that have gone through hyperparameter tuning."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Custom Test: External API Call\n",
-    "\n",
-    "This custom test will make an external API call to get a list of fake users and display them as a set of tables. This demonstrates how you might integrate external data sources into your model documentation in a programmatic way. You could, for instance, set up a pipeline that runs a test like this every day to keep your model documentation in sync with an external system."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import requests\n",
-    "import random\n",
-    "\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.ExternalAPI\")\n",
-    "def external_api():\n",
-    "    \"\"\"This test calls an external API to get a list of fake users. It then creates\n",
-    "    a table with the relevant data so it can be displayed in the documentation.\n",
-    "\n",
-    "    The purpose of this test is to demonstrate how to call an external API and use the\n",
-    "    data in a test. A test like this could even be setup to run in a scheduled\n",
-    "    pipeline to keep your documentation in-sync with an external data source.\n",
-    "    \"\"\"\n",
-    "    url = \"https://jsonplaceholder.typicode.com/users\"\n",
-    "    response = requests.get(url)\n",
-    "    data = response.json()\n",
-    "\n",
-    "    # extract the time and the current BTC price in USD\n",
-    "    return {\n",
-    "        \"Model Owners/Stakeholders\": [\n",
-    "            {\n",
-    "                \"Name\": user[\"name\"],\n",
-    "                \"Role\": random.choice([\"Owner\", \"Stakeholder\"]),\n",
-    "                \"Email\": user[\"email\"],\n",
-    "                \"Phone\": user[\"phone\"],\n",
-    "                \"Slack Handle\": f\"@{user['name'].lower().replace(' ', '.')}\",\n",
-    "            }\n",
-    "            for user in data[:3]\n",
-    "        ],\n",
-    "        \"Model Developers\": [\n",
-    "            {\n",
-    "                \"Name\": user[\"name\"],\n",
-    "                \"Role\": \"Developer\",\n",
-    "                \"Email\": user[\"email\"],\n",
-    "            }\n",
-    "            for user in data[3:7]\n",
-    "        ],\n",
-    "        \"Model Validators\": [\n",
-    "            {\n",
-    "                \"Name\": user[\"name\"],\n",
-    "                \"Role\": \"Validator\",\n",
-    "                \"Email\": user[\"email\"],\n",
-    "            }\n",
-    "            for user in data[7:]\n",
-    "        ],\n",
-    "    }\n",
-    "\n",
-    "\n",
-    "result = run_test(\"my_custom_tests.ExternalAPI\")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Again, you can add this to your documentation to see how it looks:\n",
-    "\n",
-    "![screenshot showing external API custom test result](./external-data-custom-test.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3__'></a>\n",
-    "\n",
-    "### Custom Test: Passing Parameters\n",
-    "\n",
-    "Custom test functions, as stated earlier, can take both inputs and params. When you define your function there is no need to distinguish between the two, the ValidMind Library will handle that for you. You simply need to add both to the function as arguments and the library will pass in the correct values.\n",
-    "\n",
-    "So for instance, if you wanted to parameterize the first custom test we created, the confusion matrix, you could do so like this:\n",
-    "\n",
-    "```python\n",
-    "def confusion_matrix(dataset: VMDataset, model: VMModel, my_param: str = \"Default Value\"):\n",
-    "    pass\n",
-    "```\n",
-    "\n",
-    "And then when you run the test, you can pass in the parameter like this:\n",
-    "\n",
-    "```python\n",
-    "vm.run_test(\n",
-    "    \"my_custom_tests.ConfusionMatrix\",\n",
-    "    inputs={\"model\": \"model\", \"dataset\": \"test_dataset\"},\n",
-    "    params={\"my_param\": \"My Value\"},\n",
-    ")\n",
-    "```\n",
-    "\n",
-    "Or if you are running the entire documentation template, you would update the config like this:\n",
-    "\n",
-    "```python\n",
-    "test_config[\"my_custom_tests.ConfusionMatrix\"] = {\n",
-    "    \"inputs\": {\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "        \"model\": \"model\",\n",
-    "    },\n",
-    "    \"params\": {\n",
-    "        \"my_param\": \"My Value\",\n",
-    "    },\n",
-    "}\n",
-    "```\n",
-    "\n",
-    "Let's go ahead and create a toy test that takes a parameter and uses it in the result:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import plotly.express as px\n",
-    "\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.ParameterExample\")\n",
-    "def parameter_example(\n",
-    "    plot_title=\"Default Plot Title\", x_col=\"sepal_width\", y_col=\"sepal_length\"\n",
-    "):\n",
-    "    \"\"\"This test takes two parameters and creates a scatter plot based on them.\n",
-    "\n",
-    "    The purpose of this test is to demonstrate how to create a test that takes\n",
-    "    parameters and uses them to generate a plot. This can be useful for creating\n",
-    "    tests that are more flexible and can be used in a variety of scenarios.\n",
-    "    \"\"\"\n",
-    "    # return px.scatter(px.data.iris(), x=x_col, y=y_col, color=\"species\")\n",
-    "    return px.scatter(\n",
-    "        px.data.iris(), x=x_col, y=y_col, color=\"species\", title=plot_title\n",
-    "    )\n",
-    "\n",
-    "\n",
-    "result = run_test(\n",
-    "    \"my_custom_tests.ParameterExample\",\n",
-    "    params={\n",
-    "        \"plot_title\": \"My Cool Plot\",\n",
-    "        \"x_col\": \"sepal_width\",\n",
-    "        \"y_col\": \"sepal_length\",\n",
-    "    },\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Play around with this and see how you can use parameters, default values and other features to make your custom tests more flexible and useful.\n",
-    "\n",
-    "Here's how this one looks in the documentation:\n",
-    "![screenshot showing parameterized test](./parameterized-custom-metric.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4__'></a>\n",
-    "\n",
-    "### Custom Test: Multiple Tables and Plots in a Single Test\n",
-    "\n",
-    "Custom test functions, as stated earlier, can return more than just one table or plot. In fact, any number of tables and plots can be returned. Let's see an example of this:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import numpy as np\n",
-    "import plotly.express as px\n",
-    "\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.ComplexOutput\")\n",
-    "def complex_output():\n",
-    "    \"\"\"This test demonstrates how to return many tables and figures in a single test\"\"\"\n",
-    "    # create a couple tables\n",
-    "    table = [{\"A\": 1, \"B\": 2}, {\"A\": 3, \"B\": 4}]\n",
-    "    table2 = [{\"C\": 5, \"D\": 6}, {\"C\": 7, \"D\": 8}]\n",
-    "\n",
-    "    # create a few figures showing some random data\n",
-    "    fig1 = px.line(x=np.arange(10), y=np.random.rand(10), title=\"Random Line Plot\")\n",
-    "    fig2 = px.bar(x=[\"A\", \"B\", \"C\"], y=np.random.rand(3), title=\"Random Bar Plot\")\n",
-    "    fig3 = px.scatter(\n",
-    "        x=np.random.rand(10), y=np.random.rand(10), title=\"Random Scatter Plot\"\n",
-    "    )\n",
-    "\n",
-    "    return (\n",
-    "        {\n",
-    "            \"My Cool Table\": table,\n",
-    "            \"Another Table\": table2,\n",
-    "        },\n",
-    "        fig1,\n",
-    "        fig2,\n",
-    "        fig3,\n",
-    "    )\n",
-    "\n",
-    "\n",
-    "result = run_test(\"my_custom_tests.ComplexOutput\")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Notice how you can return the tables as a dictionary where the key is the title of the table and the value is the table itself. You could also just return the tables by themselves but this way you can give them a title to more easily identify them in the result.\n",
-    "\n",
-    "![screenshot showing multiple tables and plots](./multiple-tables-plots-custom-metric.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_5__'></a>\n",
-    "\n",
-    "### Custom Test: Images\n",
-    "\n",
-    "If you are using a plotting library that isn't supported by ValidMind (i.e. not `matplotlib` or `plotly`), you can still return the image directly as a bytes-like object. This could also be used to bring any type of image into your documentation in a programmatic way. For instance, you may want to include a diagram of your model architecture or a screenshot of a dashboard that your model is integrated with. As long as you can produce the image with Python or open it from a file, you can include it in your documentation."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import io\n",
-    "import matplotlib.pyplot as plt\n",
-    "\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.Image\")\n",
-    "def image():\n",
-    "    \"\"\"This test demonstrates how to return an image in a test\"\"\"\n",
-    "\n",
-    "    # create a simple plot\n",
-    "    fig, ax = plt.subplots()\n",
-    "    ax.plot([1, 2, 3, 4])\n",
-    "    ax.set_title(\"Simple Line Plot\")\n",
-    "\n",
-    "    # save the plot as a PNG image (in-memory buffer)\n",
-    "    img_data = io.BytesIO()\n",
-    "    fig.savefig(img_data, format=\"png\")\n",
-    "    img_data.seek(0)\n",
-    "\n",
-    "    plt.close()  # close the plot to avoid displaying it\n",
-    "\n",
-    "    return img_data.read()\n",
-    "\n",
-    "\n",
-    "result = run_test(\"my_custom_tests.Image\")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Adding this custom test to your documentation will display the image:\n",
-    "\n",
-    "![screenshot showing image custom test](./image-in-custom-metric.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If you want to log an image as a test result, you can do so by passing the path to the image as a parameter to the custom test and then opening the file in the test function. Here's an example:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.MyPNGCorrelationMatrix\")\n",
-    "def Image(path: str):\n",
-    "    \"\"\"Opens a png image file and logs it as a test result to ValidMind\"\"\"\n",
-    "    if not path.endswith(\".png\"):\n",
-    "        raise ValueError(\"Image must be a PNG file\")\n",
-    "\n",
-    "    # return raw image bytes\n",
-    "    with open(path, \"rb\") as f:\n",
-    "        return f.read()\n",
-    "    \n",
-    "run_test(\n",
-    "    \"my_custom_tests.MyPNGCorrelationMatrix\",\n",
-    "    params={\"path\": \"./pearson-correlation-matrix.png\"},\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "The image is displayed in the test result:\n",
-    "\n",
-    "![screenshot showing image from file](./pearson-correlation-matrix-test-output.png)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_6__'></a>\n",
-    "\n",
-    "### Custom Test: Description\n",
-    "\n",
-    "If you want to write a custom test description for your custom test instead of it is interpreted through llm, you can do so by returning string in your test."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.MyCustomTest\")\n",
-    "def my_custom_test(dataset, model):\n",
-    "    \"\"\"\n",
-    "    This is a custom computed test that computes confusion matrix for a binary classification model and return  a string as a test description.\n",
-    "    \"\"\"\n",
-    "    y_true = dataset.y\n",
-    "    y_pred = dataset.y_pred(model)\n",
-    "\n",
-    "    confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
-    "\n",
-    "    cm_display = metrics.ConfusionMatrixDisplay(\n",
-    "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
-    "    )\n",
-    "    cm_display.plot()\n",
-    "\n",
-    "    plt.close()  # close the plot to avoid displaying it\n",
-    "\n",
-    "    return cm_display.figure_, \"Test Description - Confusion Matrix\", pd.DataFrame({\"Value\": [1, 2, 3]})  # return the figure object itself\n",
-    "\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You can see here test result description has been customized here. The same result description will be displayed in the UI."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.MyCustomTest\",\n",
-    "    inputs={\"model\": \"model\", \"dataset\": \"test_dataset\"},\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Conclusion\n",
-    "\n",
-    "In this notebook, we have demonstrated how to create custom tests in ValidMind. We have shown how to define custom test functions, register them with the ValidMind Library, run them against models and datasets, and add them to model documentation templates. We have also shown how to return tables and plots from custom tests and how to use them in the ValidMind Platform. We hope this tutorial has been helpful in understanding how to create and use custom tests in ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc8_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc8_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-bcdac57ebb8d440f86ba120ee6511db3",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "Python 3 (ipykernel)",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.11.5"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 4
-}
+  "nbformat": 4,
+  "nbformat_minor": 4
+}
\ No newline at end of file
diff --git a/site/notebooks/how_to/tests/custom_tests/integrate_external_test_providers.ipynb b/site/notebooks/how_to/tests/custom_tests/integrate_external_test_providers.ipynb
index eaff3a5790..df995d23ae 100644
--- a/site/notebooks/how_to/tests/custom_tests/integrate_external_test_providers.ipynb
+++ b/site/notebooks/how_to/tests/custom_tests/integrate_external_test_providers.ipynb
@@ -113,7 +113,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind's suite of tools enables organizations to identify, document, and manage model risks for all types of models, including AI/ML models, LLMs, and statistical models. As a model developer, you use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+    "\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "If this is your first time trying out ValidMind, we recommend going through the following resources first:\n",
     "\n",
@@ -126,7 +128,7 @@
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
    ]
   },
   {
@@ -175,17 +177,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
+    "\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -196,10 +200,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `Binary classification`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -213,11 +219,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -894,23 +902,23 @@
     "\n",
     "<a id='toc9_1__'></a>\n",
     "\n",
-    "### Work with your model documentation\n",
+    "### Work with your documentation\n",
     "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
+    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
     "\n",
     "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
     "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
+    "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
     "\n",
     "<a id='toc9_2__'></a>\n",
     "\n",
     "### Discover more learning resources\n",
     "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
+    "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
     "\n",
     "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
     "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
+    "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
     "\n",
     "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
    ]
diff --git a/site/notebooks/how_to/tests/explore_tests/explore_test_suites.ipynb b/site/notebooks/how_to/tests/explore_tests/explore_test_suites.ipynb
index 976eaedefe..2191dbd98e 100644
--- a/site/notebooks/how_to/tests/explore_tests/explore_test_suites.ipynb
+++ b/site/notebooks/how_to/tests/explore_tests/explore_test_suites.ipynb
@@ -1,962 +1,932 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Explore test suites\n",
-    "\n",
-    "Explore ValidMind test suites, pre-built collections of related tests used to evaluate specific aspects of your model. Retrieve available test suites and details for tests within a suite to understand their functionality, allowing you to select the appropriate test suites for your use cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Contents](#toc1__)    \n",
-    "- [About ValidMind](#toc2__)    \n",
-    "  - [Before you begin](#toc2_1__)    \n",
-    "  - [New to ValidMind?](#toc2_2__)    \n",
-    "  - [Key concepts](#toc2_3__)    \n",
-    "- [Install the ValidMind Library](#toc3__)    \n",
-    "- [List available test suites](#toc4__)    \n",
-    "- [View test suite details](#toc5__)    \n",
-    "  - [View test details](#toc5_1__)    \n",
-    "- [Next steps](#toc6__)    \n",
-    "  - [Discover more learning resources](#toc6_1__)    \n",
-    "- [Upgrade ValidMind](#toc7__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Contents\n",
-    "- [About ValidMind](#toc1_)    \n",
-    "  - [Before you begin](#toc1_1_)    \n",
-    "  - [New to ValidMind?](#toc1_2_)    \n",
-    "  - [Key concepts](#toc1_3_)    \n",
-    "- [Install the ValidMind Library](#toc2_)    \n",
-    "- [List available test suites](#toc3_)    \n",
-    "- [View test suite details](#toc4_)    \n",
-    "  - [View test details](#toc4_1_)           \n",
-    "- [Next steps](#toc5_)    \n",
-    "  - [Discover more learning resources](#toc5_1_)\n",
-    "  \n",
-    ":::\n",
-    "<!-- vscode-jupyter-toc-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/vscode-jupyter-toc-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## List available test suites\n",
-    "After we import the ValidMind Library, we'll call [test_suites.list_suites()](https://docs.validmind.ai/validmind/validmind/test_suites.html#list_suites) to retrieve a structured list of all available test suites, that includes each suite's name, description, and associated tests:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 2,
-   "metadata": {},
-   "outputs": [
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Explore test suites\n",
+        "\n",
+        "Explore ValidMind test suites, pre-built collections of related tests used to evaluate specific aspects of your model. Retrieve available test suites and details for tests within a suite to understand their functionality, allowing you to select the appropriate test suites for your use cases."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Install the ValidMind Library](#toc2__)    \n",
+        "- [List available test suites](#toc3__)    \n",
+        "- [View test suite details](#toc4__)    \n",
+        "  - [View test details](#toc4_1__)    \n",
+        "- [Next steps](#toc5__)    \n",
+        "  - [Discover more learning resources](#toc5_1__)    \n",
+        "- [Upgrade ValidMind](#toc6__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records (such as models) and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: A function that you define to evaluate your record or dataset. Custom tests can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records, typically used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets, typically used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test to supply extra information, customize the test's behavior, or provide further context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br><br>\n",
+        "Python 3.8 &lt;= x &lt;= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
     {
-     "data": {
-      "text/html": [
-       "<style type=\"text/css\">\n",
-       "#T_9e889 th {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "#T_9e889_row0_col0, #T_9e889_row0_col1, #T_9e889_row0_col2, #T_9e889_row0_col3, #T_9e889_row1_col0, #T_9e889_row1_col1, #T_9e889_row1_col2, #T_9e889_row1_col3, #T_9e889_row2_col0, #T_9e889_row2_col1, #T_9e889_row2_col2, #T_9e889_row2_col3, #T_9e889_row3_col0, #T_9e889_row3_col1, #T_9e889_row3_col2, #T_9e889_row3_col3, #T_9e889_row4_col0, #T_9e889_row4_col1, #T_9e889_row4_col2, #T_9e889_row4_col3, #T_9e889_row5_col0, #T_9e889_row5_col1, #T_9e889_row5_col2, #T_9e889_row5_col3, #T_9e889_row6_col0, #T_9e889_row6_col1, #T_9e889_row6_col2, #T_9e889_row6_col3, #T_9e889_row7_col0, #T_9e889_row7_col1, #T_9e889_row7_col2, #T_9e889_row7_col3, #T_9e889_row8_col0, #T_9e889_row8_col1, #T_9e889_row8_col2, #T_9e889_row8_col3, #T_9e889_row9_col0, #T_9e889_row9_col1, #T_9e889_row9_col2, #T_9e889_row9_col3, #T_9e889_row10_col0, #T_9e889_row10_col1, #T_9e889_row10_col2, #T_9e889_row10_col3, #T_9e889_row11_col0, #T_9e889_row11_col1, #T_9e889_row11_col2, #T_9e889_row11_col3, #T_9e889_row12_col0, #T_9e889_row12_col1, #T_9e889_row12_col2, #T_9e889_row12_col3, #T_9e889_row13_col0, #T_9e889_row13_col1, #T_9e889_row13_col2, #T_9e889_row13_col3, #T_9e889_row14_col0, #T_9e889_row14_col1, #T_9e889_row14_col2, #T_9e889_row14_col3, #T_9e889_row15_col0, #T_9e889_row15_col1, #T_9e889_row15_col2, #T_9e889_row15_col3, #T_9e889_row16_col0, #T_9e889_row16_col1, #T_9e889_row16_col2, #T_9e889_row16_col3, #T_9e889_row17_col0, #T_9e889_row17_col1, #T_9e889_row17_col2, #T_9e889_row17_col3, #T_9e889_row18_col0, #T_9e889_row18_col1, #T_9e889_row18_col2, #T_9e889_row18_col3, #T_9e889_row19_col0, #T_9e889_row19_col1, #T_9e889_row19_col2, #T_9e889_row19_col3, #T_9e889_row20_col0, #T_9e889_row20_col1, #T_9e889_row20_col2, #T_9e889_row20_col3, #T_9e889_row21_col0, #T_9e889_row21_col1, #T_9e889_row21_col2, #T_9e889_row21_col3, #T_9e889_row22_col0, #T_9e889_row22_col1, #T_9e889_row22_col2, #T_9e889_row22_col3, #T_9e889_row23_col0, #T_9e889_row23_col1, #T_9e889_row23_col2, #T_9e889_row23_col3, 
#T_9e889_row24_col0, #T_9e889_row24_col1, #T_9e889_row24_col2, #T_9e889_row24_col3, #T_9e889_row25_col0, #T_9e889_row25_col1, #T_9e889_row25_col2, #T_9e889_row25_col3, #T_9e889_row26_col0, #T_9e889_row26_col1, #T_9e889_row26_col2, #T_9e889_row26_col3, #T_9e889_row27_col0, #T_9e889_row27_col1, #T_9e889_row27_col2, #T_9e889_row27_col3, #T_9e889_row28_col0, #T_9e889_row28_col1, #T_9e889_row28_col2, #T_9e889_row28_col3, #T_9e889_row29_col0, #T_9e889_row29_col1, #T_9e889_row29_col2, #T_9e889_row29_col3 {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "</style>\n",
-       "<table id=\"T_9e889\">\n",
-       "  <thead>\n",
-       "    <tr>\n",
-       "      <th id=\"T_9e889_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
-       "      <th id=\"T_9e889_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
-       "      <th id=\"T_9e889_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
-       "      <th id=\"T_9e889_level0_col3\" class=\"col_heading level0 col3\" >Tests</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row0_col0\" class=\"data row0 col0\" >classifier_model_diagnosis</td>\n",
-       "      <td id=\"T_9e889_row0_col1\" class=\"data row0 col1\" >ClassifierDiagnosis</td>\n",
-       "      <td id=\"T_9e889_row0_col2\" class=\"data row0 col2\" >Test suite for sklearn classifier model diagnosis tests</td>\n",
-       "      <td id=\"T_9e889_row0_col3\" class=\"data row0 col3\" >validmind.model_validation.sklearn.OverfitDiagnosis, validmind.model_validation.sklearn.WeakspotsDiagnosis, validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row1_col0\" class=\"data row1 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_9e889_row1_col1\" class=\"data row1 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_9e889_row1_col2\" class=\"data row1 col2\" >Full test suite for binary classification models.</td>\n",
-       "      <td id=\"T_9e889_row1_col3\" class=\"data row1 col3\" >validmind.data_validation.DatasetDescription, validmind.data_validation.DescriptiveStatistics, validmind.data_validation.PearsonCorrelationMatrix, validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.HighCardinality, validmind.data_validation.HighPearsonCorrelation, validmind.data_validation.MissingValues, validmind.data_validation.Skewness, validmind.data_validation.UniqueRows, validmind.data_validation.TooManyZeroValues, validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.ConfusionMatrix, validmind.model_validation.sklearn.ClassifierPerformance, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.PrecisionRecallCurve, validmind.model_validation.sklearn.ROCCurve, validmind.model_validation.sklearn.PopulationStabilityIndex, validmind.model_validation.sklearn.SHAPGlobalImportance, validmind.model_validation.sklearn.MinimumAccuracy, validmind.model_validation.sklearn.MinimumF1Score, validmind.model_validation.sklearn.MinimumROCAUCScore, validmind.model_validation.sklearn.TrainingTestDegradation, validmind.model_validation.sklearn.ModelsPerformanceComparison, validmind.model_validation.sklearn.OverfitDiagnosis, validmind.model_validation.sklearn.WeakspotsDiagnosis, validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row2_col0\" class=\"data row2 col0\" >classifier_metrics</td>\n",
-       "      <td id=\"T_9e889_row2_col1\" class=\"data row2 col1\" >ClassifierMetrics</td>\n",
-       "      <td id=\"T_9e889_row2_col2\" class=\"data row2 col2\" >Test suite for sklearn classifier metrics</td>\n",
-       "      <td id=\"T_9e889_row2_col3\" class=\"data row2 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.ConfusionMatrix, validmind.model_validation.sklearn.ClassifierPerformance, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.PrecisionRecallCurve, validmind.model_validation.sklearn.ROCCurve, validmind.model_validation.sklearn.PopulationStabilityIndex, validmind.model_validation.sklearn.SHAPGlobalImportance</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row3_col0\" class=\"data row3 col0\" >classifier_model_validation</td>\n",
-       "      <td id=\"T_9e889_row3_col1\" class=\"data row3 col1\" >ClassifierModelValidation</td>\n",
-       "      <td id=\"T_9e889_row3_col2\" class=\"data row3 col2\" >Test suite for binary classification models.</td>\n",
-       "      <td id=\"T_9e889_row3_col3\" class=\"data row3 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.ConfusionMatrix, validmind.model_validation.sklearn.ClassifierPerformance, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.PrecisionRecallCurve, validmind.model_validation.sklearn.ROCCurve, validmind.model_validation.sklearn.PopulationStabilityIndex, validmind.model_validation.sklearn.SHAPGlobalImportance, validmind.model_validation.sklearn.MinimumAccuracy, validmind.model_validation.sklearn.MinimumF1Score, validmind.model_validation.sklearn.MinimumROCAUCScore, validmind.model_validation.sklearn.TrainingTestDegradation, validmind.model_validation.sklearn.ModelsPerformanceComparison, validmind.model_validation.sklearn.OverfitDiagnosis, validmind.model_validation.sklearn.WeakspotsDiagnosis, validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row4_col0\" class=\"data row4 col0\" >classifier_validation</td>\n",
-       "      <td id=\"T_9e889_row4_col1\" class=\"data row4 col1\" >ClassifierPerformance</td>\n",
-       "      <td id=\"T_9e889_row4_col2\" class=\"data row4 col2\" >Test suite for sklearn classifier models</td>\n",
-       "      <td id=\"T_9e889_row4_col3\" class=\"data row4 col3\" >validmind.model_validation.sklearn.MinimumAccuracy, validmind.model_validation.sklearn.MinimumF1Score, validmind.model_validation.sklearn.MinimumROCAUCScore, validmind.model_validation.sklearn.TrainingTestDegradation, validmind.model_validation.sklearn.ModelsPerformanceComparison</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row5_col0\" class=\"data row5 col0\" >cluster_full_suite</td>\n",
-       "      <td id=\"T_9e889_row5_col1\" class=\"data row5 col1\" >ClusterFullSuite</td>\n",
-       "      <td id=\"T_9e889_row5_col2\" class=\"data row5 col2\" >Full test suite for clustering models.</td>\n",
-       "      <td id=\"T_9e889_row5_col3\" class=\"data row5 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.HomogeneityScore, validmind.model_validation.sklearn.CompletenessScore, validmind.model_validation.sklearn.VMeasure, validmind.model_validation.sklearn.AdjustedRandIndex, validmind.model_validation.sklearn.AdjustedMutualInformation, validmind.model_validation.sklearn.FowlkesMallowsScore, validmind.model_validation.sklearn.ClusterPerformanceMetrics, validmind.model_validation.sklearn.ClusterCosineSimilarity, validmind.model_validation.sklearn.SilhouettePlot, validmind.model_validation.ClusterSizeDistribution, validmind.model_validation.sklearn.HyperParametersTuning, validmind.model_validation.sklearn.KMeansClustersOptimization</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row6_col0\" class=\"data row6 col0\" >cluster_metrics</td>\n",
-       "      <td id=\"T_9e889_row6_col1\" class=\"data row6 col1\" >ClusterMetrics</td>\n",
-       "      <td id=\"T_9e889_row6_col2\" class=\"data row6 col2\" >Test suite for sklearn clustering metrics</td>\n",
-       "      <td id=\"T_9e889_row6_col3\" class=\"data row6 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.HomogeneityScore, validmind.model_validation.sklearn.CompletenessScore, validmind.model_validation.sklearn.VMeasure, validmind.model_validation.sklearn.AdjustedRandIndex, validmind.model_validation.sklearn.AdjustedMutualInformation, validmind.model_validation.sklearn.FowlkesMallowsScore, validmind.model_validation.sklearn.ClusterPerformanceMetrics, validmind.model_validation.sklearn.ClusterCosineSimilarity, validmind.model_validation.sklearn.SilhouettePlot</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row7_col0\" class=\"data row7 col0\" >cluster_performance</td>\n",
-       "      <td id=\"T_9e889_row7_col1\" class=\"data row7 col1\" >ClusterPerformance</td>\n",
-       "      <td id=\"T_9e889_row7_col2\" class=\"data row7 col2\" >Test suite for sklearn cluster performance</td>\n",
-       "      <td id=\"T_9e889_row7_col3\" class=\"data row7 col3\" >validmind.model_validation.ClusterSizeDistribution</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row8_col0\" class=\"data row8 col0\" >embeddings_full_suite</td>\n",
-       "      <td id=\"T_9e889_row8_col1\" class=\"data row8 col1\" >EmbeddingsFullSuite</td>\n",
-       "      <td id=\"T_9e889_row8_col2\" class=\"data row8 col2\" >Full test suite for embeddings models.</td>\n",
-       "      <td id=\"T_9e889_row8_col3\" class=\"data row8 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.embeddings.DescriptiveAnalytics, validmind.model_validation.embeddings.CosineSimilarityDistribution, validmind.model_validation.embeddings.ClusterDistribution, validmind.model_validation.embeddings.EmbeddingsVisualization2D, validmind.model_validation.embeddings.StabilityAnalysisRandomNoise, validmind.model_validation.embeddings.StabilityAnalysisSynonyms, validmind.model_validation.embeddings.StabilityAnalysisKeyword, validmind.model_validation.embeddings.StabilityAnalysisTranslation</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row9_col0\" class=\"data row9 col0\" >embeddings_metrics</td>\n",
-       "      <td id=\"T_9e889_row9_col1\" class=\"data row9 col1\" >EmbeddingsMetrics</td>\n",
-       "      <td id=\"T_9e889_row9_col2\" class=\"data row9 col2\" >Test suite for embeddings metrics</td>\n",
-       "      <td id=\"T_9e889_row9_col3\" class=\"data row9 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.embeddings.DescriptiveAnalytics, validmind.model_validation.embeddings.CosineSimilarityDistribution, validmind.model_validation.embeddings.ClusterDistribution, validmind.model_validation.embeddings.EmbeddingsVisualization2D</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row10_col0\" class=\"data row10 col0\" >embeddings_model_performance</td>\n",
-       "      <td id=\"T_9e889_row10_col1\" class=\"data row10 col1\" >EmbeddingsPerformance</td>\n",
-       "      <td id=\"T_9e889_row10_col2\" class=\"data row10 col2\" >Test suite for embeddings model performance</td>\n",
-       "      <td id=\"T_9e889_row10_col3\" class=\"data row10 col3\" >validmind.model_validation.embeddings.StabilityAnalysisRandomNoise, validmind.model_validation.embeddings.StabilityAnalysisSynonyms, validmind.model_validation.embeddings.StabilityAnalysisKeyword, validmind.model_validation.embeddings.StabilityAnalysisTranslation</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row11_col0\" class=\"data row11 col0\" >hyper_parameters_optimization</td>\n",
-       "      <td id=\"T_9e889_row11_col1\" class=\"data row11 col1\" >KmeansParametersOptimization</td>\n",
-       "      <td id=\"T_9e889_row11_col2\" class=\"data row11 col2\" >Test suite for sklearn hyperparameters optimization</td>\n",
-       "      <td id=\"T_9e889_row11_col3\" class=\"data row11 col3\" >validmind.model_validation.sklearn.HyperParametersTuning, validmind.model_validation.sklearn.KMeansClustersOptimization</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row12_col0\" class=\"data row12 col0\" >llm_classifier_full_suite</td>\n",
-       "      <td id=\"T_9e889_row12_col1\" class=\"data row12 col1\" >LLMClassifierFullSuite</td>\n",
-       "      <td id=\"T_9e889_row12_col2\" class=\"data row12 col2\" >Full test suite for LLM classification models.</td>\n",
-       "      <td id=\"T_9e889_row12_col3\" class=\"data row12 col3\" >validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.nlp.StopWords, validmind.data_validation.nlp.Punctuations, validmind.data_validation.nlp.CommonWords, validmind.data_validation.nlp.TextDescription, validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.ConfusionMatrix, validmind.model_validation.sklearn.ClassifierPerformance, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.PrecisionRecallCurve, validmind.model_validation.sklearn.ROCCurve, validmind.model_validation.sklearn.PopulationStabilityIndex, validmind.model_validation.sklearn.SHAPGlobalImportance, validmind.model_validation.sklearn.MinimumAccuracy, validmind.model_validation.sklearn.MinimumF1Score, validmind.model_validation.sklearn.MinimumROCAUCScore, validmind.model_validation.sklearn.TrainingTestDegradation, validmind.model_validation.sklearn.ModelsPerformanceComparison, validmind.model_validation.sklearn.OverfitDiagnosis, validmind.model_validation.sklearn.WeakspotsDiagnosis, validmind.model_validation.sklearn.RobustnessDiagnosis, validmind.prompt_validation.Bias, validmind.prompt_validation.Clarity, validmind.prompt_validation.Conciseness, validmind.prompt_validation.Delimitation, validmind.prompt_validation.NegativeInstruction, validmind.prompt_validation.Robustness, validmind.prompt_validation.Specificity</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row13_col0\" class=\"data row13 col0\" >prompt_validation</td>\n",
-       "      <td id=\"T_9e889_row13_col1\" class=\"data row13 col1\" >PromptValidation</td>\n",
-       "      <td id=\"T_9e889_row13_col2\" class=\"data row13 col2\" >Test suite for prompt validation</td>\n",
-       "      <td id=\"T_9e889_row13_col3\" class=\"data row13 col3\" >validmind.prompt_validation.Bias, validmind.prompt_validation.Clarity, validmind.prompt_validation.Conciseness, validmind.prompt_validation.Delimitation, validmind.prompt_validation.NegativeInstruction, validmind.prompt_validation.Robustness, validmind.prompt_validation.Specificity</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row14_col0\" class=\"data row14 col0\" >nlp_classifier_full_suite</td>\n",
-       "      <td id=\"T_9e889_row14_col1\" class=\"data row14 col1\" >NLPClassifierFullSuite</td>\n",
-       "      <td id=\"T_9e889_row14_col2\" class=\"data row14 col2\" >Full test suite for NLP classification models.</td>\n",
-       "      <td id=\"T_9e889_row14_col3\" class=\"data row14 col3\" >validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.nlp.StopWords, validmind.data_validation.nlp.Punctuations, validmind.data_validation.nlp.CommonWords, validmind.data_validation.nlp.TextDescription, validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.ConfusionMatrix, validmind.model_validation.sklearn.ClassifierPerformance, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.PrecisionRecallCurve, validmind.model_validation.sklearn.ROCCurve, validmind.model_validation.sklearn.PopulationStabilityIndex, validmind.model_validation.sklearn.SHAPGlobalImportance, validmind.model_validation.sklearn.MinimumAccuracy, validmind.model_validation.sklearn.MinimumF1Score, validmind.model_validation.sklearn.MinimumROCAUCScore, validmind.model_validation.sklearn.TrainingTestDegradation, validmind.model_validation.sklearn.ModelsPerformanceComparison, validmind.model_validation.sklearn.OverfitDiagnosis, validmind.model_validation.sklearn.WeakspotsDiagnosis, validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row15_col0\" class=\"data row15 col0\" >regression_metrics</td>\n",
-       "      <td id=\"T_9e889_row15_col1\" class=\"data row15 col1\" >RegressionMetrics</td>\n",
-       "      <td id=\"T_9e889_row15_col2\" class=\"data row15 col2\" >Test suite for performance metrics of regression metrics</td>\n",
-       "      <td id=\"T_9e889_row15_col3\" class=\"data row15 col3\" >validmind.data_validation.DatasetSplit, validmind.model_validation.ModelMetadata, validmind.model_validation.sklearn.PermutationFeatureImportance</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row16_col0\" class=\"data row16 col0\" >regression_model_description</td>\n",
-       "      <td id=\"T_9e889_row16_col1\" class=\"data row16 col1\" >RegressionModelDescription</td>\n",
-       "      <td id=\"T_9e889_row16_col2\" class=\"data row16 col2\" >Test suite for performance metric of regression model of statsmodels library</td>\n",
-       "      <td id=\"T_9e889_row16_col3\" class=\"data row16 col3\" >validmind.data_validation.DatasetSplit, validmind.model_validation.ModelMetadata</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row17_col0\" class=\"data row17 col0\" >regression_models_evaluation</td>\n",
-       "      <td id=\"T_9e889_row17_col1\" class=\"data row17 col1\" >RegressionModelsEvaluation</td>\n",
-       "      <td id=\"T_9e889_row17_col2\" class=\"data row17 col2\" >Test suite for metrics comparison of regression model of statsmodels library</td>\n",
-       "      <td id=\"T_9e889_row17_col3\" class=\"data row17 col3\" >validmind.model_validation.statsmodels.RegressionModelCoeffs, validmind.model_validation.sklearn.RegressionModelsPerformanceComparison</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row18_col0\" class=\"data row18 col0\" >regression_full_suite</td>\n",
-       "      <td id=\"T_9e889_row18_col1\" class=\"data row18 col1\" >RegressionFullSuite</td>\n",
-       "      <td id=\"T_9e889_row18_col2\" class=\"data row18 col2\" >Full test suite for regression models.</td>\n",
-       "      <td id=\"T_9e889_row18_col3\" class=\"data row18 col3\" >validmind.data_validation.DatasetDescription, validmind.data_validation.DescriptiveStatistics, validmind.data_validation.PearsonCorrelationMatrix, validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.HighCardinality, validmind.data_validation.HighPearsonCorrelation, validmind.data_validation.MissingValues, validmind.data_validation.Skewness, validmind.data_validation.UniqueRows, validmind.data_validation.TooManyZeroValues, validmind.data_validation.DatasetSplit, validmind.model_validation.ModelMetadata, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.RegressionErrors, validmind.model_validation.sklearn.RegressionR2Square</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row19_col0\" class=\"data row19 col0\" >regression_performance</td>\n",
-       "      <td id=\"T_9e889_row19_col1\" class=\"data row19 col1\" >RegressionPerformance</td>\n",
-       "      <td id=\"T_9e889_row19_col2\" class=\"data row19 col2\" >Test suite for regression model performance</td>\n",
-       "      <td id=\"T_9e889_row19_col3\" class=\"data row19 col3\" >validmind.model_validation.sklearn.RegressionErrors, validmind.model_validation.sklearn.RegressionR2Square</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row20_col0\" class=\"data row20 col0\" >summarization_metrics</td>\n",
-       "      <td id=\"T_9e889_row20_col1\" class=\"data row20 col1\" >SummarizationMetrics</td>\n",
-       "      <td id=\"T_9e889_row20_col2\" class=\"data row20 col2\" >Test suite for Summarization metrics</td>\n",
-       "      <td id=\"T_9e889_row20_col3\" class=\"data row20 col3\" >validmind.model_validation.TokenDisparity, validmind.model_validation.BleuScore, validmind.model_validation.BertScore, validmind.model_validation.ContextualRecall</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row21_col0\" class=\"data row21 col0\" >tabular_dataset</td>\n",
-       "      <td id=\"T_9e889_row21_col1\" class=\"data row21 col1\" >TabularDataset</td>\n",
-       "      <td id=\"T_9e889_row21_col2\" class=\"data row21 col2\" >Test suite for tabular datasets.</td>\n",
-       "      <td id=\"T_9e889_row21_col3\" class=\"data row21 col3\" >validmind.data_validation.DatasetDescription, validmind.data_validation.DescriptiveStatistics, validmind.data_validation.PearsonCorrelationMatrix, validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.HighCardinality, validmind.data_validation.HighPearsonCorrelation, validmind.data_validation.MissingValues, validmind.data_validation.Skewness, validmind.data_validation.UniqueRows, validmind.data_validation.TooManyZeroValues</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row22_col0\" class=\"data row22 col0\" >tabular_dataset_description</td>\n",
-       "      <td id=\"T_9e889_row22_col1\" class=\"data row22 col1\" >TabularDatasetDescription</td>\n",
-       "      <td id=\"T_9e889_row22_col2\" class=\"data row22 col2\" >Test suite to extract metadata and descriptive\n",
-       "statistics from a tabular dataset</td>\n",
-       "      <td id=\"T_9e889_row22_col3\" class=\"data row22 col3\" >validmind.data_validation.DatasetDescription, validmind.data_validation.DescriptiveStatistics, validmind.data_validation.PearsonCorrelationMatrix</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row23_col0\" class=\"data row23 col0\" >tabular_data_quality</td>\n",
-       "      <td id=\"T_9e889_row23_col1\" class=\"data row23 col1\" >TabularDataQuality</td>\n",
-       "      <td id=\"T_9e889_row23_col2\" class=\"data row23 col2\" >Test suite for data quality on tabular datasets</td>\n",
-       "      <td id=\"T_9e889_row23_col3\" class=\"data row23 col3\" >validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.HighCardinality, validmind.data_validation.HighPearsonCorrelation, validmind.data_validation.MissingValues, validmind.data_validation.Skewness, validmind.data_validation.UniqueRows, validmind.data_validation.TooManyZeroValues</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row24_col0\" class=\"data row24 col0\" >text_data_quality</td>\n",
-       "      <td id=\"T_9e889_row24_col1\" class=\"data row24 col1\" >TextDataQuality</td>\n",
-       "      <td id=\"T_9e889_row24_col2\" class=\"data row24 col2\" >Test suite for data quality on text data</td>\n",
-       "      <td id=\"T_9e889_row24_col3\" class=\"data row24 col3\" >validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.nlp.StopWords, validmind.data_validation.nlp.Punctuations, validmind.data_validation.nlp.CommonWords, validmind.data_validation.nlp.TextDescription</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row25_col0\" class=\"data row25 col0\" >time_series_data_quality</td>\n",
-       "      <td id=\"T_9e889_row25_col1\" class=\"data row25 col1\" >TimeSeriesDataQuality</td>\n",
-       "      <td id=\"T_9e889_row25_col2\" class=\"data row25 col2\" >Test suite for data quality on time series datasets</td>\n",
-       "      <td id=\"T_9e889_row25_col3\" class=\"data row25 col3\" >validmind.data_validation.TimeSeriesOutliers, validmind.data_validation.TimeSeriesMissingValues, validmind.data_validation.TimeSeriesFrequency</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row26_col0\" class=\"data row26 col0\" >time_series_dataset</td>\n",
-       "      <td id=\"T_9e889_row26_col1\" class=\"data row26 col1\" >TimeSeriesDataset</td>\n",
-       "      <td id=\"T_9e889_row26_col2\" class=\"data row26 col2\" >Test suite for time series datasets.</td>\n",
-       "      <td id=\"T_9e889_row26_col3\" class=\"data row26 col3\" >validmind.data_validation.TimeSeriesOutliers, validmind.data_validation.TimeSeriesMissingValues, validmind.data_validation.TimeSeriesFrequency, validmind.data_validation.TimeSeriesLinePlot, validmind.data_validation.TimeSeriesHistogram, validmind.data_validation.ACFandPACFPlot, validmind.data_validation.SeasonalDecompose, validmind.data_validation.AutoSeasonality, validmind.data_validation.AutoStationarity, validmind.data_validation.RollingStatsPlot, validmind.data_validation.AutoAR, validmind.data_validation.AutoMA, validmind.data_validation.ScatterPlot, validmind.data_validation.LaggedCorrelationHeatmap, validmind.data_validation.EngleGrangerCoint, validmind.data_validation.SpreadPlot</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row27_col0\" class=\"data row27 col0\" >time_series_model_validation</td>\n",
-       "      <td id=\"T_9e889_row27_col1\" class=\"data row27 col1\" >TimeSeriesModelValidation</td>\n",
-       "      <td id=\"T_9e889_row27_col2\" class=\"data row27 col2\" >Test suite for time series model validation.</td>\n",
-       "      <td id=\"T_9e889_row27_col3\" class=\"data row27 col3\" >validmind.data_validation.DatasetSplit, validmind.model_validation.ModelMetadata, validmind.model_validation.statsmodels.RegressionModelCoeffs, validmind.model_validation.sklearn.RegressionModelsPerformanceComparison</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row28_col0\" class=\"data row28 col0\" >time_series_multivariate</td>\n",
-       "      <td id=\"T_9e889_row28_col1\" class=\"data row28 col1\" >TimeSeriesMultivariate</td>\n",
-       "      <td id=\"T_9e889_row28_col2\" class=\"data row28 col2\" >This test suite provides a preliminary understanding of the features\n",
-       "and relationship in multivariate dataset. It presents various\n",
-       "multivariate visualizations that can help identify patterns, trends,\n",
-       "and relationships between pairs of variables. The visualizations are\n",
-       "designed to explore the relationships between multiple features\n",
-       "simultaneously. They allow you to quickly identify any patterns or\n",
-       "trends in the data, as well as any potential outliers or anomalies.\n",
-       "The individual feature distribution can also be explored to provide\n",
-       "insight into the range and frequency of values observed in the data.\n",
-       "This multivariate analysis test suite aims to provide an overview of\n",
-       "the data structure and guide further exploration and modeling.</td>\n",
-       "      <td id=\"T_9e889_row28_col3\" class=\"data row28 col3\" >validmind.data_validation.ScatterPlot, validmind.data_validation.LaggedCorrelationHeatmap, validmind.data_validation.EngleGrangerCoint, validmind.data_validation.SpreadPlot</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_9e889_row29_col0\" class=\"data row29 col0\" >time_series_univariate</td>\n",
-       "      <td id=\"T_9e889_row29_col1\" class=\"data row29 col1\" >TimeSeriesUnivariate</td>\n",
-       "      <td id=\"T_9e889_row29_col2\" class=\"data row29 col2\" >This test suite provides a preliminary understanding of the target variable(s)\n",
-       "used in the time series dataset. It visualizations that present the raw time\n",
-       "series data and a histogram of the target variable(s).\n",
-       "\n",
-       "The raw time series data provides a visual inspection of the target variable's\n",
-       "behavior over time. This helps to identify any patterns or trends in the data,\n",
-       "as well as any potential outliers or anomalies. The histogram of the target\n",
-       "variable displays the distribution of values, providing insight into the range\n",
-       "and frequency of values observed in the data.</td>\n",
-       "      <td id=\"T_9e889_row29_col3\" class=\"data row29 col3\" >validmind.data_validation.TimeSeriesLinePlot, validmind.data_validation.TimeSeriesHistogram, validmind.data_validation.ACFandPACFPlot, validmind.data_validation.SeasonalDecompose, validmind.data_validation.AutoSeasonality, validmind.data_validation.AutoStationarity, validmind.data_validation.RollingStatsPlot, validmind.data_validation.AutoAR, validmind.data_validation.AutoMA</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n"
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
       ],
-      "text/plain": [
-       "<pandas.io.formats.style.Styler at 0x16a11ae00>"
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## List available test suites\n",
+        "After we import the ValidMind Library, we'll call [test_suites.list_suites()](https://docs.validmind.ai/validmind/validmind/test_suites.html#list_suites) to retrieve a structured list of all available test suites, that includes each suite's name, description, and associated tests:"
       ]
-     },
-     "execution_count": 2,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "import validmind as vm\n",
-    "\n",
-    "vm.test_suites.list_suites()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## View test suite details\n",
-    "\n",
-    "Use the [test_suites.describe_suite()](https://docs.validmind.ai/validmind/validmind/test_suites.html#describe_suite) function to retrieve information about a test suite, including its name, description, and the list of tests it contains. \n",
-    "\n",
-    "You can call `test_suites.describe_suite()` with just the test suite ID to get basic details, or pass an additional `verbose` parameter for a more comprehensive output: \n",
-    "\n",
-    "- **Test ID** - The identifier of the test suite you want to inspect.\n",
-    "- **Verbose** - A Boolean flag. Set `verbose=True` to return a full breakdown of the test suite."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 3,
-   "metadata": {},
-   "outputs": [
+    },
     {
-     "data": {
-      "text/html": [
-       "<style type=\"text/css\">\n",
-       "#T_7cb1b th {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "#T_7cb1b_row0_col0, #T_7cb1b_row0_col1, #T_7cb1b_row0_col2, #T_7cb1b_row0_col3, #T_7cb1b_row0_col4, #T_7cb1b_row1_col0, #T_7cb1b_row1_col1, #T_7cb1b_row1_col2, #T_7cb1b_row1_col3, #T_7cb1b_row1_col4, #T_7cb1b_row2_col0, #T_7cb1b_row2_col1, #T_7cb1b_row2_col2, #T_7cb1b_row2_col3, #T_7cb1b_row2_col4, #T_7cb1b_row3_col0, #T_7cb1b_row3_col1, #T_7cb1b_row3_col2, #T_7cb1b_row3_col3, #T_7cb1b_row3_col4, #T_7cb1b_row4_col0, #T_7cb1b_row4_col1, #T_7cb1b_row4_col2, #T_7cb1b_row4_col3, #T_7cb1b_row4_col4, #T_7cb1b_row5_col0, #T_7cb1b_row5_col1, #T_7cb1b_row5_col2, #T_7cb1b_row5_col3, #T_7cb1b_row5_col4, #T_7cb1b_row6_col0, #T_7cb1b_row6_col1, #T_7cb1b_row6_col2, #T_7cb1b_row6_col3, #T_7cb1b_row6_col4, #T_7cb1b_row7_col0, #T_7cb1b_row7_col1, #T_7cb1b_row7_col2, #T_7cb1b_row7_col3, #T_7cb1b_row7_col4, #T_7cb1b_row8_col0, #T_7cb1b_row8_col1, #T_7cb1b_row8_col2, #T_7cb1b_row8_col3, #T_7cb1b_row8_col4, #T_7cb1b_row9_col0, #T_7cb1b_row9_col1, #T_7cb1b_row9_col2, #T_7cb1b_row9_col3, #T_7cb1b_row9_col4, #T_7cb1b_row10_col0, #T_7cb1b_row10_col1, #T_7cb1b_row10_col2, #T_7cb1b_row10_col3, #T_7cb1b_row10_col4, #T_7cb1b_row11_col0, #T_7cb1b_row11_col1, #T_7cb1b_row11_col2, #T_7cb1b_row11_col3, #T_7cb1b_row11_col4, #T_7cb1b_row12_col0, #T_7cb1b_row12_col1, #T_7cb1b_row12_col2, #T_7cb1b_row12_col3, #T_7cb1b_row12_col4, #T_7cb1b_row13_col0, #T_7cb1b_row13_col1, #T_7cb1b_row13_col2, #T_7cb1b_row13_col3, #T_7cb1b_row13_col4, #T_7cb1b_row14_col0, #T_7cb1b_row14_col1, #T_7cb1b_row14_col2, #T_7cb1b_row14_col3, #T_7cb1b_row14_col4, #T_7cb1b_row15_col0, #T_7cb1b_row15_col1, #T_7cb1b_row15_col2, #T_7cb1b_row15_col3, #T_7cb1b_row15_col4, #T_7cb1b_row16_col0, #T_7cb1b_row16_col1, #T_7cb1b_row16_col2, #T_7cb1b_row16_col3, #T_7cb1b_row16_col4, #T_7cb1b_row17_col0, #T_7cb1b_row17_col1, #T_7cb1b_row17_col2, #T_7cb1b_row17_col3, #T_7cb1b_row17_col4, #T_7cb1b_row18_col0, #T_7cb1b_row18_col1, #T_7cb1b_row18_col2, #T_7cb1b_row18_col3, #T_7cb1b_row18_col4, #T_7cb1b_row19_col0, #T_7cb1b_row19_col1, 
#T_7cb1b_row19_col2, #T_7cb1b_row19_col3, #T_7cb1b_row19_col4, #T_7cb1b_row20_col0, #T_7cb1b_row20_col1, #T_7cb1b_row20_col2, #T_7cb1b_row20_col3, #T_7cb1b_row20_col4, #T_7cb1b_row21_col0, #T_7cb1b_row21_col1, #T_7cb1b_row21_col2, #T_7cb1b_row21_col3, #T_7cb1b_row21_col4, #T_7cb1b_row22_col0, #T_7cb1b_row22_col1, #T_7cb1b_row22_col2, #T_7cb1b_row22_col3, #T_7cb1b_row22_col4, #T_7cb1b_row23_col0, #T_7cb1b_row23_col1, #T_7cb1b_row23_col2, #T_7cb1b_row23_col3, #T_7cb1b_row23_col4, #T_7cb1b_row24_col0, #T_7cb1b_row24_col1, #T_7cb1b_row24_col2, #T_7cb1b_row24_col3, #T_7cb1b_row24_col4, #T_7cb1b_row25_col0, #T_7cb1b_row25_col1, #T_7cb1b_row25_col2, #T_7cb1b_row25_col3, #T_7cb1b_row25_col4, #T_7cb1b_row26_col0, #T_7cb1b_row26_col1, #T_7cb1b_row26_col2, #T_7cb1b_row26_col3, #T_7cb1b_row26_col4, #T_7cb1b_row27_col0, #T_7cb1b_row27_col1, #T_7cb1b_row27_col2, #T_7cb1b_row27_col3, #T_7cb1b_row27_col4 {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "</style>\n",
-       "<table id=\"T_7cb1b\">\n",
-       "  <thead>\n",
-       "    <tr>\n",
-       "      <th id=\"T_7cb1b_level0_col0\" class=\"col_heading level0 col0\" >Test Suite ID</th>\n",
-       "      <th id=\"T_7cb1b_level0_col1\" class=\"col_heading level0 col1\" >Test Suite Name</th>\n",
-       "      <th id=\"T_7cb1b_level0_col2\" class=\"col_heading level0 col2\" >Test Suite Section</th>\n",
-       "      <th id=\"T_7cb1b_level0_col3\" class=\"col_heading level0 col3\" >Test ID</th>\n",
-       "      <th id=\"T_7cb1b_level0_col4\" class=\"col_heading level0 col4\" >Test Name</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row0_col0\" class=\"data row0 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row0_col1\" class=\"data row0 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row0_col2\" class=\"data row0 col2\" >tabular_dataset_description</td>\n",
-       "      <td id=\"T_7cb1b_row0_col3\" class=\"data row0 col3\" >validmind.data_validation.DatasetDescription</td>\n",
-       "      <td id=\"T_7cb1b_row0_col4\" class=\"data row0 col4\" >Dataset Description</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row1_col0\" class=\"data row1 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row1_col1\" class=\"data row1 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row1_col2\" class=\"data row1 col2\" >tabular_dataset_description</td>\n",
-       "      <td id=\"T_7cb1b_row1_col3\" class=\"data row1 col3\" >validmind.data_validation.DescriptiveStatistics</td>\n",
-       "      <td id=\"T_7cb1b_row1_col4\" class=\"data row1 col4\" >Descriptive Statistics</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row2_col0\" class=\"data row2 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row2_col1\" class=\"data row2 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row2_col2\" class=\"data row2 col2\" >tabular_dataset_description</td>\n",
-       "      <td id=\"T_7cb1b_row2_col3\" class=\"data row2 col3\" >validmind.data_validation.PearsonCorrelationMatrix</td>\n",
-       "      <td id=\"T_7cb1b_row2_col4\" class=\"data row2 col4\" >Pearson Correlation Matrix</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row3_col0\" class=\"data row3 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row3_col1\" class=\"data row3 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row3_col2\" class=\"data row3 col2\" >tabular_data_quality</td>\n",
-       "      <td id=\"T_7cb1b_row3_col3\" class=\"data row3 col3\" >validmind.data_validation.ClassImbalance</td>\n",
-       "      <td id=\"T_7cb1b_row3_col4\" class=\"data row3 col4\" >Class Imbalance</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row4_col0\" class=\"data row4 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row4_col1\" class=\"data row4 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row4_col2\" class=\"data row4 col2\" >tabular_data_quality</td>\n",
-       "      <td id=\"T_7cb1b_row4_col3\" class=\"data row4 col3\" >validmind.data_validation.Duplicates</td>\n",
-       "      <td id=\"T_7cb1b_row4_col4\" class=\"data row4 col4\" >Duplicates</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row5_col0\" class=\"data row5 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row5_col1\" class=\"data row5 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row5_col2\" class=\"data row5 col2\" >tabular_data_quality</td>\n",
-       "      <td id=\"T_7cb1b_row5_col3\" class=\"data row5 col3\" >validmind.data_validation.HighCardinality</td>\n",
-       "      <td id=\"T_7cb1b_row5_col4\" class=\"data row5 col4\" >High Cardinality</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row6_col0\" class=\"data row6 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row6_col1\" class=\"data row6 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row6_col2\" class=\"data row6 col2\" >tabular_data_quality</td>\n",
-       "      <td id=\"T_7cb1b_row6_col3\" class=\"data row6 col3\" >validmind.data_validation.HighPearsonCorrelation</td>\n",
-       "      <td id=\"T_7cb1b_row6_col4\" class=\"data row6 col4\" >High Pearson Correlation</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row7_col0\" class=\"data row7 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row7_col1\" class=\"data row7 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row7_col2\" class=\"data row7 col2\" >tabular_data_quality</td>\n",
-       "      <td id=\"T_7cb1b_row7_col3\" class=\"data row7 col3\" >validmind.data_validation.MissingValues</td>\n",
-       "      <td id=\"T_7cb1b_row7_col4\" class=\"data row7 col4\" >Missing Values</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row8_col0\" class=\"data row8 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row8_col1\" class=\"data row8 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row8_col2\" class=\"data row8 col2\" >tabular_data_quality</td>\n",
-       "      <td id=\"T_7cb1b_row8_col3\" class=\"data row8 col3\" >validmind.data_validation.Skewness</td>\n",
-       "      <td id=\"T_7cb1b_row8_col4\" class=\"data row8 col4\" >Skewness</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row9_col0\" class=\"data row9 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row9_col1\" class=\"data row9 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row9_col2\" class=\"data row9 col2\" >tabular_data_quality</td>\n",
-       "      <td id=\"T_7cb1b_row9_col3\" class=\"data row9 col3\" >validmind.data_validation.UniqueRows</td>\n",
-       "      <td id=\"T_7cb1b_row9_col4\" class=\"data row9 col4\" >Unique Rows</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row10_col0\" class=\"data row10 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row10_col1\" class=\"data row10 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row10_col2\" class=\"data row10 col2\" >tabular_data_quality</td>\n",
-       "      <td id=\"T_7cb1b_row10_col3\" class=\"data row10 col3\" >validmind.data_validation.TooManyZeroValues</td>\n",
-       "      <td id=\"T_7cb1b_row10_col4\" class=\"data row10 col4\" >Too Many Zero Values</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row11_col0\" class=\"data row11 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row11_col1\" class=\"data row11 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row11_col2\" class=\"data row11 col2\" >classifier_metrics</td>\n",
-       "      <td id=\"T_7cb1b_row11_col3\" class=\"data row11 col3\" >validmind.model_validation.ModelMetadata</td>\n",
-       "      <td id=\"T_7cb1b_row11_col4\" class=\"data row11 col4\" >Model Metadata</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row12_col0\" class=\"data row12 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row12_col1\" class=\"data row12 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row12_col2\" class=\"data row12 col2\" >classifier_metrics</td>\n",
-       "      <td id=\"T_7cb1b_row12_col3\" class=\"data row12 col3\" >validmind.data_validation.DatasetSplit</td>\n",
-       "      <td id=\"T_7cb1b_row12_col4\" class=\"data row12 col4\" >Dataset Split</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row13_col0\" class=\"data row13 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row13_col1\" class=\"data row13 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row13_col2\" class=\"data row13 col2\" >classifier_metrics</td>\n",
-       "      <td id=\"T_7cb1b_row13_col3\" class=\"data row13 col3\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
-       "      <td id=\"T_7cb1b_row13_col4\" class=\"data row13 col4\" >Confusion Matrix</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row14_col0\" class=\"data row14 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row14_col1\" class=\"data row14 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row14_col2\" class=\"data row14 col2\" >classifier_metrics</td>\n",
-       "      <td id=\"T_7cb1b_row14_col3\" class=\"data row14 col3\" >validmind.model_validation.sklearn.ClassifierPerformance</td>\n",
-       "      <td id=\"T_7cb1b_row14_col4\" class=\"data row14 col4\" >Classifier Performance</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row15_col0\" class=\"data row15 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row15_col1\" class=\"data row15 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row15_col2\" class=\"data row15 col2\" >classifier_metrics</td>\n",
-       "      <td id=\"T_7cb1b_row15_col3\" class=\"data row15 col3\" >validmind.model_validation.sklearn.PermutationFeatureImportance</td>\n",
-       "      <td id=\"T_7cb1b_row15_col4\" class=\"data row15 col4\" >Permutation Feature Importance</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row16_col0\" class=\"data row16 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row16_col1\" class=\"data row16 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row16_col2\" class=\"data row16 col2\" >classifier_metrics</td>\n",
-       "      <td id=\"T_7cb1b_row16_col3\" class=\"data row16 col3\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
-       "      <td id=\"T_7cb1b_row16_col4\" class=\"data row16 col4\" >Precision Recall Curve</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row17_col0\" class=\"data row17 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row17_col1\" class=\"data row17 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row17_col2\" class=\"data row17 col2\" >classifier_metrics</td>\n",
-       "      <td id=\"T_7cb1b_row17_col3\" class=\"data row17 col3\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
-       "      <td id=\"T_7cb1b_row17_col4\" class=\"data row17 col4\" >ROC Curve</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row18_col0\" class=\"data row18 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row18_col1\" class=\"data row18 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row18_col2\" class=\"data row18 col2\" >classifier_metrics</td>\n",
-       "      <td id=\"T_7cb1b_row18_col3\" class=\"data row18 col3\" >validmind.model_validation.sklearn.PopulationStabilityIndex</td>\n",
-       "      <td id=\"T_7cb1b_row18_col4\" class=\"data row18 col4\" >Population Stability Index</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row19_col0\" class=\"data row19 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row19_col1\" class=\"data row19 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row19_col2\" class=\"data row19 col2\" >classifier_metrics</td>\n",
-       "      <td id=\"T_7cb1b_row19_col3\" class=\"data row19 col3\" >validmind.model_validation.sklearn.SHAPGlobalImportance</td>\n",
-       "      <td id=\"T_7cb1b_row19_col4\" class=\"data row19 col4\" >SHAP Global Importance</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row20_col0\" class=\"data row20 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row20_col1\" class=\"data row20 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row20_col2\" class=\"data row20 col2\" >classifier_validation</td>\n",
-       "      <td id=\"T_7cb1b_row20_col3\" class=\"data row20 col3\" >validmind.model_validation.sklearn.MinimumAccuracy</td>\n",
-       "      <td id=\"T_7cb1b_row20_col4\" class=\"data row20 col4\" >Minimum Accuracy</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row21_col0\" class=\"data row21 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row21_col1\" class=\"data row21 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row21_col2\" class=\"data row21 col2\" >classifier_validation</td>\n",
-       "      <td id=\"T_7cb1b_row21_col3\" class=\"data row21 col3\" >validmind.model_validation.sklearn.MinimumF1Score</td>\n",
-       "      <td id=\"T_7cb1b_row21_col4\" class=\"data row21 col4\" >Minimum F1 Score</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row22_col0\" class=\"data row22 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row22_col1\" class=\"data row22 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row22_col2\" class=\"data row22 col2\" >classifier_validation</td>\n",
-       "      <td id=\"T_7cb1b_row22_col3\" class=\"data row22 col3\" >validmind.model_validation.sklearn.MinimumROCAUCScore</td>\n",
-       "      <td id=\"T_7cb1b_row22_col4\" class=\"data row22 col4\" >Minimum ROCAUC Score</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row23_col0\" class=\"data row23 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row23_col1\" class=\"data row23 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row23_col2\" class=\"data row23 col2\" >classifier_validation</td>\n",
-       "      <td id=\"T_7cb1b_row23_col3\" class=\"data row23 col3\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
-       "      <td id=\"T_7cb1b_row23_col4\" class=\"data row23 col4\" >Training Test Degradation</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row24_col0\" class=\"data row24 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row24_col1\" class=\"data row24 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row24_col2\" class=\"data row24 col2\" >classifier_validation</td>\n",
-       "      <td id=\"T_7cb1b_row24_col3\" class=\"data row24 col3\" >validmind.model_validation.sklearn.ModelsPerformanceComparison</td>\n",
-       "      <td id=\"T_7cb1b_row24_col4\" class=\"data row24 col4\" >Models Performance Comparison</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row25_col0\" class=\"data row25 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row25_col1\" class=\"data row25 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row25_col2\" class=\"data row25 col2\" >classifier_model_diagnosis</td>\n",
-       "      <td id=\"T_7cb1b_row25_col3\" class=\"data row25 col3\" >validmind.model_validation.sklearn.OverfitDiagnosis</td>\n",
-       "      <td id=\"T_7cb1b_row25_col4\" class=\"data row25 col4\" >Overfit Diagnosis</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row26_col0\" class=\"data row26 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row26_col1\" class=\"data row26 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row26_col2\" class=\"data row26 col2\" >classifier_model_diagnosis</td>\n",
-       "      <td id=\"T_7cb1b_row26_col3\" class=\"data row26 col3\" >validmind.model_validation.sklearn.WeakspotsDiagnosis</td>\n",
-       "      <td id=\"T_7cb1b_row26_col4\" class=\"data row26 col4\" >Weakspots Diagnosis</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_7cb1b_row27_col0\" class=\"data row27 col0\" >classifier_full_suite</td>\n",
-       "      <td id=\"T_7cb1b_row27_col1\" class=\"data row27 col1\" >ClassifierFullSuite</td>\n",
-       "      <td id=\"T_7cb1b_row27_col2\" class=\"data row27 col2\" >classifier_model_diagnosis</td>\n",
-       "      <td id=\"T_7cb1b_row27_col3\" class=\"data row27 col3\" >validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
-       "      <td id=\"T_7cb1b_row27_col4\" class=\"data row27 col4\" >Robustness Diagnosis</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n"
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import validmind as vm\n",
+        "\n",
+        "vm.test_suites.list_suites()"
       ],
-      "text/plain": [
-       "<pandas.io.formats.style.Styler at 0x16a167fa0>"
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "execute_result",
+          "data": {
+            "text/html": [
+              "<style type=\"text/css\">\n",
+              "#T_9e889 th {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "#T_9e889_row0_col0, #T_9e889_row0_col1, #T_9e889_row0_col2, #T_9e889_row0_col3, #T_9e889_row1_col0, #T_9e889_row1_col1, #T_9e889_row1_col2, #T_9e889_row1_col3, #T_9e889_row2_col0, #T_9e889_row2_col1, #T_9e889_row2_col2, #T_9e889_row2_col3, #T_9e889_row3_col0, #T_9e889_row3_col1, #T_9e889_row3_col2, #T_9e889_row3_col3, #T_9e889_row4_col0, #T_9e889_row4_col1, #T_9e889_row4_col2, #T_9e889_row4_col3, #T_9e889_row5_col0, #T_9e889_row5_col1, #T_9e889_row5_col2, #T_9e889_row5_col3, #T_9e889_row6_col0, #T_9e889_row6_col1, #T_9e889_row6_col2, #T_9e889_row6_col3, #T_9e889_row7_col0, #T_9e889_row7_col1, #T_9e889_row7_col2, #T_9e889_row7_col3, #T_9e889_row8_col0, #T_9e889_row8_col1, #T_9e889_row8_col2, #T_9e889_row8_col3, #T_9e889_row9_col0, #T_9e889_row9_col1, #T_9e889_row9_col2, #T_9e889_row9_col3, #T_9e889_row10_col0, #T_9e889_row10_col1, #T_9e889_row10_col2, #T_9e889_row10_col3, #T_9e889_row11_col0, #T_9e889_row11_col1, #T_9e889_row11_col2, #T_9e889_row11_col3, #T_9e889_row12_col0, #T_9e889_row12_col1, #T_9e889_row12_col2, #T_9e889_row12_col3, #T_9e889_row13_col0, #T_9e889_row13_col1, #T_9e889_row13_col2, #T_9e889_row13_col3, #T_9e889_row14_col0, #T_9e889_row14_col1, #T_9e889_row14_col2, #T_9e889_row14_col3, #T_9e889_row15_col0, #T_9e889_row15_col1, #T_9e889_row15_col2, #T_9e889_row15_col3, #T_9e889_row16_col0, #T_9e889_row16_col1, #T_9e889_row16_col2, #T_9e889_row16_col3, #T_9e889_row17_col0, #T_9e889_row17_col1, #T_9e889_row17_col2, #T_9e889_row17_col3, #T_9e889_row18_col0, #T_9e889_row18_col1, #T_9e889_row18_col2, #T_9e889_row18_col3, #T_9e889_row19_col0, #T_9e889_row19_col1, #T_9e889_row19_col2, #T_9e889_row19_col3, #T_9e889_row20_col0, #T_9e889_row20_col1, #T_9e889_row20_col2, #T_9e889_row20_col3, #T_9e889_row21_col0, #T_9e889_row21_col1, #T_9e889_row21_col2, #T_9e889_row21_col3, #T_9e889_row22_col0, #T_9e889_row22_col1, #T_9e889_row22_col2, #T_9e889_row22_col3, #T_9e889_row23_col0, #T_9e889_row23_col1, #T_9e889_row23_col2, #T_9e889_row23_col3, 
#T_9e889_row24_col0, #T_9e889_row24_col1, #T_9e889_row24_col2, #T_9e889_row24_col3, #T_9e889_row25_col0, #T_9e889_row25_col1, #T_9e889_row25_col2, #T_9e889_row25_col3, #T_9e889_row26_col0, #T_9e889_row26_col1, #T_9e889_row26_col2, #T_9e889_row26_col3, #T_9e889_row27_col0, #T_9e889_row27_col1, #T_9e889_row27_col2, #T_9e889_row27_col3, #T_9e889_row28_col0, #T_9e889_row28_col1, #T_9e889_row28_col2, #T_9e889_row28_col3, #T_9e889_row29_col0, #T_9e889_row29_col1, #T_9e889_row29_col2, #T_9e889_row29_col3 {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "</style>\n",
+              "<table id=\"T_9e889\">\n",
+              "  <thead>\n",
+              "    <tr>\n",
+              "      <th id=\"T_9e889_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
+              "      <th id=\"T_9e889_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
+              "      <th id=\"T_9e889_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
+              "      <th id=\"T_9e889_level0_col3\" class=\"col_heading level0 col3\" >Tests</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row0_col0\" class=\"data row0 col0\" >classifier_model_diagnosis</td>\n",
+              "      <td id=\"T_9e889_row0_col1\" class=\"data row0 col1\" >ClassifierDiagnosis</td>\n",
+              "      <td id=\"T_9e889_row0_col2\" class=\"data row0 col2\" >Test suite for sklearn classifier model diagnosis tests</td>\n",
+              "      <td id=\"T_9e889_row0_col3\" class=\"data row0 col3\" >validmind.model_validation.sklearn.OverfitDiagnosis, validmind.model_validation.sklearn.WeakspotsDiagnosis, validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row1_col0\" class=\"data row1 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_9e889_row1_col1\" class=\"data row1 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_9e889_row1_col2\" class=\"data row1 col2\" >Full test suite for binary classification models.</td>\n",
+              "      <td id=\"T_9e889_row1_col3\" class=\"data row1 col3\" >validmind.data_validation.DatasetDescription, validmind.data_validation.DescriptiveStatistics, validmind.data_validation.PearsonCorrelationMatrix, validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.HighCardinality, validmind.data_validation.HighPearsonCorrelation, validmind.data_validation.MissingValues, validmind.data_validation.Skewness, validmind.data_validation.UniqueRows, validmind.data_validation.TooManyZeroValues, validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.ConfusionMatrix, validmind.model_validation.sklearn.ClassifierPerformance, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.PrecisionRecallCurve, validmind.model_validation.sklearn.ROCCurve, validmind.model_validation.sklearn.PopulationStabilityIndex, validmind.model_validation.sklearn.SHAPGlobalImportance, validmind.model_validation.sklearn.MinimumAccuracy, validmind.model_validation.sklearn.MinimumF1Score, validmind.model_validation.sklearn.MinimumROCAUCScore, validmind.model_validation.sklearn.TrainingTestDegradation, validmind.model_validation.sklearn.ModelsPerformanceComparison, validmind.model_validation.sklearn.OverfitDiagnosis, validmind.model_validation.sklearn.WeakspotsDiagnosis, validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row2_col0\" class=\"data row2 col0\" >classifier_metrics</td>\n",
+              "      <td id=\"T_9e889_row2_col1\" class=\"data row2 col1\" >ClassifierMetrics</td>\n",
+              "      <td id=\"T_9e889_row2_col2\" class=\"data row2 col2\" >Test suite for sklearn classifier metrics</td>\n",
+              "      <td id=\"T_9e889_row2_col3\" class=\"data row2 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.ConfusionMatrix, validmind.model_validation.sklearn.ClassifierPerformance, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.PrecisionRecallCurve, validmind.model_validation.sklearn.ROCCurve, validmind.model_validation.sklearn.PopulationStabilityIndex, validmind.model_validation.sklearn.SHAPGlobalImportance</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row3_col0\" class=\"data row3 col0\" >classifier_model_validation</td>\n",
+              "      <td id=\"T_9e889_row3_col1\" class=\"data row3 col1\" >ClassifierModelValidation</td>\n",
+              "      <td id=\"T_9e889_row3_col2\" class=\"data row3 col2\" >Test suite for binary classification models.</td>\n",
+              "      <td id=\"T_9e889_row3_col3\" class=\"data row3 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.ConfusionMatrix, validmind.model_validation.sklearn.ClassifierPerformance, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.PrecisionRecallCurve, validmind.model_validation.sklearn.ROCCurve, validmind.model_validation.sklearn.PopulationStabilityIndex, validmind.model_validation.sklearn.SHAPGlobalImportance, validmind.model_validation.sklearn.MinimumAccuracy, validmind.model_validation.sklearn.MinimumF1Score, validmind.model_validation.sklearn.MinimumROCAUCScore, validmind.model_validation.sklearn.TrainingTestDegradation, validmind.model_validation.sklearn.ModelsPerformanceComparison, validmind.model_validation.sklearn.OverfitDiagnosis, validmind.model_validation.sklearn.WeakspotsDiagnosis, validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row4_col0\" class=\"data row4 col0\" >classifier_validation</td>\n",
+              "      <td id=\"T_9e889_row4_col1\" class=\"data row4 col1\" >ClassifierPerformance</td>\n",
+              "      <td id=\"T_9e889_row4_col2\" class=\"data row4 col2\" >Test suite for sklearn classifier models</td>\n",
+              "      <td id=\"T_9e889_row4_col3\" class=\"data row4 col3\" >validmind.model_validation.sklearn.MinimumAccuracy, validmind.model_validation.sklearn.MinimumF1Score, validmind.model_validation.sklearn.MinimumROCAUCScore, validmind.model_validation.sklearn.TrainingTestDegradation, validmind.model_validation.sklearn.ModelsPerformanceComparison</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row5_col0\" class=\"data row5 col0\" >cluster_full_suite</td>\n",
+              "      <td id=\"T_9e889_row5_col1\" class=\"data row5 col1\" >ClusterFullSuite</td>\n",
+              "      <td id=\"T_9e889_row5_col2\" class=\"data row5 col2\" >Full test suite for clustering models.</td>\n",
+              "      <td id=\"T_9e889_row5_col3\" class=\"data row5 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.HomogeneityScore, validmind.model_validation.sklearn.CompletenessScore, validmind.model_validation.sklearn.VMeasure, validmind.model_validation.sklearn.AdjustedRandIndex, validmind.model_validation.sklearn.AdjustedMutualInformation, validmind.model_validation.sklearn.FowlkesMallowsScore, validmind.model_validation.sklearn.ClusterPerformanceMetrics, validmind.model_validation.sklearn.ClusterCosineSimilarity, validmind.model_validation.sklearn.SilhouettePlot, validmind.model_validation.ClusterSizeDistribution, validmind.model_validation.sklearn.HyperParametersTuning, validmind.model_validation.sklearn.KMeansClustersOptimization</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row6_col0\" class=\"data row6 col0\" >cluster_metrics</td>\n",
+              "      <td id=\"T_9e889_row6_col1\" class=\"data row6 col1\" >ClusterMetrics</td>\n",
+              "      <td id=\"T_9e889_row6_col2\" class=\"data row6 col2\" >Test suite for sklearn clustering metrics</td>\n",
+              "      <td id=\"T_9e889_row6_col3\" class=\"data row6 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.HomogeneityScore, validmind.model_validation.sklearn.CompletenessScore, validmind.model_validation.sklearn.VMeasure, validmind.model_validation.sklearn.AdjustedRandIndex, validmind.model_validation.sklearn.AdjustedMutualInformation, validmind.model_validation.sklearn.FowlkesMallowsScore, validmind.model_validation.sklearn.ClusterPerformanceMetrics, validmind.model_validation.sklearn.ClusterCosineSimilarity, validmind.model_validation.sklearn.SilhouettePlot</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row7_col0\" class=\"data row7 col0\" >cluster_performance</td>\n",
+              "      <td id=\"T_9e889_row7_col1\" class=\"data row7 col1\" >ClusterPerformance</td>\n",
+              "      <td id=\"T_9e889_row7_col2\" class=\"data row7 col2\" >Test suite for sklearn cluster performance</td>\n",
+              "      <td id=\"T_9e889_row7_col3\" class=\"data row7 col3\" >validmind.model_validation.ClusterSizeDistribution</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row8_col0\" class=\"data row8 col0\" >embeddings_full_suite</td>\n",
+              "      <td id=\"T_9e889_row8_col1\" class=\"data row8 col1\" >EmbeddingsFullSuite</td>\n",
+              "      <td id=\"T_9e889_row8_col2\" class=\"data row8 col2\" >Full test suite for embeddings models.</td>\n",
+              "      <td id=\"T_9e889_row8_col3\" class=\"data row8 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.embeddings.DescriptiveAnalytics, validmind.model_validation.embeddings.CosineSimilarityDistribution, validmind.model_validation.embeddings.ClusterDistribution, validmind.model_validation.embeddings.EmbeddingsVisualization2D, validmind.model_validation.embeddings.StabilityAnalysisRandomNoise, validmind.model_validation.embeddings.StabilityAnalysisSynonyms, validmind.model_validation.embeddings.StabilityAnalysisKeyword, validmind.model_validation.embeddings.StabilityAnalysisTranslation</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row9_col0\" class=\"data row9 col0\" >embeddings_metrics</td>\n",
+              "      <td id=\"T_9e889_row9_col1\" class=\"data row9 col1\" >EmbeddingsMetrics</td>\n",
+              "      <td id=\"T_9e889_row9_col2\" class=\"data row9 col2\" >Test suite for embeddings metrics</td>\n",
+              "      <td id=\"T_9e889_row9_col3\" class=\"data row9 col3\" >validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.embeddings.DescriptiveAnalytics, validmind.model_validation.embeddings.CosineSimilarityDistribution, validmind.model_validation.embeddings.ClusterDistribution, validmind.model_validation.embeddings.EmbeddingsVisualization2D</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row10_col0\" class=\"data row10 col0\" >embeddings_model_performance</td>\n",
+              "      <td id=\"T_9e889_row10_col1\" class=\"data row10 col1\" >EmbeddingsPerformance</td>\n",
+              "      <td id=\"T_9e889_row10_col2\" class=\"data row10 col2\" >Test suite for embeddings model performance</td>\n",
+              "      <td id=\"T_9e889_row10_col3\" class=\"data row10 col3\" >validmind.model_validation.embeddings.StabilityAnalysisRandomNoise, validmind.model_validation.embeddings.StabilityAnalysisSynonyms, validmind.model_validation.embeddings.StabilityAnalysisKeyword, validmind.model_validation.embeddings.StabilityAnalysisTranslation</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row11_col0\" class=\"data row11 col0\" >hyper_parameters_optimization</td>\n",
+              "      <td id=\"T_9e889_row11_col1\" class=\"data row11 col1\" >KmeansParametersOptimization</td>\n",
+              "      <td id=\"T_9e889_row11_col2\" class=\"data row11 col2\" >Test suite for sklearn hyperparameters optimization</td>\n",
+              "      <td id=\"T_9e889_row11_col3\" class=\"data row11 col3\" >validmind.model_validation.sklearn.HyperParametersTuning, validmind.model_validation.sklearn.KMeansClustersOptimization</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row12_col0\" class=\"data row12 col0\" >llm_classifier_full_suite</td>\n",
+              "      <td id=\"T_9e889_row12_col1\" class=\"data row12 col1\" >LLMClassifierFullSuite</td>\n",
+              "      <td id=\"T_9e889_row12_col2\" class=\"data row12 col2\" >Full test suite for LLM classification models.</td>\n",
+              "      <td id=\"T_9e889_row12_col3\" class=\"data row12 col3\" >validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.nlp.StopWords, validmind.data_validation.nlp.Punctuations, validmind.data_validation.nlp.CommonWords, validmind.data_validation.nlp.TextDescription, validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.ConfusionMatrix, validmind.model_validation.sklearn.ClassifierPerformance, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.PrecisionRecallCurve, validmind.model_validation.sklearn.ROCCurve, validmind.model_validation.sklearn.PopulationStabilityIndex, validmind.model_validation.sklearn.SHAPGlobalImportance, validmind.model_validation.sklearn.MinimumAccuracy, validmind.model_validation.sklearn.MinimumF1Score, validmind.model_validation.sklearn.MinimumROCAUCScore, validmind.model_validation.sklearn.TrainingTestDegradation, validmind.model_validation.sklearn.ModelsPerformanceComparison, validmind.model_validation.sklearn.OverfitDiagnosis, validmind.model_validation.sklearn.WeakspotsDiagnosis, validmind.model_validation.sklearn.RobustnessDiagnosis, validmind.prompt_validation.Bias, validmind.prompt_validation.Clarity, validmind.prompt_validation.Conciseness, validmind.prompt_validation.Delimitation, validmind.prompt_validation.NegativeInstruction, validmind.prompt_validation.Robustness, validmind.prompt_validation.Specificity</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row13_col0\" class=\"data row13 col0\" >prompt_validation</td>\n",
+              "      <td id=\"T_9e889_row13_col1\" class=\"data row13 col1\" >PromptValidation</td>\n",
+              "      <td id=\"T_9e889_row13_col2\" class=\"data row13 col2\" >Test suite for prompt validation</td>\n",
+              "      <td id=\"T_9e889_row13_col3\" class=\"data row13 col3\" >validmind.prompt_validation.Bias, validmind.prompt_validation.Clarity, validmind.prompt_validation.Conciseness, validmind.prompt_validation.Delimitation, validmind.prompt_validation.NegativeInstruction, validmind.prompt_validation.Robustness, validmind.prompt_validation.Specificity</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row14_col0\" class=\"data row14 col0\" >nlp_classifier_full_suite</td>\n",
+              "      <td id=\"T_9e889_row14_col1\" class=\"data row14 col1\" >NLPClassifierFullSuite</td>\n",
+              "      <td id=\"T_9e889_row14_col2\" class=\"data row14 col2\" >Full test suite for NLP classification models.</td>\n",
+              "      <td id=\"T_9e889_row14_col3\" class=\"data row14 col3\" >validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.nlp.StopWords, validmind.data_validation.nlp.Punctuations, validmind.data_validation.nlp.CommonWords, validmind.data_validation.nlp.TextDescription, validmind.model_validation.ModelMetadata, validmind.data_validation.DatasetSplit, validmind.model_validation.sklearn.ConfusionMatrix, validmind.model_validation.sklearn.ClassifierPerformance, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.PrecisionRecallCurve, validmind.model_validation.sklearn.ROCCurve, validmind.model_validation.sklearn.PopulationStabilityIndex, validmind.model_validation.sklearn.SHAPGlobalImportance, validmind.model_validation.sklearn.MinimumAccuracy, validmind.model_validation.sklearn.MinimumF1Score, validmind.model_validation.sklearn.MinimumROCAUCScore, validmind.model_validation.sklearn.TrainingTestDegradation, validmind.model_validation.sklearn.ModelsPerformanceComparison, validmind.model_validation.sklearn.OverfitDiagnosis, validmind.model_validation.sklearn.WeakspotsDiagnosis, validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row15_col0\" class=\"data row15 col0\" >regression_metrics</td>\n",
+              "      <td id=\"T_9e889_row15_col1\" class=\"data row15 col1\" >RegressionMetrics</td>\n",
+              "      <td id=\"T_9e889_row15_col2\" class=\"data row15 col2\" >Test suite for performance metrics of regression metrics</td>\n",
+              "      <td id=\"T_9e889_row15_col3\" class=\"data row15 col3\" >validmind.data_validation.DatasetSplit, validmind.model_validation.ModelMetadata, validmind.model_validation.sklearn.PermutationFeatureImportance</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row16_col0\" class=\"data row16 col0\" >regression_model_description</td>\n",
+              "      <td id=\"T_9e889_row16_col1\" class=\"data row16 col1\" >RegressionModelDescription</td>\n",
+              "      <td id=\"T_9e889_row16_col2\" class=\"data row16 col2\" >Test suite for performance metric of regression model of statsmodels library</td>\n",
+              "      <td id=\"T_9e889_row16_col3\" class=\"data row16 col3\" >validmind.data_validation.DatasetSplit, validmind.model_validation.ModelMetadata</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row17_col0\" class=\"data row17 col0\" >regression_models_evaluation</td>\n",
+              "      <td id=\"T_9e889_row17_col1\" class=\"data row17 col1\" >RegressionModelsEvaluation</td>\n",
+              "      <td id=\"T_9e889_row17_col2\" class=\"data row17 col2\" >Test suite for metrics comparison of regression model of statsmodels library</td>\n",
+              "      <td id=\"T_9e889_row17_col3\" class=\"data row17 col3\" >validmind.model_validation.statsmodels.RegressionModelCoeffs, validmind.model_validation.sklearn.RegressionModelsPerformanceComparison</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row18_col0\" class=\"data row18 col0\" >regression_full_suite</td>\n",
+              "      <td id=\"T_9e889_row18_col1\" class=\"data row18 col1\" >RegressionFullSuite</td>\n",
+              "      <td id=\"T_9e889_row18_col2\" class=\"data row18 col2\" >Full test suite for regression models.</td>\n",
+              "      <td id=\"T_9e889_row18_col3\" class=\"data row18 col3\" >validmind.data_validation.DatasetDescription, validmind.data_validation.DescriptiveStatistics, validmind.data_validation.PearsonCorrelationMatrix, validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.HighCardinality, validmind.data_validation.HighPearsonCorrelation, validmind.data_validation.MissingValues, validmind.data_validation.Skewness, validmind.data_validation.UniqueRows, validmind.data_validation.TooManyZeroValues, validmind.data_validation.DatasetSplit, validmind.model_validation.ModelMetadata, validmind.model_validation.sklearn.PermutationFeatureImportance, validmind.model_validation.sklearn.RegressionErrors, validmind.model_validation.sklearn.RegressionR2Square</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row19_col0\" class=\"data row19 col0\" >regression_performance</td>\n",
+              "      <td id=\"T_9e889_row19_col1\" class=\"data row19 col1\" >RegressionPerformance</td>\n",
+              "      <td id=\"T_9e889_row19_col2\" class=\"data row19 col2\" >Test suite for regression model performance</td>\n",
+              "      <td id=\"T_9e889_row19_col3\" class=\"data row19 col3\" >validmind.model_validation.sklearn.RegressionErrors, validmind.model_validation.sklearn.RegressionR2Square</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row20_col0\" class=\"data row20 col0\" >summarization_metrics</td>\n",
+              "      <td id=\"T_9e889_row20_col1\" class=\"data row20 col1\" >SummarizationMetrics</td>\n",
+              "      <td id=\"T_9e889_row20_col2\" class=\"data row20 col2\" >Test suite for Summarization metrics</td>\n",
+              "      <td id=\"T_9e889_row20_col3\" class=\"data row20 col3\" >validmind.model_validation.TokenDisparity, validmind.model_validation.BleuScore, validmind.model_validation.BertScore, validmind.model_validation.ContextualRecall</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row21_col0\" class=\"data row21 col0\" >tabular_dataset</td>\n",
+              "      <td id=\"T_9e889_row21_col1\" class=\"data row21 col1\" >TabularDataset</td>\n",
+              "      <td id=\"T_9e889_row21_col2\" class=\"data row21 col2\" >Test suite for tabular datasets.</td>\n",
+              "      <td id=\"T_9e889_row21_col3\" class=\"data row21 col3\" >validmind.data_validation.DatasetDescription, validmind.data_validation.DescriptiveStatistics, validmind.data_validation.PearsonCorrelationMatrix, validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.HighCardinality, validmind.data_validation.HighPearsonCorrelation, validmind.data_validation.MissingValues, validmind.data_validation.Skewness, validmind.data_validation.UniqueRows, validmind.data_validation.TooManyZeroValues</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row22_col0\" class=\"data row22 col0\" >tabular_dataset_description</td>\n",
+              "      <td id=\"T_9e889_row22_col1\" class=\"data row22 col1\" >TabularDatasetDescription</td>\n",
+              "      <td id=\"T_9e889_row22_col2\" class=\"data row22 col2\" >Test suite to extract metadata and descriptive\n",
+              "statistics from a tabular dataset</td>\n",
+              "      <td id=\"T_9e889_row22_col3\" class=\"data row22 col3\" >validmind.data_validation.DatasetDescription, validmind.data_validation.DescriptiveStatistics, validmind.data_validation.PearsonCorrelationMatrix</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row23_col0\" class=\"data row23 col0\" >tabular_data_quality</td>\n",
+              "      <td id=\"T_9e889_row23_col1\" class=\"data row23 col1\" >TabularDataQuality</td>\n",
+              "      <td id=\"T_9e889_row23_col2\" class=\"data row23 col2\" >Test suite for data quality on tabular datasets</td>\n",
+              "      <td id=\"T_9e889_row23_col3\" class=\"data row23 col3\" >validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.HighCardinality, validmind.data_validation.HighPearsonCorrelation, validmind.data_validation.MissingValues, validmind.data_validation.Skewness, validmind.data_validation.UniqueRows, validmind.data_validation.TooManyZeroValues</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row24_col0\" class=\"data row24 col0\" >text_data_quality</td>\n",
+              "      <td id=\"T_9e889_row24_col1\" class=\"data row24 col1\" >TextDataQuality</td>\n",
+              "      <td id=\"T_9e889_row24_col2\" class=\"data row24 col2\" >Test suite for data quality on text data</td>\n",
+              "      <td id=\"T_9e889_row24_col3\" class=\"data row24 col3\" >validmind.data_validation.ClassImbalance, validmind.data_validation.Duplicates, validmind.data_validation.nlp.StopWords, validmind.data_validation.nlp.Punctuations, validmind.data_validation.nlp.CommonWords, validmind.data_validation.nlp.TextDescription</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row25_col0\" class=\"data row25 col0\" >time_series_data_quality</td>\n",
+              "      <td id=\"T_9e889_row25_col1\" class=\"data row25 col1\" >TimeSeriesDataQuality</td>\n",
+              "      <td id=\"T_9e889_row25_col2\" class=\"data row25 col2\" >Test suite for data quality on time series datasets</td>\n",
+              "      <td id=\"T_9e889_row25_col3\" class=\"data row25 col3\" >validmind.data_validation.TimeSeriesOutliers, validmind.data_validation.TimeSeriesMissingValues, validmind.data_validation.TimeSeriesFrequency</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row26_col0\" class=\"data row26 col0\" >time_series_dataset</td>\n",
+              "      <td id=\"T_9e889_row26_col1\" class=\"data row26 col1\" >TimeSeriesDataset</td>\n",
+              "      <td id=\"T_9e889_row26_col2\" class=\"data row26 col2\" >Test suite for time series datasets.</td>\n",
+              "      <td id=\"T_9e889_row26_col3\" class=\"data row26 col3\" >validmind.data_validation.TimeSeriesOutliers, validmind.data_validation.TimeSeriesMissingValues, validmind.data_validation.TimeSeriesFrequency, validmind.data_validation.TimeSeriesLinePlot, validmind.data_validation.TimeSeriesHistogram, validmind.data_validation.ACFandPACFPlot, validmind.data_validation.SeasonalDecompose, validmind.data_validation.AutoSeasonality, validmind.data_validation.AutoStationarity, validmind.data_validation.RollingStatsPlot, validmind.data_validation.AutoAR, validmind.data_validation.AutoMA, validmind.data_validation.ScatterPlot, validmind.data_validation.LaggedCorrelationHeatmap, validmind.data_validation.EngleGrangerCoint, validmind.data_validation.SpreadPlot</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row27_col0\" class=\"data row27 col0\" >time_series_model_validation</td>\n",
+              "      <td id=\"T_9e889_row27_col1\" class=\"data row27 col1\" >TimeSeriesModelValidation</td>\n",
+              "      <td id=\"T_9e889_row27_col2\" class=\"data row27 col2\" >Test suite for time series model validation.</td>\n",
+              "      <td id=\"T_9e889_row27_col3\" class=\"data row27 col3\" >validmind.data_validation.DatasetSplit, validmind.model_validation.ModelMetadata, validmind.model_validation.statsmodels.RegressionModelCoeffs, validmind.model_validation.sklearn.RegressionModelsPerformanceComparison</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row28_col0\" class=\"data row28 col0\" >time_series_multivariate</td>\n",
+              "      <td id=\"T_9e889_row28_col1\" class=\"data row28 col1\" >TimeSeriesMultivariate</td>\n",
+              "      <td id=\"T_9e889_row28_col2\" class=\"data row28 col2\" >This test suite provides a preliminary understanding of the features\n",
+              "and relationship in multivariate dataset. It presents various\n",
+              "multivariate visualizations that can help identify patterns, trends,\n",
+              "and relationships between pairs of variables. The visualizations are\n",
+              "designed to explore the relationships between multiple features\n",
+              "simultaneously. They allow you to quickly identify any patterns or\n",
+              "trends in the data, as well as any potential outliers or anomalies.\n",
+              "The individual feature distribution can also be explored to provide\n",
+              "insight into the range and frequency of values observed in the data.\n",
+              "This multivariate analysis test suite aims to provide an overview of\n",
+              "the data structure and guide further exploration and modeling.</td>\n",
+              "      <td id=\"T_9e889_row28_col3\" class=\"data row28 col3\" >validmind.data_validation.ScatterPlot, validmind.data_validation.LaggedCorrelationHeatmap, validmind.data_validation.EngleGrangerCoint, validmind.data_validation.SpreadPlot</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_9e889_row29_col0\" class=\"data row29 col0\" >time_series_univariate</td>\n",
+              "      <td id=\"T_9e889_row29_col1\" class=\"data row29 col1\" >TimeSeriesUnivariate</td>\n",
+              "      <td id=\"T_9e889_row29_col2\" class=\"data row29 col2\" >This test suite provides a preliminary understanding of the target variable(s)\n",
+              "used in the time series dataset. It provides visualizations that present the raw time\n",
+              "series data and a histogram of the target variable(s).\n",
+              "\n",
+              "The raw time series data provides a visual inspection of the target variable's\n",
+              "behavior over time. This helps to identify any patterns or trends in the data,\n",
+              "as well as any potential outliers or anomalies. The histogram of the target\n",
+              "variable displays the distribution of values, providing insight into the range\n",
+              "and frequency of values observed in the data.</td>\n",
+              "      <td id=\"T_9e889_row29_col3\" class=\"data row29 col3\" >validmind.data_validation.TimeSeriesLinePlot, validmind.data_validation.TimeSeriesHistogram, validmind.data_validation.ACFandPACFPlot, validmind.data_validation.SeasonalDecompose, validmind.data_validation.AutoSeasonality, validmind.data_validation.AutoStationarity, validmind.data_validation.RollingStatsPlot, validmind.data_validation.AutoAR, validmind.data_validation.AutoMA</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n"
+            ],
+            "text/plain": [
+              "<pandas.io.formats.style.Styler at 0x16a11ae00>"
+            ]
+          }
+        }
       ]
-     },
-     "execution_count": 3,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "vm.test_suites.describe_suite(\"classifier_full_suite\", verbose=True)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### View test details\n",
-    "\n",
-    "To inspect a specific test in a suite, pass the name of the test to [tests.describe_test()](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) to get detailed information about the test such as its purpose, strengths and limitations:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 4,
-   "metadata": {},
-   "outputs": [
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## View test suite details\n",
+        "\n",
+        "Use the [test_suites.describe_suite()](https://docs.validmind.ai/validmind/validmind/test_suites.html#describe_suite) function to retrieve information about a test suite, including its name, description, and the list of tests it contains. \n",
+        "\n",
+        "You can call `test_suites.describe_suite()` with just the test suite ID to get basic details, or pass an additional `verbose` parameter for a more comprehensive output: \n",
+        "\n",
+        "- **Test suite ID** - The identifier of the test suite you want to inspect.\n",
+        "- **Verbose** - A Boolean flag. Set `verbose=True` to return a full breakdown of the test suite."
+      ]
+    },
     {
-     "data": {
-      "text/html": [
-       "\n",
-       "        <div class=\"vm-accordion\" id=\"accordion-c38a3af7\">\n",
-       "            \n",
-       "            <div class=\"vm-accordion-item\">\n",
-       "                <div class=\"vm-accordion-header\"\n",
-       "                     onclick=\"toggleAccordionItem('accordion-c38a3af7-item-0')\"\n",
-       "                     style=\"cursor: pointer; padding: 10px; background-color: #f8f9fa; border: 1px solid #dee2e6; font-weight: bold;\">\n",
-       "                    <span class=\"vm-accordion-toggle\" id=\"accordion-c38a3af7-item-0-toggle\">▶</span>\n",
-       "                    Test: Descriptive Statistics ('validmind.data_validation.DescriptiveStatistics')\n",
-       "                </div>\n",
-       "                <div class=\"vm-accordion-content\"\n",
-       "                     id=\"accordion-c38a3af7-item-0\"\n",
-       "                     style=\"display: none; padding: 15px; border: 1px solid #dee2e6; border-top: none;\">\n",
-       "                    \n",
-       "<div>\n",
-       "  <h2>Descriptive Statistics</h2>\n",
-       "  <div style=\"border: 1px solid #ddd; border-radius: 4px; padding: 10px; margin: 10px 0;\">\n",
-       "    <p>Performs a detailed descriptive statistical analysis of both numerical and categorical data within a model's\n",
-       "dataset.</p>\n",
-       "<h3>Purpose</h3>\n",
-       "<p>The purpose of the Descriptive Statistics metric is to provide a comprehensive summary of both numerical and\n",
-       "categorical data within a dataset. This involves statistics such as count, mean, standard deviation, minimum and\n",
-       "maximum values for numerical data. For categorical data, it calculates the count, number of unique values, most\n",
-       "common value and its frequency, and the proportion of the most frequent value relative to the total. The goal is to\n",
-       "visualize the overall distribution of the variables in the dataset, aiding in understanding the model's behavior\n",
-       "and predicting its performance.</p>\n",
-       "<h3>Test Mechanism</h3>\n",
-       "<p>The testing mechanism utilizes two in-built functions of pandas dataframes: <code>describe()</code> for numerical fields and\n",
-       "<code>value_counts()</code> for categorical fields. The <code>describe()</code> function pulls out several summary statistics, while\n",
-       "<code>value_counts()</code> accounts for unique values. The resulting data is formatted into two distinct tables, one for\n",
-       "numerical and another for categorical variable summaries. These tables provide a clear summary of the main\n",
-       "characteristics of the variables, which can be instrumental in assessing the model's performance.</p>\n",
-       "<h3>Signs of High Risk</h3>\n",
-       "<ul>\n",
-       "<li>Skewed data or significant outliers can represent high risk. For numerical data, this may be reflected via a\n",
-       "significant difference between the mean and median (50% percentile).</li>\n",
-       "<li>For categorical data, a lack of diversity (low count of unique values), or overdominance of a single category\n",
-       "(high frequency of the top value) can indicate high risk.</li>\n",
-       "</ul>\n",
-       "<h3>Strengths</h3>\n",
-       "<ul>\n",
-       "<li>Provides a comprehensive summary of the dataset, shedding light on the distribution and characteristics of the\n",
-       "variables under consideration.</li>\n",
-       "<li>It is a versatile and robust method, applicable to both numerical and categorical data.</li>\n",
-       "<li>Helps highlight crucial anomalies such as outliers, extreme skewness, or lack of diversity, which are vital in\n",
-       "understanding model behavior during testing and validation.</li>\n",
-       "</ul>\n",
-       "<h3>Limitations</h3>\n",
-       "<ul>\n",
-       "<li>While this metric offers a high-level overview of the data, it may fail to detect subtle correlations or complex\n",
-       "patterns.</li>\n",
-       "<li>Does not offer any insights on the relationship between variables.</li>\n",
-       "<li>Alone, descriptive statistics cannot be used to infer properties about future unseen data.</li>\n",
-       "<li>Should be used in conjunction with other statistical tests to provide a comprehensive understanding of the\n",
-       "model's data.</li>\n",
-       "</ul>\n",
-       "\n",
-       "  </div>\n",
-       "</div>\n",
-       "\n",
-       "<h4 class=\"vm_required_context\">\n",
-       "  Required Inputs: <span style=\"font-size: 13px\"><i>dataset</i></span>\n",
-       "</h4>\n",
-       "\n",
-       "<div style=\"display: none;\">\n",
-       "  <h4>Parameters:</h4>\n",
-       "  <table class=\"vm_params_table\" style=\"display: none;\">\n",
-       "      <tr>\n",
-       "          <th>Parameter</th>\n",
-       "          <th>Default Value</th>\n",
-       "      </tr>\n",
-       "      \n",
-       "  </table>\n",
-       "</div>\n",
-       "\n",
-       "<div class=\"unset\">\n",
-       "  <h3>How to Run:</h3>\n",
-       "\n",
-       "  <button\n",
-       "      onclick=\"(() => {e = document.getElementById('expandable_instructions_7e3e1a19-00f2-4e0b-95b6-720bc7e3ba8b'); e.style.display === 'none' ? e.style.display = 'block' : e.style.display = 'none'})()\"\n",
-       "  >Show/Hide Instructions</button>\n",
-       "\n",
-       "  <div id=\"expandable_instructions_7e3e1a19-00f2-4e0b-95b6-720bc7e3ba8b\" style=\"display: block;\">\n",
-       "  <h4>Code:</h4>\n",
-       "    <pre>\n",
-       "        <code class='language-python'>\n",
-       "import validmind as vm\n",
-       "\n",
-       "# inputs dictionary maps your inputs to the expected input names\n",
-       "# keys are the expected input names and values are the actual inputs\n",
-       "# values may be string input_ids or the actual VMDataset or VMModel objects\n",
-       "inputs = {\n",
-       "    \"dataset\": \"my_vm_dataset\"\n",
-       "}\n",
-       "params = {}\n",
-       "\n",
-       "# to run and view the result of this test, run the following code:\n",
-       "result = vm.tests.run_test(\n",
-       "  \"validmind.data_validation.DescriptiveStatistics\", inputs=inputs, params=params\n",
-       ")\n",
-       "\n",
-       "# To see the result of the test, ensure that you have called `vm.init()` and then run:\n",
-       "result.log()</code>\n",
-       "    </pre>\n",
-       "  </div>\n",
-       "</div>\n",
-       "\n",
-       "<style>\n",
-       "h5.vm_required_context {\n",
-       "    margin-top: 25px;\n",
-       "}\n",
-       "table.vm_params_table {\n",
-       "  margin-top: 20px;\n",
-       "  width: 350px;\n",
-       "  border-collapse: collapse;\n",
-       "  border-color: --jp-border-color0;\n",
-       "}\n",
-       "table.vm_params_table td, table.vm_params_table th {\n",
-       "  text-align: right;\n",
-       "}\n",
-       "table.vm_params_table td:first-child, table.vm_params_table th:first-child {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "table.vm_params_table th {\n",
-       "  background-color: --jp-content-color0;\n",
-       "  font-weight: bold;\n",
-       "  font-size: 14px !important;\n",
-       "}\n",
-       "table.vm_params_table tr:nth-child(even) {\n",
-       "  background-color: --jp-layout-color1;\n",
-       "}\n",
-       "table.vm_params_table tr:nth-child(odd) {\n",
-       "  background-color: --jp-layout-color2;\n",
-       "}\n",
-       "table.vm_params_table tr:hover {\n",
-       "  background-color: --jp-layout-color3;\n",
-       "}\n",
-       "table.vm_params_table td, table.vm_params_table th {\n",
-       "  padding: 5px;\n",
-       "  border: .8px solid --jp-border-color0;\n",
-       "}\n",
-       "</style>\n",
-       "\n",
-       "                </div>\n",
-       "            </div>\n",
-       "            \n",
-       "        </div>\n",
-       "\n",
-       "        <script>\n",
-       "        function toggleAccordionItem(itemId) {\n",
-       "            const content = document.getElementById(itemId);\n",
-       "            const toggle = document.getElementById(itemId + '-toggle');\n",
-       "\n",
-       "            if (content.style.display === 'none' || content.style.display === '') {\n",
-       "                content.style.display = 'block';\n",
-       "                toggle.innerHTML = '▼';\n",
-       "            } else {\n",
-       "                content.style.display = 'none';\n",
-       "                toggle.innerHTML = '▶';\n",
-       "            }\n",
-       "        }\n",
-       "        </script>\n",
-       "        "
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.test_suites.describe_suite(\"classifier_full_suite\", verbose=True)"
       ],
-      "text/plain": [
-       "<IPython.core.display.HTML object>"
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "execute_result",
+          "data": {
+            "text/html": [
+              "<style type=\"text/css\">\n",
+              "#T_7cb1b th {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "#T_7cb1b_row0_col0, #T_7cb1b_row0_col1, #T_7cb1b_row0_col2, #T_7cb1b_row0_col3, #T_7cb1b_row0_col4, #T_7cb1b_row1_col0, #T_7cb1b_row1_col1, #T_7cb1b_row1_col2, #T_7cb1b_row1_col3, #T_7cb1b_row1_col4, #T_7cb1b_row2_col0, #T_7cb1b_row2_col1, #T_7cb1b_row2_col2, #T_7cb1b_row2_col3, #T_7cb1b_row2_col4, #T_7cb1b_row3_col0, #T_7cb1b_row3_col1, #T_7cb1b_row3_col2, #T_7cb1b_row3_col3, #T_7cb1b_row3_col4, #T_7cb1b_row4_col0, #T_7cb1b_row4_col1, #T_7cb1b_row4_col2, #T_7cb1b_row4_col3, #T_7cb1b_row4_col4, #T_7cb1b_row5_col0, #T_7cb1b_row5_col1, #T_7cb1b_row5_col2, #T_7cb1b_row5_col3, #T_7cb1b_row5_col4, #T_7cb1b_row6_col0, #T_7cb1b_row6_col1, #T_7cb1b_row6_col2, #T_7cb1b_row6_col3, #T_7cb1b_row6_col4, #T_7cb1b_row7_col0, #T_7cb1b_row7_col1, #T_7cb1b_row7_col2, #T_7cb1b_row7_col3, #T_7cb1b_row7_col4, #T_7cb1b_row8_col0, #T_7cb1b_row8_col1, #T_7cb1b_row8_col2, #T_7cb1b_row8_col3, #T_7cb1b_row8_col4, #T_7cb1b_row9_col0, #T_7cb1b_row9_col1, #T_7cb1b_row9_col2, #T_7cb1b_row9_col3, #T_7cb1b_row9_col4, #T_7cb1b_row10_col0, #T_7cb1b_row10_col1, #T_7cb1b_row10_col2, #T_7cb1b_row10_col3, #T_7cb1b_row10_col4, #T_7cb1b_row11_col0, #T_7cb1b_row11_col1, #T_7cb1b_row11_col2, #T_7cb1b_row11_col3, #T_7cb1b_row11_col4, #T_7cb1b_row12_col0, #T_7cb1b_row12_col1, #T_7cb1b_row12_col2, #T_7cb1b_row12_col3, #T_7cb1b_row12_col4, #T_7cb1b_row13_col0, #T_7cb1b_row13_col1, #T_7cb1b_row13_col2, #T_7cb1b_row13_col3, #T_7cb1b_row13_col4, #T_7cb1b_row14_col0, #T_7cb1b_row14_col1, #T_7cb1b_row14_col2, #T_7cb1b_row14_col3, #T_7cb1b_row14_col4, #T_7cb1b_row15_col0, #T_7cb1b_row15_col1, #T_7cb1b_row15_col2, #T_7cb1b_row15_col3, #T_7cb1b_row15_col4, #T_7cb1b_row16_col0, #T_7cb1b_row16_col1, #T_7cb1b_row16_col2, #T_7cb1b_row16_col3, #T_7cb1b_row16_col4, #T_7cb1b_row17_col0, #T_7cb1b_row17_col1, #T_7cb1b_row17_col2, #T_7cb1b_row17_col3, #T_7cb1b_row17_col4, #T_7cb1b_row18_col0, #T_7cb1b_row18_col1, #T_7cb1b_row18_col2, #T_7cb1b_row18_col3, #T_7cb1b_row18_col4, #T_7cb1b_row19_col0, 
#T_7cb1b_row19_col1, #T_7cb1b_row19_col2, #T_7cb1b_row19_col3, #T_7cb1b_row19_col4, #T_7cb1b_row20_col0, #T_7cb1b_row20_col1, #T_7cb1b_row20_col2, #T_7cb1b_row20_col3, #T_7cb1b_row20_col4, #T_7cb1b_row21_col0, #T_7cb1b_row21_col1, #T_7cb1b_row21_col2, #T_7cb1b_row21_col3, #T_7cb1b_row21_col4, #T_7cb1b_row22_col0, #T_7cb1b_row22_col1, #T_7cb1b_row22_col2, #T_7cb1b_row22_col3, #T_7cb1b_row22_col4, #T_7cb1b_row23_col0, #T_7cb1b_row23_col1, #T_7cb1b_row23_col2, #T_7cb1b_row23_col3, #T_7cb1b_row23_col4, #T_7cb1b_row24_col0, #T_7cb1b_row24_col1, #T_7cb1b_row24_col2, #T_7cb1b_row24_col3, #T_7cb1b_row24_col4, #T_7cb1b_row25_col0, #T_7cb1b_row25_col1, #T_7cb1b_row25_col2, #T_7cb1b_row25_col3, #T_7cb1b_row25_col4, #T_7cb1b_row26_col0, #T_7cb1b_row26_col1, #T_7cb1b_row26_col2, #T_7cb1b_row26_col3, #T_7cb1b_row26_col4, #T_7cb1b_row27_col0, #T_7cb1b_row27_col1, #T_7cb1b_row27_col2, #T_7cb1b_row27_col3, #T_7cb1b_row27_col4 {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "</style>\n",
+              "<table id=\"T_7cb1b\">\n",
+              "  <thead>\n",
+              "    <tr>\n",
+              "      <th id=\"T_7cb1b_level0_col0\" class=\"col_heading level0 col0\" >Test Suite ID</th>\n",
+              "      <th id=\"T_7cb1b_level0_col1\" class=\"col_heading level0 col1\" >Test Suite Name</th>\n",
+              "      <th id=\"T_7cb1b_level0_col2\" class=\"col_heading level0 col2\" >Test Suite Section</th>\n",
+              "      <th id=\"T_7cb1b_level0_col3\" class=\"col_heading level0 col3\" >Test ID</th>\n",
+              "      <th id=\"T_7cb1b_level0_col4\" class=\"col_heading level0 col4\" >Test Name</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row0_col0\" class=\"data row0 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row0_col1\" class=\"data row0 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row0_col2\" class=\"data row0 col2\" >tabular_dataset_description</td>\n",
+              "      <td id=\"T_7cb1b_row0_col3\" class=\"data row0 col3\" >validmind.data_validation.DatasetDescription</td>\n",
+              "      <td id=\"T_7cb1b_row0_col4\" class=\"data row0 col4\" >Dataset Description</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row1_col0\" class=\"data row1 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row1_col1\" class=\"data row1 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row1_col2\" class=\"data row1 col2\" >tabular_dataset_description</td>\n",
+              "      <td id=\"T_7cb1b_row1_col3\" class=\"data row1 col3\" >validmind.data_validation.DescriptiveStatistics</td>\n",
+              "      <td id=\"T_7cb1b_row1_col4\" class=\"data row1 col4\" >Descriptive Statistics</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row2_col0\" class=\"data row2 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row2_col1\" class=\"data row2 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row2_col2\" class=\"data row2 col2\" >tabular_dataset_description</td>\n",
+              "      <td id=\"T_7cb1b_row2_col3\" class=\"data row2 col3\" >validmind.data_validation.PearsonCorrelationMatrix</td>\n",
+              "      <td id=\"T_7cb1b_row2_col4\" class=\"data row2 col4\" >Pearson Correlation Matrix</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row3_col0\" class=\"data row3 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row3_col1\" class=\"data row3 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row3_col2\" class=\"data row3 col2\" >tabular_data_quality</td>\n",
+              "      <td id=\"T_7cb1b_row3_col3\" class=\"data row3 col3\" >validmind.data_validation.ClassImbalance</td>\n",
+              "      <td id=\"T_7cb1b_row3_col4\" class=\"data row3 col4\" >Class Imbalance</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row4_col0\" class=\"data row4 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row4_col1\" class=\"data row4 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row4_col2\" class=\"data row4 col2\" >tabular_data_quality</td>\n",
+              "      <td id=\"T_7cb1b_row4_col3\" class=\"data row4 col3\" >validmind.data_validation.Duplicates</td>\n",
+              "      <td id=\"T_7cb1b_row4_col4\" class=\"data row4 col4\" >Duplicates</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row5_col0\" class=\"data row5 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row5_col1\" class=\"data row5 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row5_col2\" class=\"data row5 col2\" >tabular_data_quality</td>\n",
+              "      <td id=\"T_7cb1b_row5_col3\" class=\"data row5 col3\" >validmind.data_validation.HighCardinality</td>\n",
+              "      <td id=\"T_7cb1b_row5_col4\" class=\"data row5 col4\" >High Cardinality</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row6_col0\" class=\"data row6 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row6_col1\" class=\"data row6 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row6_col2\" class=\"data row6 col2\" >tabular_data_quality</td>\n",
+              "      <td id=\"T_7cb1b_row6_col3\" class=\"data row6 col3\" >validmind.data_validation.HighPearsonCorrelation</td>\n",
+              "      <td id=\"T_7cb1b_row6_col4\" class=\"data row6 col4\" >High Pearson Correlation</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row7_col0\" class=\"data row7 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row7_col1\" class=\"data row7 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row7_col2\" class=\"data row7 col2\" >tabular_data_quality</td>\n",
+              "      <td id=\"T_7cb1b_row7_col3\" class=\"data row7 col3\" >validmind.data_validation.MissingValues</td>\n",
+              "      <td id=\"T_7cb1b_row7_col4\" class=\"data row7 col4\" >Missing Values</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row8_col0\" class=\"data row8 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row8_col1\" class=\"data row8 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row8_col2\" class=\"data row8 col2\" >tabular_data_quality</td>\n",
+              "      <td id=\"T_7cb1b_row8_col3\" class=\"data row8 col3\" >validmind.data_validation.Skewness</td>\n",
+              "      <td id=\"T_7cb1b_row8_col4\" class=\"data row8 col4\" >Skewness</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row9_col0\" class=\"data row9 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row9_col1\" class=\"data row9 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row9_col2\" class=\"data row9 col2\" >tabular_data_quality</td>\n",
+              "      <td id=\"T_7cb1b_row9_col3\" class=\"data row9 col3\" >validmind.data_validation.UniqueRows</td>\n",
+              "      <td id=\"T_7cb1b_row9_col4\" class=\"data row9 col4\" >Unique Rows</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row10_col0\" class=\"data row10 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row10_col1\" class=\"data row10 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row10_col2\" class=\"data row10 col2\" >tabular_data_quality</td>\n",
+              "      <td id=\"T_7cb1b_row10_col3\" class=\"data row10 col3\" >validmind.data_validation.TooManyZeroValues</td>\n",
+              "      <td id=\"T_7cb1b_row10_col4\" class=\"data row10 col4\" >Too Many Zero Values</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row11_col0\" class=\"data row11 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row11_col1\" class=\"data row11 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row11_col2\" class=\"data row11 col2\" >classifier_metrics</td>\n",
+              "      <td id=\"T_7cb1b_row11_col3\" class=\"data row11 col3\" >validmind.model_validation.ModelMetadata</td>\n",
+              "      <td id=\"T_7cb1b_row11_col4\" class=\"data row11 col4\" >Model Metadata</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row12_col0\" class=\"data row12 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row12_col1\" class=\"data row12 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row12_col2\" class=\"data row12 col2\" >classifier_metrics</td>\n",
+              "      <td id=\"T_7cb1b_row12_col3\" class=\"data row12 col3\" >validmind.data_validation.DatasetSplit</td>\n",
+              "      <td id=\"T_7cb1b_row12_col4\" class=\"data row12 col4\" >Dataset Split</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row13_col0\" class=\"data row13 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row13_col1\" class=\"data row13 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row13_col2\" class=\"data row13 col2\" >classifier_metrics</td>\n",
+              "      <td id=\"T_7cb1b_row13_col3\" class=\"data row13 col3\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
+              "      <td id=\"T_7cb1b_row13_col4\" class=\"data row13 col4\" >Confusion Matrix</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row14_col0\" class=\"data row14 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row14_col1\" class=\"data row14 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row14_col2\" class=\"data row14 col2\" >classifier_metrics</td>\n",
+              "      <td id=\"T_7cb1b_row14_col3\" class=\"data row14 col3\" >validmind.model_validation.sklearn.ClassifierPerformance</td>\n",
+              "      <td id=\"T_7cb1b_row14_col4\" class=\"data row14 col4\" >Classifier Performance</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row15_col0\" class=\"data row15 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row15_col1\" class=\"data row15 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row15_col2\" class=\"data row15 col2\" >classifier_metrics</td>\n",
+              "      <td id=\"T_7cb1b_row15_col3\" class=\"data row15 col3\" >validmind.model_validation.sklearn.PermutationFeatureImportance</td>\n",
+              "      <td id=\"T_7cb1b_row15_col4\" class=\"data row15 col4\" >Permutation Feature Importance</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row16_col0\" class=\"data row16 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row16_col1\" class=\"data row16 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row16_col2\" class=\"data row16 col2\" >classifier_metrics</td>\n",
+              "      <td id=\"T_7cb1b_row16_col3\" class=\"data row16 col3\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
+              "      <td id=\"T_7cb1b_row16_col4\" class=\"data row16 col4\" >Precision Recall Curve</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row17_col0\" class=\"data row17 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row17_col1\" class=\"data row17 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row17_col2\" class=\"data row17 col2\" >classifier_metrics</td>\n",
+              "      <td id=\"T_7cb1b_row17_col3\" class=\"data row17 col3\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
+              "      <td id=\"T_7cb1b_row17_col4\" class=\"data row17 col4\" >ROC Curve</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row18_col0\" class=\"data row18 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row18_col1\" class=\"data row18 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row18_col2\" class=\"data row18 col2\" >classifier_metrics</td>\n",
+              "      <td id=\"T_7cb1b_row18_col3\" class=\"data row18 col3\" >validmind.model_validation.sklearn.PopulationStabilityIndex</td>\n",
+              "      <td id=\"T_7cb1b_row18_col4\" class=\"data row18 col4\" >Population Stability Index</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row19_col0\" class=\"data row19 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row19_col1\" class=\"data row19 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row19_col2\" class=\"data row19 col2\" >classifier_metrics</td>\n",
+              "      <td id=\"T_7cb1b_row19_col3\" class=\"data row19 col3\" >validmind.model_validation.sklearn.SHAPGlobalImportance</td>\n",
+              "      <td id=\"T_7cb1b_row19_col4\" class=\"data row19 col4\" >SHAP Global Importance</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row20_col0\" class=\"data row20 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row20_col1\" class=\"data row20 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row20_col2\" class=\"data row20 col2\" >classifier_validation</td>\n",
+              "      <td id=\"T_7cb1b_row20_col3\" class=\"data row20 col3\" >validmind.model_validation.sklearn.MinimumAccuracy</td>\n",
+              "      <td id=\"T_7cb1b_row20_col4\" class=\"data row20 col4\" >Minimum Accuracy</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row21_col0\" class=\"data row21 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row21_col1\" class=\"data row21 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row21_col2\" class=\"data row21 col2\" >classifier_validation</td>\n",
+              "      <td id=\"T_7cb1b_row21_col3\" class=\"data row21 col3\" >validmind.model_validation.sklearn.MinimumF1Score</td>\n",
+              "      <td id=\"T_7cb1b_row21_col4\" class=\"data row21 col4\" >Minimum F1 Score</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row22_col0\" class=\"data row22 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row22_col1\" class=\"data row22 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row22_col2\" class=\"data row22 col2\" >classifier_validation</td>\n",
+              "      <td id=\"T_7cb1b_row22_col3\" class=\"data row22 col3\" >validmind.model_validation.sklearn.MinimumROCAUCScore</td>\n",
+              "      <td id=\"T_7cb1b_row22_col4\" class=\"data row22 col4\" >Minimum ROCAUC Score</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row23_col0\" class=\"data row23 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row23_col1\" class=\"data row23 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row23_col2\" class=\"data row23 col2\" >classifier_validation</td>\n",
+              "      <td id=\"T_7cb1b_row23_col3\" class=\"data row23 col3\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
+              "      <td id=\"T_7cb1b_row23_col4\" class=\"data row23 col4\" >Training Test Degradation</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row24_col0\" class=\"data row24 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row24_col1\" class=\"data row24 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row24_col2\" class=\"data row24 col2\" >classifier_validation</td>\n",
+              "      <td id=\"T_7cb1b_row24_col3\" class=\"data row24 col3\" >validmind.model_validation.sklearn.ModelsPerformanceComparison</td>\n",
+              "      <td id=\"T_7cb1b_row24_col4\" class=\"data row24 col4\" >Models Performance Comparison</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row25_col0\" class=\"data row25 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row25_col1\" class=\"data row25 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row25_col2\" class=\"data row25 col2\" >classifier_model_diagnosis</td>\n",
+              "      <td id=\"T_7cb1b_row25_col3\" class=\"data row25 col3\" >validmind.model_validation.sklearn.OverfitDiagnosis</td>\n",
+              "      <td id=\"T_7cb1b_row25_col4\" class=\"data row25 col4\" >Overfit Diagnosis</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row26_col0\" class=\"data row26 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row26_col1\" class=\"data row26 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row26_col2\" class=\"data row26 col2\" >classifier_model_diagnosis</td>\n",
+              "      <td id=\"T_7cb1b_row26_col3\" class=\"data row26 col3\" >validmind.model_validation.sklearn.WeakspotsDiagnosis</td>\n",
+              "      <td id=\"T_7cb1b_row26_col4\" class=\"data row26 col4\" >Weakspots Diagnosis</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_7cb1b_row27_col0\" class=\"data row27 col0\" >classifier_full_suite</td>\n",
+              "      <td id=\"T_7cb1b_row27_col1\" class=\"data row27 col1\" >ClassifierFullSuite</td>\n",
+              "      <td id=\"T_7cb1b_row27_col2\" class=\"data row27 col2\" >classifier_model_diagnosis</td>\n",
+              "      <td id=\"T_7cb1b_row27_col3\" class=\"data row27 col3\" >validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
+              "      <td id=\"T_7cb1b_row27_col4\" class=\"data row27 col4\" >Robustness Diagnosis</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n"
+            ],
+            "text/plain": [
+              "<pandas.io.formats.style.Styler at 0x16a167fa0>"
+            ]
+          }
+        }
       ]
-     },
-     "metadata": {},
-     "output_type": "display_data"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### View test details\n",
+        "\n",
+        "To inspect a specific test in a suite, pass the name of the test to [tests.describe_test()](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) to get detailed information about the test such as its purpose, strengths and limitations:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.describe_test(\"validmind.data_validation.DescriptiveStatistics\")"
+      ],
+      "execution_count": null,
+      "outputs": [
+        {
+          "output_type": "display_data",
+          "data": {
+            "text/html": [
+              "\n",
+              "        <div class=\"vm-accordion\" id=\"accordion-c38a3af7\">\n",
+              "            \n",
+              "            <div class=\"vm-accordion-item\">\n",
+              "                <div class=\"vm-accordion-header\"\n",
+              "                     onclick=\"toggleAccordionItem('accordion-c38a3af7-item-0')\"\n",
+              "                     style=\"cursor: pointer; padding: 10px; background-color: #f8f9fa; border: 1px solid #dee2e6; font-weight: bold;\">\n",
+              "                    <span class=\"vm-accordion-toggle\" id=\"accordion-c38a3af7-item-0-toggle\">▶</span>\n",
+              "                    Test: Descriptive Statistics ('validmind.data_validation.DescriptiveStatistics')\n",
+              "                </div>\n",
+              "                <div class=\"vm-accordion-content\"\n",
+              "                     id=\"accordion-c38a3af7-item-0\"\n",
+              "                     style=\"display: none; padding: 15px; border: 1px solid #dee2e6; border-top: none;\">\n",
+              "                    \n",
+              "<div>\n",
+              "  <h2>Descriptive Statistics</h2>\n",
+              "  <div style=\"border: 1px solid #ddd; border-radius: 4px; padding: 10px; margin: 10px 0;\">\n",
+              "    <p>Performs a detailed descriptive statistical analysis of both numerical and categorical data within a model's\n",
+              "dataset.</p>\n",
+              "<h3>Purpose</h3>\n",
+              "<p>The purpose of the Descriptive Statistics metric is to provide a comprehensive summary of both numerical and\n",
+              "categorical data within a dataset. This involves statistics such as count, mean, standard deviation, minimum and\n",
+              "maximum values for numerical data. For categorical data, it calculates the count, number of unique values, most\n",
+              "common value and its frequency, and the proportion of the most frequent value relative to the total. The goal is to\n",
+              "visualize the overall distribution of the variables in the dataset, aiding in understanding the model's behavior\n",
+              "and predicting its performance.</p>\n",
+              "<h3>Test Mechanism</h3>\n",
+              "<p>The testing mechanism utilizes two in-built functions of pandas dataframes: <code>describe()</code> for numerical fields and\n",
+              "<code>value_counts()</code> for categorical fields. The <code>describe()</code> function pulls out several summary statistics, while\n",
+              "<code>value_counts()</code> accounts for unique values. The resulting data is formatted into two distinct tables, one for\n",
+              "numerical and another for categorical variable summaries. These tables provide a clear summary of the main\n",
+              "characteristics of the variables, which can be instrumental in assessing the model's performance.</p>\n",
+              "<h3>Signs of High Risk</h3>\n",
+              "<ul>\n",
+              "<li>Skewed data or significant outliers can represent high risk. For numerical data, this may be reflected via a\n",
+              "significant difference between the mean and median (50% percentile).</li>\n",
+              "<li>For categorical data, a lack of diversity (low count of unique values), or overdominance of a single category\n",
+              "(high frequency of the top value) can indicate high risk.</li>\n",
+              "</ul>\n",
+              "<h3>Strengths</h3>\n",
+              "<ul>\n",
+              "<li>Provides a comprehensive summary of the dataset, shedding light on the distribution and characteristics of the\n",
+              "variables under consideration.</li>\n",
+              "<li>It is a versatile and robust method, applicable to both numerical and categorical data.</li>\n",
+              "<li>Helps highlight crucial anomalies such as outliers, extreme skewness, or lack of diversity, which are vital in\n",
+              "understanding model behavior during testing and validation.</li>\n",
+              "</ul>\n",
+              "<h3>Limitations</h3>\n",
+              "<ul>\n",
+              "<li>While this metric offers a high-level overview of the data, it may fail to detect subtle correlations or complex\n",
+              "patterns.</li>\n",
+              "<li>Does not offer any insights on the relationship between variables.</li>\n",
+              "<li>Alone, descriptive statistics cannot be used to infer properties about future unseen data.</li>\n",
+              "<li>Should be used in conjunction with other statistical tests to provide a comprehensive understanding of the\n",
+              "model's data.</li>\n",
+              "</ul>\n",
+              "\n",
+              "  </div>\n",
+              "</div>\n",
+              "\n",
+              "<h4 class=\"vm_required_context\">\n",
+              "  Required Inputs: <span style=\"font-size: 13px\"><i>dataset</i></span>\n",
+              "</h4>\n",
+              "\n",
+              "<div style=\"display: none;\">\n",
+              "  <h4>Parameters:</h4>\n",
+              "  <table class=\"vm_params_table\" style=\"display: none;\">\n",
+              "      <tr>\n",
+              "          <th>Parameter</th>\n",
+              "          <th>Default Value</th>\n",
+              "      </tr>\n",
+              "      \n",
+              "  </table>\n",
+              "</div>\n",
+              "\n",
+              "<div class=\"unset\">\n",
+              "  <h3>How to Run:</h3>\n",
+              "\n",
+              "  <button\n",
+              "      onclick=\"(() => {e = document.getElementById('expandable_instructions_7e3e1a19-00f2-4e0b-95b6-720bc7e3ba8b'); e.style.display === 'none' ? e.style.display = 'block' : e.style.display = 'none'})()\"\n",
+              "  >Show/Hide Instructions</button>\n",
+              "\n",
+              "  <div id=\"expandable_instructions_7e3e1a19-00f2-4e0b-95b6-720bc7e3ba8b\" style=\"display: block;\">\n",
+              "  <h4>Code:</h4>\n",
+              "    <pre>\n",
+              "        <code class='language-python'>\n",
+              "import validmind as vm\n",
+              "\n",
+              "# inputs dictionary maps your inputs to the expected input names\n",
+              "# keys are the expected input names and values are the actual inputs\n",
+              "# values may be string input_ids or the actual VMDataset or VMModel objects\n",
+              "inputs = {\n",
+              "    \"dataset\": \"my_vm_dataset\"\n",
+              "}\n",
+              "params = {}\n",
+              "\n",
+              "# to run and view the result of this test, run the following code:\n",
+              "result = vm.tests.run_test(\n",
+              "  \"validmind.data_validation.DescriptiveStatistics\", inputs=inputs, params=params\n",
+              ")\n",
+              "\n",
+              "# To see the result of the test, ensure that you have called `vm.init()` and then run:\n",
+              "result.log()</code>\n",
+              "    </pre>\n",
+              "  </div>\n",
+              "</div>\n",
+              "\n",
+              "<style>\n",
+              "h5.vm_required_context {\n",
+              "    margin-top: 25px;\n",
+              "}\n",
+              "table.vm_params_table {\n",
+              "  margin-top: 20px;\n",
+              "  width: 350px;\n",
+              "  border-collapse: collapse;\n",
+              "  border-color: --jp-border-color0;\n",
+              "}\n",
+              "table.vm_params_table td, table.vm_params_table th {\n",
+              "  text-align: right;\n",
+              "}\n",
+              "table.vm_params_table td:first-child, table.vm_params_table th:first-child {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "table.vm_params_table th {\n",
+              "  background-color: --jp-content-color0;\n",
+              "  font-weight: bold;\n",
+              "  font-size: 14px !important;\n",
+              "}\n",
+              "table.vm_params_table tr:nth-child(even) {\n",
+              "  background-color: --jp-layout-color1;\n",
+              "}\n",
+              "table.vm_params_table tr:nth-child(odd) {\n",
+              "  background-color: --jp-layout-color2;\n",
+              "}\n",
+              "table.vm_params_table tr:hover {\n",
+              "  background-color: --jp-layout-color3;\n",
+              "}\n",
+              "table.vm_params_table td, table.vm_params_table th {\n",
+              "  padding: 5px;\n",
+              "  border: .8px solid --jp-border-color0;\n",
+              "}\n",
+              "</style>\n",
+              "\n",
+              "                </div>\n",
+              "            </div>\n",
+              "            \n",
+              "        </div>\n",
+              "\n",
+              "        <script>\n",
+              "        function toggleAccordionItem(itemId) {\n",
+              "            const content = document.getElementById(itemId);\n",
+              "            const toggle = document.getElementById(itemId + '-toggle');\n",
+              "\n",
+              "            if (content.style.display === 'none' || content.style.display === '') {\n",
+              "                content.style.display = 'block';\n",
+              "                toggle.innerHTML = '▼';\n",
+              "            } else {\n",
+              "                content.style.display = 'none';\n",
+              "                toggle.innerHTML = '▶';\n",
+              "            }\n",
+              "        }\n",
+              "        </script>\n",
+              "        "
+            ],
+            "text/plain": [
+              "<IPython.core.display.HTML object>"
+            ]
+          }
+        }
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "Now that you’ve learned how to identify ValidMind test suites relevant to your use cases, we encourage you to explore our interactive notebooks to discover additional tests, learn how to run them, and effectively document your records (models).\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn more about the individual tests available in the ValidMind Library</b></span>\n",
+        "<br></br>\n",
+        "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a> notebook for more code examples and usage of key functions.</div>\n",
+        "\n",
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you'll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-daee3ccea95b41b4b4bc81230a4a55f5"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
     }
-   ],
-   "source": [
-    "vm.tests.describe_test(\"validmind.data_validation.DescriptiveStatistics\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "Now that you’ve learned how to identify ValidMind test suites relevant to your use cases, we encourage you to explore our interactive notebooks to discover additional tests, learn how to run them, and effectively document your models.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn more about the individual tests available in the ValidMind Library</b></span>\n",
-    "<br></br>\n",
-    "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a> notebook for more code examples and usage of key functions.</div>\n",
-    "\n",
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you'll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-a3ad64253d204629b8f2e773414c6aeb",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
   },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}
+  "nbformat": 4,
+  "nbformat_minor": 2
+}
\ No newline at end of file
diff --git a/site/notebooks/how_to/tests/explore_tests/explore_tests.ipynb b/site/notebooks/how_to/tests/explore_tests/explore_tests.ipynb
index 3bfda30329..048459ea72 100644
--- a/site/notebooks/how_to/tests/explore_tests/explore_tests.ipynb
+++ b/site/notebooks/how_to/tests/explore_tests/explore_tests.ipynb
@@ -1,4463 +1,4469 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Explore tests\n",
-    "\n",
-    "Explore the individual out-the-box tests available in the ValidMind Library, and identify which tests to run to evaluate different aspects of your model. Browse available tests, view their descriptions, and filter by tags or task type to find tests relevant to your use case."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Install the ValidMind Library](#toc2__)    \n",
-    "- [List all available tests](#toc3__)    \n",
-    "- [Understand tags and task types](#toc4__)    \n",
-    "- [Filter tests by tags and task types](#toc5__)    \n",
-    "- [Store test sets for use](#toc6__)    \n",
-    "- [Next steps](#toc7__)    \n",
-    "  - [Discover more learning resources](#toc7_1__)    \n",
-    "- [Upgrade ValidMind](#toc8__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## List all available tests"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Start by importing the functions from the [validmind.tests](https://docs.validmind.ai/validmind/validmind/tests.html) module for listing tests, listing tasks, listing tags, and listing tasks and tags to access these functions in the rest of this notebook:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.tests import (\n",
-    "    list_tests,\n",
-    "    list_tasks,\n",
-    "    list_tags,\n",
-    "    list_tasks_and_tags,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Use [list_tests()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to retrieve all available ValidMind tests, which returns a DataFrame with the following columns:\n",
-    "\n",
-    "- **ID** – A unique identifier for each test.\n",
-    "- **Name** – The test’s name.\n",
-    "- **Description** – A short summary of what the test evaluates.\n",
-    "- **Tags** –  Keywords that describe what the test does or applies to.\n",
-    "- **Tasks** – The type of modeling task the test supports."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Explore tests\n",
+        "\n",
+        "Explore the individual out-of-the-box tests available in the ValidMind Library, and identify which tests to run to evaluate different aspects of your model. Browse available tests, view their descriptions, and filter by tags or task type to find tests relevant to your use case."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Install the ValidMind Library](#toc2__)    \n",
+        "- [List all available tests](#toc3__)    \n",
+        "- [Understand tags and task types](#toc4__)    \n",
+        "- [Filter tests by tags and task types](#toc5__)    \n",
+        "- [Store test sets for use](#toc6__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Discover more learning resources](#toc7_1__)    \n",
+        "- [Upgrade ValidMind](#toc8__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br><br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br><br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "%pip install -q validmind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## List all available tests"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Start by importing the functions from the [validmind.tests](https://docs.validmind.ai/validmind/validmind/tests.html) module for listing tests, listing tasks, listing tags, and listing tasks and tags, so that you can use them in the rest of this notebook:"
+      ]
+    },
     {
-     "data": {
-      "text/html": [
-       "<style type=\"text/css\">\n",
-       "#T_0502a th {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "#T_0502a_row0_col0, #T_0502a_row0_col1, #T_0502a_row0_col2, #T_0502a_row0_col3, #T_0502a_row0_col4, #T_0502a_row0_col5, #T_0502a_row0_col6, #T_0502a_row0_col7, #T_0502a_row0_col8, #T_0502a_row1_col0, #T_0502a_row1_col1, #T_0502a_row1_col2, #T_0502a_row1_col3, #T_0502a_row1_col4, #T_0502a_row1_col5, #T_0502a_row1_col6, #T_0502a_row1_col7, #T_0502a_row1_col8, #T_0502a_row2_col0, #T_0502a_row2_col1, #T_0502a_row2_col2, #T_0502a_row2_col3, #T_0502a_row2_col4, #T_0502a_row2_col5, #T_0502a_row2_col6, #T_0502a_row2_col7, #T_0502a_row2_col8, #T_0502a_row3_col0, #T_0502a_row3_col1, #T_0502a_row3_col2, #T_0502a_row3_col3, #T_0502a_row3_col4, #T_0502a_row3_col5, #T_0502a_row3_col6, #T_0502a_row3_col7, #T_0502a_row3_col8, #T_0502a_row4_col0, #T_0502a_row4_col1, #T_0502a_row4_col2, #T_0502a_row4_col3, #T_0502a_row4_col4, #T_0502a_row4_col5, #T_0502a_row4_col6, #T_0502a_row4_col7, #T_0502a_row4_col8, #T_0502a_row5_col0, #T_0502a_row5_col1, #T_0502a_row5_col2, #T_0502a_row5_col3, #T_0502a_row5_col4, #T_0502a_row5_col5, #T_0502a_row5_col6, #T_0502a_row5_col7, #T_0502a_row5_col8, #T_0502a_row6_col0, #T_0502a_row6_col1, #T_0502a_row6_col2, #T_0502a_row6_col3, #T_0502a_row6_col4, #T_0502a_row6_col5, #T_0502a_row6_col6, #T_0502a_row6_col7, #T_0502a_row6_col8, #T_0502a_row7_col0, #T_0502a_row7_col1, #T_0502a_row7_col2, #T_0502a_row7_col3, #T_0502a_row7_col4, #T_0502a_row7_col5, #T_0502a_row7_col6, #T_0502a_row7_col7, #T_0502a_row7_col8, #T_0502a_row8_col0, #T_0502a_row8_col1, #T_0502a_row8_col2, #T_0502a_row8_col3, #T_0502a_row8_col4, #T_0502a_row8_col5, #T_0502a_row8_col6, #T_0502a_row8_col7, #T_0502a_row8_col8, #T_0502a_row9_col0, #T_0502a_row9_col1, #T_0502a_row9_col2, #T_0502a_row9_col3, #T_0502a_row9_col4, #T_0502a_row9_col5, #T_0502a_row9_col6, #T_0502a_row9_col7, #T_0502a_row9_col8, #T_0502a_row10_col0, #T_0502a_row10_col1, #T_0502a_row10_col2, #T_0502a_row10_col3, #T_0502a_row10_col4, #T_0502a_row10_col5, #T_0502a_row10_col6, #T_0502a_row10_col7, #T_0502a_row10_col8, 
#T_0502a_row11_col0, #T_0502a_row11_col1, #T_0502a_row11_col2, #T_0502a_row11_col3, #T_0502a_row11_col4, #T_0502a_row11_col5, #T_0502a_row11_col6, #T_0502a_row11_col7, #T_0502a_row11_col8, #T_0502a_row12_col0, #T_0502a_row12_col1, #T_0502a_row12_col2, #T_0502a_row12_col3, #T_0502a_row12_col4, #T_0502a_row12_col5, #T_0502a_row12_col6, #T_0502a_row12_col7, #T_0502a_row12_col8, #T_0502a_row13_col0, #T_0502a_row13_col1, #T_0502a_row13_col2, #T_0502a_row13_col3, #T_0502a_row13_col4, #T_0502a_row13_col5, #T_0502a_row13_col6, #T_0502a_row13_col7, #T_0502a_row13_col8, #T_0502a_row14_col0, #T_0502a_row14_col1, #T_0502a_row14_col2, #T_0502a_row14_col3, #T_0502a_row14_col4, #T_0502a_row14_col5, #T_0502a_row14_col6, #T_0502a_row14_col7, #T_0502a_row14_col8, #T_0502a_row15_col0, #T_0502a_row15_col1, #T_0502a_row15_col2, #T_0502a_row15_col3, #T_0502a_row15_col4, #T_0502a_row15_col5, #T_0502a_row15_col6, #T_0502a_row15_col7, #T_0502a_row15_col8, #T_0502a_row16_col0, #T_0502a_row16_col1, #T_0502a_row16_col2, #T_0502a_row16_col3, #T_0502a_row16_col4, #T_0502a_row16_col5, #T_0502a_row16_col6, #T_0502a_row16_col7, #T_0502a_row16_col8, #T_0502a_row17_col0, #T_0502a_row17_col1, #T_0502a_row17_col2, #T_0502a_row17_col3, #T_0502a_row17_col4, #T_0502a_row17_col5, #T_0502a_row17_col6, #T_0502a_row17_col7, #T_0502a_row17_col8, #T_0502a_row18_col0, #T_0502a_row18_col1, #T_0502a_row18_col2, #T_0502a_row18_col3, #T_0502a_row18_col4, #T_0502a_row18_col5, #T_0502a_row18_col6, #T_0502a_row18_col7, #T_0502a_row18_col8, #T_0502a_row19_col0, #T_0502a_row19_col1, #T_0502a_row19_col2, #T_0502a_row19_col3, #T_0502a_row19_col4, #T_0502a_row19_col5, #T_0502a_row19_col6, #T_0502a_row19_col7, #T_0502a_row19_col8, #T_0502a_row20_col0, #T_0502a_row20_col1, #T_0502a_row20_col2, #T_0502a_row20_col3, #T_0502a_row20_col4, #T_0502a_row20_col5, #T_0502a_row20_col6, #T_0502a_row20_col7, #T_0502a_row20_col8, #T_0502a_row21_col0, #T_0502a_row21_col1, #T_0502a_row21_col2, #T_0502a_row21_col3, #T_0502a_row21_col4, 
#T_0502a_row21_col5, #T_0502a_row21_col6, #T_0502a_row21_col7, #T_0502a_row21_col8, #T_0502a_row22_col0, #T_0502a_row22_col1, #T_0502a_row22_col2, #T_0502a_row22_col3, #T_0502a_row22_col4, #T_0502a_row22_col5, #T_0502a_row22_col6, #T_0502a_row22_col7, #T_0502a_row22_col8, #T_0502a_row23_col0, #T_0502a_row23_col1, #T_0502a_row23_col2, #T_0502a_row23_col3, #T_0502a_row23_col4, #T_0502a_row23_col5, #T_0502a_row23_col6, #T_0502a_row23_col7, #T_0502a_row23_col8, #T_0502a_row24_col0, #T_0502a_row24_col1, #T_0502a_row24_col2, #T_0502a_row24_col3, #T_0502a_row24_col4, #T_0502a_row24_col5, #T_0502a_row24_col6, #T_0502a_row24_col7, #T_0502a_row24_col8, #T_0502a_row25_col0, #T_0502a_row25_col1, #T_0502a_row25_col2, #T_0502a_row25_col3, #T_0502a_row25_col4, #T_0502a_row25_col5, #T_0502a_row25_col6, #T_0502a_row25_col7, #T_0502a_row25_col8, #T_0502a_row26_col0, #T_0502a_row26_col1, #T_0502a_row26_col2, #T_0502a_row26_col3, #T_0502a_row26_col4, #T_0502a_row26_col5, #T_0502a_row26_col6, #T_0502a_row26_col7, #T_0502a_row26_col8, #T_0502a_row27_col0, #T_0502a_row27_col1, #T_0502a_row27_col2, #T_0502a_row27_col3, #T_0502a_row27_col4, #T_0502a_row27_col5, #T_0502a_row27_col6, #T_0502a_row27_col7, #T_0502a_row27_col8, #T_0502a_row28_col0, #T_0502a_row28_col1, #T_0502a_row28_col2, #T_0502a_row28_col3, #T_0502a_row28_col4, #T_0502a_row28_col5, #T_0502a_row28_col6, #T_0502a_row28_col7, #T_0502a_row28_col8, #T_0502a_row29_col0, #T_0502a_row29_col1, #T_0502a_row29_col2, #T_0502a_row29_col3, #T_0502a_row29_col4, #T_0502a_row29_col5, #T_0502a_row29_col6, #T_0502a_row29_col7, #T_0502a_row29_col8, #T_0502a_row30_col0, #T_0502a_row30_col1, #T_0502a_row30_col2, #T_0502a_row30_col3, #T_0502a_row30_col4, #T_0502a_row30_col5, #T_0502a_row30_col6, #T_0502a_row30_col7, #T_0502a_row30_col8, #T_0502a_row31_col0, #T_0502a_row31_col1, #T_0502a_row31_col2, #T_0502a_row31_col3, #T_0502a_row31_col4, #T_0502a_row31_col5, #T_0502a_row31_col6, #T_0502a_row31_col7, #T_0502a_row31_col8, #T_0502a_row32_col0, 
#T_0502a_row32_col1, #T_0502a_row32_col2, #T_0502a_row32_col3, #T_0502a_row32_col4, #T_0502a_row32_col5, #T_0502a_row32_col6, #T_0502a_row32_col7, #T_0502a_row32_col8, #T_0502a_row33_col0, #T_0502a_row33_col1, #T_0502a_row33_col2, #T_0502a_row33_col3, #T_0502a_row33_col4, #T_0502a_row33_col5, #T_0502a_row33_col6, #T_0502a_row33_col7, #T_0502a_row33_col8, #T_0502a_row34_col0, #T_0502a_row34_col1, #T_0502a_row34_col2, #T_0502a_row34_col3, #T_0502a_row34_col4, #T_0502a_row34_col5, #T_0502a_row34_col6, #T_0502a_row34_col7, #T_0502a_row34_col8, #T_0502a_row35_col0, #T_0502a_row35_col1, #T_0502a_row35_col2, #T_0502a_row35_col3, #T_0502a_row35_col4, #T_0502a_row35_col5, #T_0502a_row35_col6, #T_0502a_row35_col7, #T_0502a_row35_col8, #T_0502a_row36_col0, #T_0502a_row36_col1, #T_0502a_row36_col2, #T_0502a_row36_col3, #T_0502a_row36_col4, #T_0502a_row36_col5, #T_0502a_row36_col6, #T_0502a_row36_col7, #T_0502a_row36_col8, #T_0502a_row37_col0, #T_0502a_row37_col1, #T_0502a_row37_col2, #T_0502a_row37_col3, #T_0502a_row37_col4, #T_0502a_row37_col5, #T_0502a_row37_col6, #T_0502a_row37_col7, #T_0502a_row37_col8, #T_0502a_row38_col0, #T_0502a_row38_col1, #T_0502a_row38_col2, #T_0502a_row38_col3, #T_0502a_row38_col4, #T_0502a_row38_col5, #T_0502a_row38_col6, #T_0502a_row38_col7, #T_0502a_row38_col8, #T_0502a_row39_col0, #T_0502a_row39_col1, #T_0502a_row39_col2, #T_0502a_row39_col3, #T_0502a_row39_col4, #T_0502a_row39_col5, #T_0502a_row39_col6, #T_0502a_row39_col7, #T_0502a_row39_col8, #T_0502a_row40_col0, #T_0502a_row40_col1, #T_0502a_row40_col2, #T_0502a_row40_col3, #T_0502a_row40_col4, #T_0502a_row40_col5, #T_0502a_row40_col6, #T_0502a_row40_col7, #T_0502a_row40_col8, #T_0502a_row41_col0, #T_0502a_row41_col1, #T_0502a_row41_col2, #T_0502a_row41_col3, #T_0502a_row41_col4, #T_0502a_row41_col5, #T_0502a_row41_col6, #T_0502a_row41_col7, #T_0502a_row41_col8, #T_0502a_row42_col0, #T_0502a_row42_col1, #T_0502a_row42_col2, #T_0502a_row42_col3, #T_0502a_row42_col4, #T_0502a_row42_col5, 
#T_0502a_row42_col6, #T_0502a_row42_col7, #T_0502a_row42_col8, #T_0502a_row43_col0, #T_0502a_row43_col1, #T_0502a_row43_col2, #T_0502a_row43_col3, #T_0502a_row43_col4, #T_0502a_row43_col5, #T_0502a_row43_col6, #T_0502a_row43_col7, #T_0502a_row43_col8, #T_0502a_row44_col0, #T_0502a_row44_col1, #T_0502a_row44_col2, #T_0502a_row44_col3, #T_0502a_row44_col4, #T_0502a_row44_col5, #T_0502a_row44_col6, #T_0502a_row44_col7, #T_0502a_row44_col8, #T_0502a_row45_col0, #T_0502a_row45_col1, #T_0502a_row45_col2, #T_0502a_row45_col3, #T_0502a_row45_col4, #T_0502a_row45_col5, #T_0502a_row45_col6, #T_0502a_row45_col7, #T_0502a_row45_col8, #T_0502a_row46_col0, #T_0502a_row46_col1, #T_0502a_row46_col2, #T_0502a_row46_col3, #T_0502a_row46_col4, #T_0502a_row46_col5, #T_0502a_row46_col6, #T_0502a_row46_col7, #T_0502a_row46_col8, #T_0502a_row47_col0, #T_0502a_row47_col1, #T_0502a_row47_col2, #T_0502a_row47_col3, #T_0502a_row47_col4, #T_0502a_row47_col5, #T_0502a_row47_col6, #T_0502a_row47_col7, #T_0502a_row47_col8, #T_0502a_row48_col0, #T_0502a_row48_col1, #T_0502a_row48_col2, #T_0502a_row48_col3, #T_0502a_row48_col4, #T_0502a_row48_col5, #T_0502a_row48_col6, #T_0502a_row48_col7, #T_0502a_row48_col8, #T_0502a_row49_col0, #T_0502a_row49_col1, #T_0502a_row49_col2, #T_0502a_row49_col3, #T_0502a_row49_col4, #T_0502a_row49_col5, #T_0502a_row49_col6, #T_0502a_row49_col7, #T_0502a_row49_col8, #T_0502a_row50_col0, #T_0502a_row50_col1, #T_0502a_row50_col2, #T_0502a_row50_col3, #T_0502a_row50_col4, #T_0502a_row50_col5, #T_0502a_row50_col6, #T_0502a_row50_col7, #T_0502a_row50_col8, #T_0502a_row51_col0, #T_0502a_row51_col1, #T_0502a_row51_col2, #T_0502a_row51_col3, #T_0502a_row51_col4, #T_0502a_row51_col5, #T_0502a_row51_col6, #T_0502a_row51_col7, #T_0502a_row51_col8, #T_0502a_row52_col0, #T_0502a_row52_col1, #T_0502a_row52_col2, #T_0502a_row52_col3, #T_0502a_row52_col4, #T_0502a_row52_col5, #T_0502a_row52_col6, #T_0502a_row52_col7, #T_0502a_row52_col8, #T_0502a_row53_col0, #T_0502a_row53_col1, 
#T_0502a_row53_col2, #T_0502a_row53_col3, #T_0502a_row53_col4, #T_0502a_row53_col5, #T_0502a_row53_col6, #T_0502a_row53_col7, #T_0502a_row53_col8, #T_0502a_row54_col0, #T_0502a_row54_col1, #T_0502a_row54_col2, #T_0502a_row54_col3, #T_0502a_row54_col4, #T_0502a_row54_col5, #T_0502a_row54_col6, #T_0502a_row54_col7, #T_0502a_row54_col8, #T_0502a_row55_col0, #T_0502a_row55_col1, #T_0502a_row55_col2, #T_0502a_row55_col3, #T_0502a_row55_col4, #T_0502a_row55_col5, #T_0502a_row55_col6, #T_0502a_row55_col7, #T_0502a_row55_col8, #T_0502a_row56_col0, #T_0502a_row56_col1, #T_0502a_row56_col2, #T_0502a_row56_col3, #T_0502a_row56_col4, #T_0502a_row56_col5, #T_0502a_row56_col6, #T_0502a_row56_col7, #T_0502a_row56_col8, #T_0502a_row57_col0, #T_0502a_row57_col1, #T_0502a_row57_col2, #T_0502a_row57_col3, #T_0502a_row57_col4, #T_0502a_row57_col5, #T_0502a_row57_col6, #T_0502a_row57_col7, #T_0502a_row57_col8, #T_0502a_row58_col0, #T_0502a_row58_col1, #T_0502a_row58_col2, #T_0502a_row58_col3, #T_0502a_row58_col4, #T_0502a_row58_col5, #T_0502a_row58_col6, #T_0502a_row58_col7, #T_0502a_row58_col8, #T_0502a_row59_col0, #T_0502a_row59_col1, #T_0502a_row59_col2, #T_0502a_row59_col3, #T_0502a_row59_col4, #T_0502a_row59_col5, #T_0502a_row59_col6, #T_0502a_row59_col7, #T_0502a_row59_col8, #T_0502a_row60_col0, #T_0502a_row60_col1, #T_0502a_row60_col2, #T_0502a_row60_col3, #T_0502a_row60_col4, #T_0502a_row60_col5, #T_0502a_row60_col6, #T_0502a_row60_col7, #T_0502a_row60_col8, #T_0502a_row61_col0, #T_0502a_row61_col1, #T_0502a_row61_col2, #T_0502a_row61_col3, #T_0502a_row61_col4, #T_0502a_row61_col5, #T_0502a_row61_col6, #T_0502a_row61_col7, #T_0502a_row61_col8, #T_0502a_row62_col0, #T_0502a_row62_col1, #T_0502a_row62_col2, #T_0502a_row62_col3, #T_0502a_row62_col4, #T_0502a_row62_col5, #T_0502a_row62_col6, #T_0502a_row62_col7, #T_0502a_row62_col8, #T_0502a_row63_col0, #T_0502a_row63_col1, #T_0502a_row63_col2, #T_0502a_row63_col3, #T_0502a_row63_col4, #T_0502a_row63_col5, #T_0502a_row63_col6, 
#T_0502a_row63_col7, #T_0502a_row63_col8, #T_0502a_row64_col0, #T_0502a_row64_col1, #T_0502a_row64_col2, #T_0502a_row64_col3, #T_0502a_row64_col4, #T_0502a_row64_col5, #T_0502a_row64_col6, #T_0502a_row64_col7, #T_0502a_row64_col8, #T_0502a_row65_col0, #T_0502a_row65_col1, #T_0502a_row65_col2, #T_0502a_row65_col3, #T_0502a_row65_col4, #T_0502a_row65_col5, #T_0502a_row65_col6, #T_0502a_row65_col7, #T_0502a_row65_col8, #T_0502a_row66_col0, #T_0502a_row66_col1, #T_0502a_row66_col2, #T_0502a_row66_col3, #T_0502a_row66_col4, #T_0502a_row66_col5, #T_0502a_row66_col6, #T_0502a_row66_col7, #T_0502a_row66_col8, #T_0502a_row67_col0, #T_0502a_row67_col1, #T_0502a_row67_col2, #T_0502a_row67_col3, #T_0502a_row67_col4, #T_0502a_row67_col5, #T_0502a_row67_col6, #T_0502a_row67_col7, #T_0502a_row67_col8, #T_0502a_row68_col0, #T_0502a_row68_col1, #T_0502a_row68_col2, #T_0502a_row68_col3, #T_0502a_row68_col4, #T_0502a_row68_col5, #T_0502a_row68_col6, #T_0502a_row68_col7, #T_0502a_row68_col8, #T_0502a_row69_col0, #T_0502a_row69_col1, #T_0502a_row69_col2, #T_0502a_row69_col3, #T_0502a_row69_col4, #T_0502a_row69_col5, #T_0502a_row69_col6, #T_0502a_row69_col7, #T_0502a_row69_col8, #T_0502a_row70_col0, #T_0502a_row70_col1, #T_0502a_row70_col2, #T_0502a_row70_col3, #T_0502a_row70_col4, #T_0502a_row70_col5, #T_0502a_row70_col6, #T_0502a_row70_col7, #T_0502a_row70_col8, #T_0502a_row71_col0, #T_0502a_row71_col1, #T_0502a_row71_col2, #T_0502a_row71_col3, #T_0502a_row71_col4, #T_0502a_row71_col5, #T_0502a_row71_col6, #T_0502a_row71_col7, #T_0502a_row71_col8, #T_0502a_row72_col0, #T_0502a_row72_col1, #T_0502a_row72_col2, #T_0502a_row72_col3, #T_0502a_row72_col4, #T_0502a_row72_col5, #T_0502a_row72_col6, #T_0502a_row72_col7, #T_0502a_row72_col8, #T_0502a_row73_col0, #T_0502a_row73_col1, #T_0502a_row73_col2, #T_0502a_row73_col3, #T_0502a_row73_col4, #T_0502a_row73_col5, #T_0502a_row73_col6, #T_0502a_row73_col7, #T_0502a_row73_col8, #T_0502a_row74_col0, #T_0502a_row74_col1, #T_0502a_row74_col2, 
#T_0502a_row74_col3, #T_0502a_row74_col4, #T_0502a_row74_col5, #T_0502a_row74_col6, #T_0502a_row74_col7, #T_0502a_row74_col8, #T_0502a_row75_col0, #T_0502a_row75_col1, #T_0502a_row75_col2, #T_0502a_row75_col3, #T_0502a_row75_col4, #T_0502a_row75_col5, #T_0502a_row75_col6, #T_0502a_row75_col7, #T_0502a_row75_col8, #T_0502a_row76_col0, #T_0502a_row76_col1, #T_0502a_row76_col2, #T_0502a_row76_col3, #T_0502a_row76_col4, #T_0502a_row76_col5, #T_0502a_row76_col6, #T_0502a_row76_col7, #T_0502a_row76_col8, #T_0502a_row77_col0, #T_0502a_row77_col1, #T_0502a_row77_col2, #T_0502a_row77_col3, #T_0502a_row77_col4, #T_0502a_row77_col5, #T_0502a_row77_col6, #T_0502a_row77_col7, #T_0502a_row77_col8, #T_0502a_row78_col0, #T_0502a_row78_col1, #T_0502a_row78_col2, #T_0502a_row78_col3, #T_0502a_row78_col4, #T_0502a_row78_col5, #T_0502a_row78_col6, #T_0502a_row78_col7, #T_0502a_row78_col8, #T_0502a_row79_col0, #T_0502a_row79_col1, #T_0502a_row79_col2, #T_0502a_row79_col3, #T_0502a_row79_col4, #T_0502a_row79_col5, #T_0502a_row79_col6, #T_0502a_row79_col7, #T_0502a_row79_col8, #T_0502a_row80_col0, #T_0502a_row80_col1, #T_0502a_row80_col2, #T_0502a_row80_col3, #T_0502a_row80_col4, #T_0502a_row80_col5, #T_0502a_row80_col6, #T_0502a_row80_col7, #T_0502a_row80_col8, #T_0502a_row81_col0, #T_0502a_row81_col1, #T_0502a_row81_col2, #T_0502a_row81_col3, #T_0502a_row81_col4, #T_0502a_row81_col5, #T_0502a_row81_col6, #T_0502a_row81_col7, #T_0502a_row81_col8, #T_0502a_row82_col0, #T_0502a_row82_col1, #T_0502a_row82_col2, #T_0502a_row82_col3, #T_0502a_row82_col4, #T_0502a_row82_col5, #T_0502a_row82_col6, #T_0502a_row82_col7, #T_0502a_row82_col8, #T_0502a_row83_col0, #T_0502a_row83_col1, #T_0502a_row83_col2, #T_0502a_row83_col3, #T_0502a_row83_col4, #T_0502a_row83_col5, #T_0502a_row83_col6, #T_0502a_row83_col7, #T_0502a_row83_col8, #T_0502a_row84_col0, #T_0502a_row84_col1, #T_0502a_row84_col2, #T_0502a_row84_col3, #T_0502a_row84_col4, #T_0502a_row84_col5, #T_0502a_row84_col6, #T_0502a_row84_col7, 
#T_0502a_row84_col8, #T_0502a_row85_col0, #T_0502a_row85_col1, #T_0502a_row85_col2, #T_0502a_row85_col3, #T_0502a_row85_col4, #T_0502a_row85_col5, #T_0502a_row85_col6, #T_0502a_row85_col7, #T_0502a_row85_col8, #T_0502a_row86_col0, #T_0502a_row86_col1, #T_0502a_row86_col2, #T_0502a_row86_col3, #T_0502a_row86_col4, #T_0502a_row86_col5, #T_0502a_row86_col6, #T_0502a_row86_col7, #T_0502a_row86_col8, #T_0502a_row87_col0, #T_0502a_row87_col1, #T_0502a_row87_col2, #T_0502a_row87_col3, #T_0502a_row87_col4, #T_0502a_row87_col5, #T_0502a_row87_col6, #T_0502a_row87_col7, #T_0502a_row87_col8, #T_0502a_row88_col0, #T_0502a_row88_col1, #T_0502a_row88_col2, #T_0502a_row88_col3, #T_0502a_row88_col4, #T_0502a_row88_col5, #T_0502a_row88_col6, #T_0502a_row88_col7, #T_0502a_row88_col8, #T_0502a_row89_col0, #T_0502a_row89_col1, #T_0502a_row89_col2, #T_0502a_row89_col3, #T_0502a_row89_col4, #T_0502a_row89_col5, #T_0502a_row89_col6, #T_0502a_row89_col7, #T_0502a_row89_col8, #T_0502a_row90_col0, #T_0502a_row90_col1, #T_0502a_row90_col2, #T_0502a_row90_col3, #T_0502a_row90_col4, #T_0502a_row90_col5, #T_0502a_row90_col6, #T_0502a_row90_col7, #T_0502a_row90_col8, #T_0502a_row91_col0, #T_0502a_row91_col1, #T_0502a_row91_col2, #T_0502a_row91_col3, #T_0502a_row91_col4, #T_0502a_row91_col5, #T_0502a_row91_col6, #T_0502a_row91_col7, #T_0502a_row91_col8, #T_0502a_row92_col0, #T_0502a_row92_col1, #T_0502a_row92_col2, #T_0502a_row92_col3, #T_0502a_row92_col4, #T_0502a_row92_col5, #T_0502a_row92_col6, #T_0502a_row92_col7, #T_0502a_row92_col8, #T_0502a_row93_col0, #T_0502a_row93_col1, #T_0502a_row93_col2, #T_0502a_row93_col3, #T_0502a_row93_col4, #T_0502a_row93_col5, #T_0502a_row93_col6, #T_0502a_row93_col7, #T_0502a_row93_col8, #T_0502a_row94_col0, #T_0502a_row94_col1, #T_0502a_row94_col2, #T_0502a_row94_col3, #T_0502a_row94_col4, #T_0502a_row94_col5, #T_0502a_row94_col6, #T_0502a_row94_col7, #T_0502a_row94_col8, #T_0502a_row95_col0, #T_0502a_row95_col1, #T_0502a_row95_col2, #T_0502a_row95_col3, 
#T_0502a_row95_col4, #T_0502a_row95_col5, #T_0502a_row95_col6, #T_0502a_row95_col7, #T_0502a_row95_col8, #T_0502a_row96_col0, #T_0502a_row96_col1, #T_0502a_row96_col2, #T_0502a_row96_col3, #T_0502a_row96_col4, #T_0502a_row96_col5, #T_0502a_row96_col6, #T_0502a_row96_col7, #T_0502a_row96_col8, #T_0502a_row97_col0, #T_0502a_row97_col1, #T_0502a_row97_col2, #T_0502a_row97_col3, #T_0502a_row97_col4, #T_0502a_row97_col5, #T_0502a_row97_col6, #T_0502a_row97_col7, #T_0502a_row97_col8, #T_0502a_row98_col0, #T_0502a_row98_col1, #T_0502a_row98_col2, #T_0502a_row98_col3, #T_0502a_row98_col4, #T_0502a_row98_col5, #T_0502a_row98_col6, #T_0502a_row98_col7, #T_0502a_row98_col8, #T_0502a_row99_col0, #T_0502a_row99_col1, #T_0502a_row99_col2, #T_0502a_row99_col3, #T_0502a_row99_col4, #T_0502a_row99_col5, #T_0502a_row99_col6, #T_0502a_row99_col7, #T_0502a_row99_col8, #T_0502a_row100_col0, #T_0502a_row100_col1, #T_0502a_row100_col2, #T_0502a_row100_col3, #T_0502a_row100_col4, #T_0502a_row100_col5, #T_0502a_row100_col6, #T_0502a_row100_col7, #T_0502a_row100_col8, #T_0502a_row101_col0, #T_0502a_row101_col1, #T_0502a_row101_col2, #T_0502a_row101_col3, #T_0502a_row101_col4, #T_0502a_row101_col5, #T_0502a_row101_col6, #T_0502a_row101_col7, #T_0502a_row101_col8, #T_0502a_row102_col0, #T_0502a_row102_col1, #T_0502a_row102_col2, #T_0502a_row102_col3, #T_0502a_row102_col4, #T_0502a_row102_col5, #T_0502a_row102_col6, #T_0502a_row102_col7, #T_0502a_row102_col8, #T_0502a_row103_col0, #T_0502a_row103_col1, #T_0502a_row103_col2, #T_0502a_row103_col3, #T_0502a_row103_col4, #T_0502a_row103_col5, #T_0502a_row103_col6, #T_0502a_row103_col7, #T_0502a_row103_col8, #T_0502a_row104_col0, #T_0502a_row104_col1, #T_0502a_row104_col2, #T_0502a_row104_col3, #T_0502a_row104_col4, #T_0502a_row104_col5, #T_0502a_row104_col6, #T_0502a_row104_col7, #T_0502a_row104_col8, #T_0502a_row105_col0, #T_0502a_row105_col1, #T_0502a_row105_col2, #T_0502a_row105_col3, #T_0502a_row105_col4, #T_0502a_row105_col5, 
#T_0502a_row105_col6, #T_0502a_row105_col7, #T_0502a_row105_col8, #T_0502a_row106_col0, #T_0502a_row106_col1, #T_0502a_row106_col2, #T_0502a_row106_col3, #T_0502a_row106_col4, #T_0502a_row106_col5, #T_0502a_row106_col6, #T_0502a_row106_col7, #T_0502a_row106_col8, #T_0502a_row107_col0, #T_0502a_row107_col1, #T_0502a_row107_col2, #T_0502a_row107_col3, #T_0502a_row107_col4, #T_0502a_row107_col5, #T_0502a_row107_col6, #T_0502a_row107_col7, #T_0502a_row107_col8, #T_0502a_row108_col0, #T_0502a_row108_col1, #T_0502a_row108_col2, #T_0502a_row108_col3, #T_0502a_row108_col4, #T_0502a_row108_col5, #T_0502a_row108_col6, #T_0502a_row108_col7, #T_0502a_row108_col8, #T_0502a_row109_col0, #T_0502a_row109_col1, #T_0502a_row109_col2, #T_0502a_row109_col3, #T_0502a_row109_col4, #T_0502a_row109_col5, #T_0502a_row109_col6, #T_0502a_row109_col7, #T_0502a_row109_col8, #T_0502a_row110_col0, #T_0502a_row110_col1, #T_0502a_row110_col2, #T_0502a_row110_col3, #T_0502a_row110_col4, #T_0502a_row110_col5, #T_0502a_row110_col6, #T_0502a_row110_col7, #T_0502a_row110_col8, #T_0502a_row111_col0, #T_0502a_row111_col1, #T_0502a_row111_col2, #T_0502a_row111_col3, #T_0502a_row111_col4, #T_0502a_row111_col5, #T_0502a_row111_col6, #T_0502a_row111_col7, #T_0502a_row111_col8, #T_0502a_row112_col0, #T_0502a_row112_col1, #T_0502a_row112_col2, #T_0502a_row112_col3, #T_0502a_row112_col4, #T_0502a_row112_col5, #T_0502a_row112_col6, #T_0502a_row112_col7, #T_0502a_row112_col8, #T_0502a_row113_col0, #T_0502a_row113_col1, #T_0502a_row113_col2, #T_0502a_row113_col3, #T_0502a_row113_col4, #T_0502a_row113_col5, #T_0502a_row113_col6, #T_0502a_row113_col7, #T_0502a_row113_col8, #T_0502a_row114_col0, #T_0502a_row114_col1, #T_0502a_row114_col2, #T_0502a_row114_col3, #T_0502a_row114_col4, #T_0502a_row114_col5, #T_0502a_row114_col6, #T_0502a_row114_col7, #T_0502a_row114_col8, #T_0502a_row115_col0, #T_0502a_row115_col1, #T_0502a_row115_col2, #T_0502a_row115_col3, #T_0502a_row115_col4, #T_0502a_row115_col5, 
#T_0502a_row115_col6, #T_0502a_row115_col7, #T_0502a_row115_col8, #T_0502a_row116_col0, #T_0502a_row116_col1, #T_0502a_row116_col2, #T_0502a_row116_col3, #T_0502a_row116_col4, #T_0502a_row116_col5, #T_0502a_row116_col6, #T_0502a_row116_col7, #T_0502a_row116_col8, #T_0502a_row117_col0, #T_0502a_row117_col1, #T_0502a_row117_col2, #T_0502a_row117_col3, #T_0502a_row117_col4, #T_0502a_row117_col5, #T_0502a_row117_col6, #T_0502a_row117_col7, #T_0502a_row117_col8, #T_0502a_row118_col0, #T_0502a_row118_col1, #T_0502a_row118_col2, #T_0502a_row118_col3, #T_0502a_row118_col4, #T_0502a_row118_col5, #T_0502a_row118_col6, #T_0502a_row118_col7, #T_0502a_row118_col8, #T_0502a_row119_col0, #T_0502a_row119_col1, #T_0502a_row119_col2, #T_0502a_row119_col3, #T_0502a_row119_col4, #T_0502a_row119_col5, #T_0502a_row119_col6, #T_0502a_row119_col7, #T_0502a_row119_col8, #T_0502a_row120_col0, #T_0502a_row120_col1, #T_0502a_row120_col2, #T_0502a_row120_col3, #T_0502a_row120_col4, #T_0502a_row120_col5, #T_0502a_row120_col6, #T_0502a_row120_col7, #T_0502a_row120_col8, #T_0502a_row121_col0, #T_0502a_row121_col1, #T_0502a_row121_col2, #T_0502a_row121_col3, #T_0502a_row121_col4, #T_0502a_row121_col5, #T_0502a_row121_col6, #T_0502a_row121_col7, #T_0502a_row121_col8, #T_0502a_row122_col0, #T_0502a_row122_col1, #T_0502a_row122_col2, #T_0502a_row122_col3, #T_0502a_row122_col4, #T_0502a_row122_col5, #T_0502a_row122_col6, #T_0502a_row122_col7, #T_0502a_row122_col8, #T_0502a_row123_col0, #T_0502a_row123_col1, #T_0502a_row123_col2, #T_0502a_row123_col3, #T_0502a_row123_col4, #T_0502a_row123_col5, #T_0502a_row123_col6, #T_0502a_row123_col7, #T_0502a_row123_col8, #T_0502a_row124_col0, #T_0502a_row124_col1, #T_0502a_row124_col2, #T_0502a_row124_col3, #T_0502a_row124_col4, #T_0502a_row124_col5, #T_0502a_row124_col6, #T_0502a_row124_col7, #T_0502a_row124_col8, #T_0502a_row125_col0, #T_0502a_row125_col1, #T_0502a_row125_col2, #T_0502a_row125_col3, #T_0502a_row125_col4, #T_0502a_row125_col5, 
#T_0502a_row125_col6, #T_0502a_row125_col7, #T_0502a_row125_col8, #T_0502a_row126_col0, #T_0502a_row126_col1, #T_0502a_row126_col2, #T_0502a_row126_col3, #T_0502a_row126_col4, #T_0502a_row126_col5, #T_0502a_row126_col6, #T_0502a_row126_col7, #T_0502a_row126_col8, #T_0502a_row127_col0, #T_0502a_row127_col1, #T_0502a_row127_col2, #T_0502a_row127_col3, #T_0502a_row127_col4, #T_0502a_row127_col5, #T_0502a_row127_col6, #T_0502a_row127_col7, #T_0502a_row127_col8, #T_0502a_row128_col0, #T_0502a_row128_col1, #T_0502a_row128_col2, #T_0502a_row128_col3, #T_0502a_row128_col4, #T_0502a_row128_col5, #T_0502a_row128_col6, #T_0502a_row128_col7, #T_0502a_row128_col8, #T_0502a_row129_col0, #T_0502a_row129_col1, #T_0502a_row129_col2, #T_0502a_row129_col3, #T_0502a_row129_col4, #T_0502a_row129_col5, #T_0502a_row129_col6, #T_0502a_row129_col7, #T_0502a_row129_col8, #T_0502a_row130_col0, #T_0502a_row130_col1, #T_0502a_row130_col2, #T_0502a_row130_col3, #T_0502a_row130_col4, #T_0502a_row130_col5, #T_0502a_row130_col6, #T_0502a_row130_col7, #T_0502a_row130_col8, #T_0502a_row131_col0, #T_0502a_row131_col1, #T_0502a_row131_col2, #T_0502a_row131_col3, #T_0502a_row131_col4, #T_0502a_row131_col5, #T_0502a_row131_col6, #T_0502a_row131_col7, #T_0502a_row131_col8, #T_0502a_row132_col0, #T_0502a_row132_col1, #T_0502a_row132_col2, #T_0502a_row132_col3, #T_0502a_row132_col4, #T_0502a_row132_col5, #T_0502a_row132_col6, #T_0502a_row132_col7, #T_0502a_row132_col8, #T_0502a_row133_col0, #T_0502a_row133_col1, #T_0502a_row133_col2, #T_0502a_row133_col3, #T_0502a_row133_col4, #T_0502a_row133_col5, #T_0502a_row133_col6, #T_0502a_row133_col7, #T_0502a_row133_col8, #T_0502a_row134_col0, #T_0502a_row134_col1, #T_0502a_row134_col2, #T_0502a_row134_col3, #T_0502a_row134_col4, #T_0502a_row134_col5, #T_0502a_row134_col6, #T_0502a_row134_col7, #T_0502a_row134_col8, #T_0502a_row135_col0, #T_0502a_row135_col1, #T_0502a_row135_col2, #T_0502a_row135_col3, #T_0502a_row135_col4, #T_0502a_row135_col5, 
#T_0502a_row135_col6, #T_0502a_row135_col7, #T_0502a_row135_col8, #T_0502a_row136_col0, #T_0502a_row136_col1, #T_0502a_row136_col2, #T_0502a_row136_col3, #T_0502a_row136_col4, #T_0502a_row136_col5, #T_0502a_row136_col6, #T_0502a_row136_col7, #T_0502a_row136_col8, #T_0502a_row137_col0, #T_0502a_row137_col1, #T_0502a_row137_col2, #T_0502a_row137_col3, #T_0502a_row137_col4, #T_0502a_row137_col5, #T_0502a_row137_col6, #T_0502a_row137_col7, #T_0502a_row137_col8, #T_0502a_row138_col0, #T_0502a_row138_col1, #T_0502a_row138_col2, #T_0502a_row138_col3, #T_0502a_row138_col4, #T_0502a_row138_col5, #T_0502a_row138_col6, #T_0502a_row138_col7, #T_0502a_row138_col8, #T_0502a_row139_col0, #T_0502a_row139_col1, #T_0502a_row139_col2, #T_0502a_row139_col3, #T_0502a_row139_col4, #T_0502a_row139_col5, #T_0502a_row139_col6, #T_0502a_row139_col7, #T_0502a_row139_col8, #T_0502a_row140_col0, #T_0502a_row140_col1, #T_0502a_row140_col2, #T_0502a_row140_col3, #T_0502a_row140_col4, #T_0502a_row140_col5, #T_0502a_row140_col6, #T_0502a_row140_col7, #T_0502a_row140_col8, #T_0502a_row141_col0, #T_0502a_row141_col1, #T_0502a_row141_col2, #T_0502a_row141_col3, #T_0502a_row141_col4, #T_0502a_row141_col5, #T_0502a_row141_col6, #T_0502a_row141_col7, #T_0502a_row141_col8, #T_0502a_row142_col0, #T_0502a_row142_col1, #T_0502a_row142_col2, #T_0502a_row142_col3, #T_0502a_row142_col4, #T_0502a_row142_col5, #T_0502a_row142_col6, #T_0502a_row142_col7, #T_0502a_row142_col8, #T_0502a_row143_col0, #T_0502a_row143_col1, #T_0502a_row143_col2, #T_0502a_row143_col3, #T_0502a_row143_col4, #T_0502a_row143_col5, #T_0502a_row143_col6, #T_0502a_row143_col7, #T_0502a_row143_col8, #T_0502a_row144_col0, #T_0502a_row144_col1, #T_0502a_row144_col2, #T_0502a_row144_col3, #T_0502a_row144_col4, #T_0502a_row144_col5, #T_0502a_row144_col6, #T_0502a_row144_col7, #T_0502a_row144_col8, #T_0502a_row145_col0, #T_0502a_row145_col1, #T_0502a_row145_col2, #T_0502a_row145_col3, #T_0502a_row145_col4, #T_0502a_row145_col5, 
#T_0502a_row145_col6, #T_0502a_row145_col7, #T_0502a_row145_col8, #T_0502a_row146_col0, #T_0502a_row146_col1, #T_0502a_row146_col2, #T_0502a_row146_col3, #T_0502a_row146_col4, #T_0502a_row146_col5, #T_0502a_row146_col6, #T_0502a_row146_col7, #T_0502a_row146_col8, #T_0502a_row147_col0, #T_0502a_row147_col1, #T_0502a_row147_col2, #T_0502a_row147_col3, #T_0502a_row147_col4, #T_0502a_row147_col5, #T_0502a_row147_col6, #T_0502a_row147_col7, #T_0502a_row147_col8, #T_0502a_row148_col0, #T_0502a_row148_col1, #T_0502a_row148_col2, #T_0502a_row148_col3, #T_0502a_row148_col4, #T_0502a_row148_col5, #T_0502a_row148_col6, #T_0502a_row148_col7, #T_0502a_row148_col8, #T_0502a_row149_col0, #T_0502a_row149_col1, #T_0502a_row149_col2, #T_0502a_row149_col3, #T_0502a_row149_col4, #T_0502a_row149_col5, #T_0502a_row149_col6, #T_0502a_row149_col7, #T_0502a_row149_col8, #T_0502a_row150_col0, #T_0502a_row150_col1, #T_0502a_row150_col2, #T_0502a_row150_col3, #T_0502a_row150_col4, #T_0502a_row150_col5, #T_0502a_row150_col6, #T_0502a_row150_col7, #T_0502a_row150_col8, #T_0502a_row151_col0, #T_0502a_row151_col1, #T_0502a_row151_col2, #T_0502a_row151_col3, #T_0502a_row151_col4, #T_0502a_row151_col5, #T_0502a_row151_col6, #T_0502a_row151_col7, #T_0502a_row151_col8, #T_0502a_row152_col0, #T_0502a_row152_col1, #T_0502a_row152_col2, #T_0502a_row152_col3, #T_0502a_row152_col4, #T_0502a_row152_col5, #T_0502a_row152_col6, #T_0502a_row152_col7, #T_0502a_row152_col8, #T_0502a_row153_col0, #T_0502a_row153_col1, #T_0502a_row153_col2, #T_0502a_row153_col3, #T_0502a_row153_col4, #T_0502a_row153_col5, #T_0502a_row153_col6, #T_0502a_row153_col7, #T_0502a_row153_col8, #T_0502a_row154_col0, #T_0502a_row154_col1, #T_0502a_row154_col2, #T_0502a_row154_col3, #T_0502a_row154_col4, #T_0502a_row154_col5, #T_0502a_row154_col6, #T_0502a_row154_col7, #T_0502a_row154_col8, #T_0502a_row155_col0, #T_0502a_row155_col1, #T_0502a_row155_col2, #T_0502a_row155_col3, #T_0502a_row155_col4, #T_0502a_row155_col5, 
#T_0502a_row155_col6, #T_0502a_row155_col7, #T_0502a_row155_col8, #T_0502a_row156_col0, #T_0502a_row156_col1, #T_0502a_row156_col2, #T_0502a_row156_col3, #T_0502a_row156_col4, #T_0502a_row156_col5, #T_0502a_row156_col6, #T_0502a_row156_col7, #T_0502a_row156_col8, #T_0502a_row157_col0, #T_0502a_row157_col1, #T_0502a_row157_col2, #T_0502a_row157_col3, #T_0502a_row157_col4, #T_0502a_row157_col5, #T_0502a_row157_col6, #T_0502a_row157_col7, #T_0502a_row157_col8, #T_0502a_row158_col0, #T_0502a_row158_col1, #T_0502a_row158_col2, #T_0502a_row158_col3, #T_0502a_row158_col4, #T_0502a_row158_col5, #T_0502a_row158_col6, #T_0502a_row158_col7, #T_0502a_row158_col8, #T_0502a_row159_col0, #T_0502a_row159_col1, #T_0502a_row159_col2, #T_0502a_row159_col3, #T_0502a_row159_col4, #T_0502a_row159_col5, #T_0502a_row159_col6, #T_0502a_row159_col7, #T_0502a_row159_col8, #T_0502a_row160_col0, #T_0502a_row160_col1, #T_0502a_row160_col2, #T_0502a_row160_col3, #T_0502a_row160_col4, #T_0502a_row160_col5, #T_0502a_row160_col6, #T_0502a_row160_col7, #T_0502a_row160_col8, #T_0502a_row161_col0, #T_0502a_row161_col1, #T_0502a_row161_col2, #T_0502a_row161_col3, #T_0502a_row161_col4, #T_0502a_row161_col5, #T_0502a_row161_col6, #T_0502a_row161_col7, #T_0502a_row161_col8, #T_0502a_row162_col0, #T_0502a_row162_col1, #T_0502a_row162_col2, #T_0502a_row162_col3, #T_0502a_row162_col4, #T_0502a_row162_col5, #T_0502a_row162_col6, #T_0502a_row162_col7, #T_0502a_row162_col8, #T_0502a_row163_col0, #T_0502a_row163_col1, #T_0502a_row163_col2, #T_0502a_row163_col3, #T_0502a_row163_col4, #T_0502a_row163_col5, #T_0502a_row163_col6, #T_0502a_row163_col7, #T_0502a_row163_col8, #T_0502a_row164_col0, #T_0502a_row164_col1, #T_0502a_row164_col2, #T_0502a_row164_col3, #T_0502a_row164_col4, #T_0502a_row164_col5, #T_0502a_row164_col6, #T_0502a_row164_col7, #T_0502a_row164_col8, #T_0502a_row165_col0, #T_0502a_row165_col1, #T_0502a_row165_col2, #T_0502a_row165_col3, #T_0502a_row165_col4, #T_0502a_row165_col5, 
#T_0502a_row165_col6, #T_0502a_row165_col7, #T_0502a_row165_col8, #T_0502a_row166_col0, #T_0502a_row166_col1, #T_0502a_row166_col2, #T_0502a_row166_col3, #T_0502a_row166_col4, #T_0502a_row166_col5, #T_0502a_row166_col6, #T_0502a_row166_col7, #T_0502a_row166_col8, #T_0502a_row167_col0, #T_0502a_row167_col1, #T_0502a_row167_col2, #T_0502a_row167_col3, #T_0502a_row167_col4, #T_0502a_row167_col5, #T_0502a_row167_col6, #T_0502a_row167_col7, #T_0502a_row167_col8, #T_0502a_row168_col0, #T_0502a_row168_col1, #T_0502a_row168_col2, #T_0502a_row168_col3, #T_0502a_row168_col4, #T_0502a_row168_col5, #T_0502a_row168_col6, #T_0502a_row168_col7, #T_0502a_row168_col8, #T_0502a_row169_col0, #T_0502a_row169_col1, #T_0502a_row169_col2, #T_0502a_row169_col3, #T_0502a_row169_col4, #T_0502a_row169_col5, #T_0502a_row169_col6, #T_0502a_row169_col7, #T_0502a_row169_col8, #T_0502a_row170_col0, #T_0502a_row170_col1, #T_0502a_row170_col2, #T_0502a_row170_col3, #T_0502a_row170_col4, #T_0502a_row170_col5, #T_0502a_row170_col6, #T_0502a_row170_col7, #T_0502a_row170_col8, #T_0502a_row171_col0, #T_0502a_row171_col1, #T_0502a_row171_col2, #T_0502a_row171_col3, #T_0502a_row171_col4, #T_0502a_row171_col5, #T_0502a_row171_col6, #T_0502a_row171_col7, #T_0502a_row171_col8, #T_0502a_row172_col0, #T_0502a_row172_col1, #T_0502a_row172_col2, #T_0502a_row172_col3, #T_0502a_row172_col4, #T_0502a_row172_col5, #T_0502a_row172_col6, #T_0502a_row172_col7, #T_0502a_row172_col8, #T_0502a_row173_col0, #T_0502a_row173_col1, #T_0502a_row173_col2, #T_0502a_row173_col3, #T_0502a_row173_col4, #T_0502a_row173_col5, #T_0502a_row173_col6, #T_0502a_row173_col7, #T_0502a_row173_col8, #T_0502a_row174_col0, #T_0502a_row174_col1, #T_0502a_row174_col2, #T_0502a_row174_col3, #T_0502a_row174_col4, #T_0502a_row174_col5, #T_0502a_row174_col6, #T_0502a_row174_col7, #T_0502a_row174_col8, #T_0502a_row175_col0, #T_0502a_row175_col1, #T_0502a_row175_col2, #T_0502a_row175_col3, #T_0502a_row175_col4, #T_0502a_row175_col5, 
#T_0502a_row175_col6, #T_0502a_row175_col7, #T_0502a_row175_col8, #T_0502a_row176_col0, #T_0502a_row176_col1, #T_0502a_row176_col2, #T_0502a_row176_col3, #T_0502a_row176_col4, #T_0502a_row176_col5, #T_0502a_row176_col6, #T_0502a_row176_col7, #T_0502a_row176_col8, #T_0502a_row177_col0, #T_0502a_row177_col1, #T_0502a_row177_col2, #T_0502a_row177_col3, #T_0502a_row177_col4, #T_0502a_row177_col5, #T_0502a_row177_col6, #T_0502a_row177_col7, #T_0502a_row177_col8, #T_0502a_row178_col0, #T_0502a_row178_col1, #T_0502a_row178_col2, #T_0502a_row178_col3, #T_0502a_row178_col4, #T_0502a_row178_col5, #T_0502a_row178_col6, #T_0502a_row178_col7, #T_0502a_row178_col8, #T_0502a_row179_col0, #T_0502a_row179_col1, #T_0502a_row179_col2, #T_0502a_row179_col3, #T_0502a_row179_col4, #T_0502a_row179_col5, #T_0502a_row179_col6, #T_0502a_row179_col7, #T_0502a_row179_col8, #T_0502a_row180_col0, #T_0502a_row180_col1, #T_0502a_row180_col2, #T_0502a_row180_col3, #T_0502a_row180_col4, #T_0502a_row180_col5, #T_0502a_row180_col6, #T_0502a_row180_col7, #T_0502a_row180_col8, #T_0502a_row181_col0, #T_0502a_row181_col1, #T_0502a_row181_col2, #T_0502a_row181_col3, #T_0502a_row181_col4, #T_0502a_row181_col5, #T_0502a_row181_col6, #T_0502a_row181_col7, #T_0502a_row181_col8, #T_0502a_row182_col0, #T_0502a_row182_col1, #T_0502a_row182_col2, #T_0502a_row182_col3, #T_0502a_row182_col4, #T_0502a_row182_col5, #T_0502a_row182_col6, #T_0502a_row182_col7, #T_0502a_row182_col8, #T_0502a_row183_col0, #T_0502a_row183_col1, #T_0502a_row183_col2, #T_0502a_row183_col3, #T_0502a_row183_col4, #T_0502a_row183_col5, #T_0502a_row183_col6, #T_0502a_row183_col7, #T_0502a_row183_col8, #T_0502a_row184_col0, #T_0502a_row184_col1, #T_0502a_row184_col2, #T_0502a_row184_col3, #T_0502a_row184_col4, #T_0502a_row184_col5, #T_0502a_row184_col6, #T_0502a_row184_col7, #T_0502a_row184_col8, #T_0502a_row185_col0, #T_0502a_row185_col1, #T_0502a_row185_col2, #T_0502a_row185_col3, #T_0502a_row185_col4, #T_0502a_row185_col5, 
#T_0502a_row185_col6, #T_0502a_row185_col7, #T_0502a_row185_col8, #T_0502a_row186_col0, #T_0502a_row186_col1, #T_0502a_row186_col2, #T_0502a_row186_col3, #T_0502a_row186_col4, #T_0502a_row186_col5, #T_0502a_row186_col6, #T_0502a_row186_col7, #T_0502a_row186_col8, #T_0502a_row187_col0, #T_0502a_row187_col1, #T_0502a_row187_col2, #T_0502a_row187_col3, #T_0502a_row187_col4, #T_0502a_row187_col5, #T_0502a_row187_col6, #T_0502a_row187_col7, #T_0502a_row187_col8, #T_0502a_row188_col0, #T_0502a_row188_col1, #T_0502a_row188_col2, #T_0502a_row188_col3, #T_0502a_row188_col4, #T_0502a_row188_col5, #T_0502a_row188_col6, #T_0502a_row188_col7, #T_0502a_row188_col8, #T_0502a_row189_col0, #T_0502a_row189_col1, #T_0502a_row189_col2, #T_0502a_row189_col3, #T_0502a_row189_col4, #T_0502a_row189_col5, #T_0502a_row189_col6, #T_0502a_row189_col7, #T_0502a_row189_col8, #T_0502a_row190_col0, #T_0502a_row190_col1, #T_0502a_row190_col2, #T_0502a_row190_col3, #T_0502a_row190_col4, #T_0502a_row190_col5, #T_0502a_row190_col6, #T_0502a_row190_col7, #T_0502a_row190_col8, #T_0502a_row191_col0, #T_0502a_row191_col1, #T_0502a_row191_col2, #T_0502a_row191_col3, #T_0502a_row191_col4, #T_0502a_row191_col5, #T_0502a_row191_col6, #T_0502a_row191_col7, #T_0502a_row191_col8, #T_0502a_row192_col0, #T_0502a_row192_col1, #T_0502a_row192_col2, #T_0502a_row192_col3, #T_0502a_row192_col4, #T_0502a_row192_col5, #T_0502a_row192_col6, #T_0502a_row192_col7, #T_0502a_row192_col8, #T_0502a_row193_col0, #T_0502a_row193_col1, #T_0502a_row193_col2, #T_0502a_row193_col3, #T_0502a_row193_col4, #T_0502a_row193_col5, #T_0502a_row193_col6, #T_0502a_row193_col7, #T_0502a_row193_col8, #T_0502a_row194_col0, #T_0502a_row194_col1, #T_0502a_row194_col2, #T_0502a_row194_col3, #T_0502a_row194_col4, #T_0502a_row194_col5, #T_0502a_row194_col6, #T_0502a_row194_col7, #T_0502a_row194_col8 {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "</style>\n",
-       "<table id=\"T_0502a\">\n",
-       "  <thead>\n",
-       "    <tr>\n",
-       "      <th id=\"T_0502a_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
-       "      <th id=\"T_0502a_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
-       "      <th id=\"T_0502a_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
-       "      <th id=\"T_0502a_level0_col3\" class=\"col_heading level0 col3\" >Has Figure</th>\n",
-       "      <th id=\"T_0502a_level0_col4\" class=\"col_heading level0 col4\" >Has Table</th>\n",
-       "      <th id=\"T_0502a_level0_col5\" class=\"col_heading level0 col5\" >Required Inputs</th>\n",
-       "      <th id=\"T_0502a_level0_col6\" class=\"col_heading level0 col6\" >Params</th>\n",
-       "      <th id=\"T_0502a_level0_col7\" class=\"col_heading level0 col7\" >Tags</th>\n",
-       "      <th id=\"T_0502a_level0_col8\" class=\"col_heading level0 col8\" >Tasks</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row0_col0\" class=\"data row0 col0\" >validmind.data_validation.ACFandPACFPlot</td>\n",
-       "      <td id=\"T_0502a_row0_col1\" class=\"data row0 col1\" >AC Fand PACF Plot</td>\n",
-       "      <td id=\"T_0502a_row0_col2\" class=\"data row0 col2\" >Analyzes time series data using Autocorrelation Function (ACF) and Partial Autocorrelation Function (PACF) plots to...</td>\n",
-       "      <td id=\"T_0502a_row0_col3\" class=\"data row0 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row0_col4\" class=\"data row0 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row0_col5\" class=\"data row0 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row0_col6\" class=\"data row0 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row0_col7\" class=\"data row0 col7\" >['time_series_data', 'forecasting', 'statistical_test', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row0_col8\" class=\"data row0 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row1_col0\" class=\"data row1 col0\" >validmind.data_validation.ADF</td>\n",
-       "      <td id=\"T_0502a_row1_col1\" class=\"data row1 col1\" >ADF</td>\n",
-       "      <td id=\"T_0502a_row1_col2\" class=\"data row1 col2\" >Assesses the stationarity of a time series dataset using the Augmented Dickey-Fuller (ADF) test....</td>\n",
-       "      <td id=\"T_0502a_row1_col3\" class=\"data row1 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row1_col4\" class=\"data row1 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row1_col5\" class=\"data row1 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row1_col6\" class=\"data row1 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row1_col7\" class=\"data row1 col7\" >['time_series_data', 'statsmodels', 'forecasting', 'statistical_test', 'stationarity']</td>\n",
-       "      <td id=\"T_0502a_row1_col8\" class=\"data row1 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row2_col0\" class=\"data row2 col0\" >validmind.data_validation.AutoAR</td>\n",
-       "      <td id=\"T_0502a_row2_col1\" class=\"data row2 col1\" >Auto AR</td>\n",
-       "      <td id=\"T_0502a_row2_col2\" class=\"data row2 col2\" >Automatically identifies the optimal Autoregressive (AR) order for a time series using BIC and AIC criteria....</td>\n",
-       "      <td id=\"T_0502a_row2_col3\" class=\"data row2 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row2_col4\" class=\"data row2 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row2_col5\" class=\"data row2 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row2_col6\" class=\"data row2 col6\" >{'max_ar_order': {'type': 'int', 'default': 3}}</td>\n",
-       "      <td id=\"T_0502a_row2_col7\" class=\"data row2 col7\" >['time_series_data', 'statsmodels', 'forecasting', 'statistical_test']</td>\n",
-       "      <td id=\"T_0502a_row2_col8\" class=\"data row2 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row3_col0\" class=\"data row3 col0\" >validmind.data_validation.AutoMA</td>\n",
-       "      <td id=\"T_0502a_row3_col1\" class=\"data row3 col1\" >Auto MA</td>\n",
-       "      <td id=\"T_0502a_row3_col2\" class=\"data row3 col2\" >Automatically selects the optimal Moving Average (MA) order for each variable in a time series dataset based on...</td>\n",
-       "      <td id=\"T_0502a_row3_col3\" class=\"data row3 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row3_col4\" class=\"data row3 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row3_col5\" class=\"data row3 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row3_col6\" class=\"data row3 col6\" >{'max_ma_order': {'type': 'int', 'default': 3}}</td>\n",
-       "      <td id=\"T_0502a_row3_col7\" class=\"data row3 col7\" >['time_series_data', 'statsmodels', 'forecasting', 'statistical_test']</td>\n",
-       "      <td id=\"T_0502a_row3_col8\" class=\"data row3 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row4_col0\" class=\"data row4 col0\" >validmind.data_validation.AutoStationarity</td>\n",
-       "      <td id=\"T_0502a_row4_col1\" class=\"data row4 col1\" >Auto Stationarity</td>\n",
-       "      <td id=\"T_0502a_row4_col2\" class=\"data row4 col2\" >Automates Augmented Dickey-Fuller test to assess stationarity across multiple time series in a DataFrame....</td>\n",
-       "      <td id=\"T_0502a_row4_col3\" class=\"data row4 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row4_col4\" class=\"data row4 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row4_col5\" class=\"data row4 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row4_col6\" class=\"data row4 col6\" >{'max_order': {'type': 'int', 'default': 5}, 'threshold': {'type': 'float', 'default': 0.05}}</td>\n",
-       "      <td id=\"T_0502a_row4_col7\" class=\"data row4 col7\" >['time_series_data', 'statsmodels', 'forecasting', 'statistical_test']</td>\n",
-       "      <td id=\"T_0502a_row4_col8\" class=\"data row4 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row5_col0\" class=\"data row5 col0\" >validmind.data_validation.BivariateScatterPlots</td>\n",
-       "      <td id=\"T_0502a_row5_col1\" class=\"data row5 col1\" >Bivariate Scatter Plots</td>\n",
-       "      <td id=\"T_0502a_row5_col2\" class=\"data row5 col2\" >Generates bivariate scatterplots to visually inspect relationships between pairs of numerical predictor variables...</td>\n",
-       "      <td id=\"T_0502a_row5_col3\" class=\"data row5 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row5_col4\" class=\"data row5 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row5_col5\" class=\"data row5 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row5_col6\" class=\"data row5 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row5_col7\" class=\"data row5 col7\" >['tabular_data', 'numerical_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row5_col8\" class=\"data row5 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row6_col0\" class=\"data row6 col0\" >validmind.data_validation.BoxPierce</td>\n",
-       "      <td id=\"T_0502a_row6_col1\" class=\"data row6 col1\" >Box Pierce</td>\n",
-       "      <td id=\"T_0502a_row6_col2\" class=\"data row6 col2\" >Detects autocorrelation in time-series data through the Box-Pierce test to validate model performance....</td>\n",
-       "      <td id=\"T_0502a_row6_col3\" class=\"data row6 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row6_col4\" class=\"data row6 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row6_col5\" class=\"data row6 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row6_col6\" class=\"data row6 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row6_col7\" class=\"data row6 col7\" >['time_series_data', 'forecasting', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_0502a_row6_col8\" class=\"data row6 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row7_col0\" class=\"data row7 col0\" >validmind.data_validation.ChiSquaredFeaturesTable</td>\n",
-       "      <td id=\"T_0502a_row7_col1\" class=\"data row7 col1\" >Chi Squared Features Table</td>\n",
-       "      <td id=\"T_0502a_row7_col2\" class=\"data row7 col2\" >Assesses the statistical association between categorical features and a target variable using the Chi-Squared test....</td>\n",
-       "      <td id=\"T_0502a_row7_col3\" class=\"data row7 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row7_col4\" class=\"data row7 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row7_col5\" class=\"data row7 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row7_col6\" class=\"data row7 col6\" >{'p_threshold': {'type': '_empty', 'default': 0.05}}</td>\n",
-       "      <td id=\"T_0502a_row7_col7\" class=\"data row7 col7\" >['tabular_data', 'categorical_data', 'statistical_test']</td>\n",
-       "      <td id=\"T_0502a_row7_col8\" class=\"data row7 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row8_col0\" class=\"data row8 col0\" >validmind.data_validation.ClassImbalance</td>\n",
-       "      <td id=\"T_0502a_row8_col1\" class=\"data row8 col1\" >Class Imbalance</td>\n",
-       "      <td id=\"T_0502a_row8_col2\" class=\"data row8 col2\" >Evaluates and quantifies class distribution imbalance in a dataset used by a machine learning model....</td>\n",
-       "      <td id=\"T_0502a_row8_col3\" class=\"data row8 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row8_col4\" class=\"data row8 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row8_col5\" class=\"data row8 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row8_col6\" class=\"data row8 col6\" >{'min_percent_threshold': {'type': 'int', 'default': 10}}</td>\n",
-       "      <td id=\"T_0502a_row8_col7\" class=\"data row8 col7\" >['tabular_data', 'binary_classification', 'multiclass_classification', 'data_quality']</td>\n",
-       "      <td id=\"T_0502a_row8_col8\" class=\"data row8 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row9_col0\" class=\"data row9 col0\" >validmind.data_validation.DatasetDescription</td>\n",
-       "      <td id=\"T_0502a_row9_col1\" class=\"data row9 col1\" >Dataset Description</td>\n",
-       "      <td id=\"T_0502a_row9_col2\" class=\"data row9 col2\" >Provides comprehensive analysis and statistical summaries of each column in a machine learning model's dataset....</td>\n",
-       "      <td id=\"T_0502a_row9_col3\" class=\"data row9 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row9_col4\" class=\"data row9 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row9_col5\" class=\"data row9 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row9_col6\" class=\"data row9 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row9_col7\" class=\"data row9 col7\" >['tabular_data', 'time_series_data', 'text_data']</td>\n",
-       "      <td id=\"T_0502a_row9_col8\" class=\"data row9 col8\" >['classification', 'regression', 'text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row10_col0\" class=\"data row10 col0\" >validmind.data_validation.DatasetSplit</td>\n",
-       "      <td id=\"T_0502a_row10_col1\" class=\"data row10 col1\" >Dataset Split</td>\n",
-       "      <td id=\"T_0502a_row10_col2\" class=\"data row10 col2\" >Evaluates and visualizes the distribution proportions among training, testing, and validation datasets of an ML...</td>\n",
-       "      <td id=\"T_0502a_row10_col3\" class=\"data row10 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row10_col4\" class=\"data row10 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row10_col5\" class=\"data row10 col5\" >['datasets']</td>\n",
-       "      <td id=\"T_0502a_row10_col6\" class=\"data row10 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row10_col7\" class=\"data row10 col7\" >['tabular_data', 'time_series_data', 'text_data']</td>\n",
-       "      <td id=\"T_0502a_row10_col8\" class=\"data row10 col8\" >['classification', 'regression', 'text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row11_col0\" class=\"data row11 col0\" >validmind.data_validation.DescriptiveStatistics</td>\n",
-       "      <td id=\"T_0502a_row11_col1\" class=\"data row11 col1\" >Descriptive Statistics</td>\n",
-       "      <td id=\"T_0502a_row11_col2\" class=\"data row11 col2\" >Performs a detailed descriptive statistical analysis of both numerical and categorical data within a model's...</td>\n",
-       "      <td id=\"T_0502a_row11_col3\" class=\"data row11 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row11_col4\" class=\"data row11 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row11_col5\" class=\"data row11 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row11_col6\" class=\"data row11 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row11_col7\" class=\"data row11 col7\" >['tabular_data', 'time_series_data', 'data_quality']</td>\n",
-       "      <td id=\"T_0502a_row11_col8\" class=\"data row11 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row12_col0\" class=\"data row12 col0\" >validmind.data_validation.DickeyFullerGLS</td>\n",
-       "      <td id=\"T_0502a_row12_col1\" class=\"data row12 col1\" >Dickey Fuller GLS</td>\n",
-       "      <td id=\"T_0502a_row12_col2\" class=\"data row12 col2\" >Assesses stationarity in time series data using the Dickey-Fuller GLS test to determine the order of integration....</td>\n",
-       "      <td id=\"T_0502a_row12_col3\" class=\"data row12 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row12_col4\" class=\"data row12 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row12_col5\" class=\"data row12 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row12_col6\" class=\"data row12 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row12_col7\" class=\"data row12 col7\" >['time_series_data', 'forecasting', 'unit_root_test']</td>\n",
-       "      <td id=\"T_0502a_row12_col8\" class=\"data row12 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row13_col0\" class=\"data row13 col0\" >validmind.data_validation.Duplicates</td>\n",
-       "      <td id=\"T_0502a_row13_col1\" class=\"data row13 col1\" >Duplicates</td>\n",
-       "      <td id=\"T_0502a_row13_col2\" class=\"data row13 col2\" >Tests dataset for duplicate entries, ensuring model reliability via data quality verification....</td>\n",
-       "      <td id=\"T_0502a_row13_col3\" class=\"data row13 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row13_col4\" class=\"data row13 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row13_col5\" class=\"data row13 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row13_col6\" class=\"data row13 col6\" >{'min_threshold': {'type': '_empty', 'default': 1}}</td>\n",
-       "      <td id=\"T_0502a_row13_col7\" class=\"data row13 col7\" >['tabular_data', 'data_quality', 'text_data']</td>\n",
-       "      <td id=\"T_0502a_row13_col8\" class=\"data row13 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row14_col0\" class=\"data row14 col0\" >validmind.data_validation.EngleGrangerCoint</td>\n",
-       "      <td id=\"T_0502a_row14_col1\" class=\"data row14 col1\" >Engle Granger Coint</td>\n",
-       "      <td id=\"T_0502a_row14_col2\" class=\"data row14 col2\" >Assesses the degree of co-movement between pairs of time series data using the Engle-Granger cointegration test....</td>\n",
-       "      <td id=\"T_0502a_row14_col3\" class=\"data row14 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row14_col4\" class=\"data row14 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row14_col5\" class=\"data row14 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row14_col6\" class=\"data row14 col6\" >{'threshold': {'type': 'float', 'default': 0.05}}</td>\n",
-       "      <td id=\"T_0502a_row14_col7\" class=\"data row14 col7\" >['time_series_data', 'statistical_test', 'forecasting']</td>\n",
-       "      <td id=\"T_0502a_row14_col8\" class=\"data row14 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row15_col0\" class=\"data row15 col0\" >validmind.data_validation.FeatureTargetCorrelationPlot</td>\n",
-       "      <td id=\"T_0502a_row15_col1\" class=\"data row15 col1\" >Feature Target Correlation Plot</td>\n",
-       "      <td id=\"T_0502a_row15_col2\" class=\"data row15 col2\" >Visualizes the correlation between input features and the model's target output in a color-coded horizontal bar...</td>\n",
-       "      <td id=\"T_0502a_row15_col3\" class=\"data row15 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row15_col4\" class=\"data row15 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row15_col5\" class=\"data row15 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row15_col6\" class=\"data row15 col6\" >{'fig_height': {'type': '_empty', 'default': 600}}</td>\n",
-       "      <td id=\"T_0502a_row15_col7\" class=\"data row15 col7\" >['tabular_data', 'visualization', 'correlation']</td>\n",
-       "      <td id=\"T_0502a_row15_col8\" class=\"data row15 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row16_col0\" class=\"data row16 col0\" >validmind.data_validation.HighCardinality</td>\n",
-       "      <td id=\"T_0502a_row16_col1\" class=\"data row16 col1\" >High Cardinality</td>\n",
-       "      <td id=\"T_0502a_row16_col2\" class=\"data row16 col2\" >Assesses the number of unique values in categorical columns to detect high cardinality and potential overfitting....</td>\n",
-       "      <td id=\"T_0502a_row16_col3\" class=\"data row16 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row16_col4\" class=\"data row16 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row16_col5\" class=\"data row16 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row16_col6\" class=\"data row16 col6\" >{'num_threshold': {'type': 'int', 'default': 100}, 'percent_threshold': {'type': 'float', 'default': 0.1}, 'threshold_type': {'type': 'str', 'default': 'percent'}}</td>\n",
-       "      <td id=\"T_0502a_row16_col7\" class=\"data row16 col7\" >['tabular_data', 'data_quality', 'categorical_data']</td>\n",
-       "      <td id=\"T_0502a_row16_col8\" class=\"data row16 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row17_col0\" class=\"data row17 col0\" >validmind.data_validation.HighPearsonCorrelation</td>\n",
-       "      <td id=\"T_0502a_row17_col1\" class=\"data row17 col1\" >High Pearson Correlation</td>\n",
-       "      <td id=\"T_0502a_row17_col2\" class=\"data row17 col2\" >Identifies highly correlated feature pairs in a dataset suggesting feature redundancy or multicollinearity....</td>\n",
-       "      <td id=\"T_0502a_row17_col3\" class=\"data row17 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row17_col4\" class=\"data row17 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row17_col5\" class=\"data row17 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row17_col6\" class=\"data row17 col6\" >{'max_threshold': {'type': 'float', 'default': 0.3}, 'top_n_correlations': {'type': 'int', 'default': 10}, 'feature_columns': {'type': 'list', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row17_col7\" class=\"data row17 col7\" >['tabular_data', 'data_quality', 'correlation']</td>\n",
-       "      <td id=\"T_0502a_row17_col8\" class=\"data row17 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row18_col0\" class=\"data row18 col0\" >validmind.data_validation.IQROutliersBarPlot</td>\n",
-       "      <td id=\"T_0502a_row18_col1\" class=\"data row18 col1\" >IQR Outliers Bar Plot</td>\n",
-       "      <td id=\"T_0502a_row18_col2\" class=\"data row18 col2\" >Visualizes outlier distribution across percentiles in numerical data using the Interquartile Range (IQR) method....</td>\n",
-       "      <td id=\"T_0502a_row18_col3\" class=\"data row18 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row18_col4\" class=\"data row18 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row18_col5\" class=\"data row18 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row18_col6\" class=\"data row18 col6\" >{'threshold': {'type': 'float', 'default': 1.5}, 'fig_width': {'type': 'int', 'default': 800}}</td>\n",
-       "      <td id=\"T_0502a_row18_col7\" class=\"data row18 col7\" >['tabular_data', 'visualization', 'numerical_data']</td>\n",
-       "      <td id=\"T_0502a_row18_col8\" class=\"data row18 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row19_col0\" class=\"data row19 col0\" >validmind.data_validation.IQROutliersTable</td>\n",
-       "      <td id=\"T_0502a_row19_col1\" class=\"data row19 col1\" >IQR Outliers Table</td>\n",
-       "      <td id=\"T_0502a_row19_col2\" class=\"data row19 col2\" >Determines and summarizes outliers in numerical features using the Interquartile Range method....</td>\n",
-       "      <td id=\"T_0502a_row19_col3\" class=\"data row19 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row19_col4\" class=\"data row19 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row19_col5\" class=\"data row19 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row19_col6\" class=\"data row19 col6\" >{'threshold': {'type': 'float', 'default': 1.5}}</td>\n",
-       "      <td id=\"T_0502a_row19_col7\" class=\"data row19 col7\" >['tabular_data', 'numerical_data']</td>\n",
-       "      <td id=\"T_0502a_row19_col8\" class=\"data row19 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row20_col0\" class=\"data row20 col0\" >validmind.data_validation.IsolationForestOutliers</td>\n",
-       "      <td id=\"T_0502a_row20_col1\" class=\"data row20 col1\" >Isolation Forest Outliers</td>\n",
-       "      <td id=\"T_0502a_row20_col2\" class=\"data row20 col2\" >Detects outliers in a dataset using the Isolation Forest algorithm and visualizes results through scatter plots....</td>\n",
-       "      <td id=\"T_0502a_row20_col3\" class=\"data row20 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row20_col4\" class=\"data row20 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row20_col5\" class=\"data row20 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row20_col6\" class=\"data row20 col6\" >{'random_state': {'type': 'int', 'default': 0}, 'contamination': {'type': 'float', 'default': 0.1}, 'feature_columns': {'type': 'list', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row20_col7\" class=\"data row20 col7\" >['tabular_data', 'anomaly_detection']</td>\n",
-       "      <td id=\"T_0502a_row20_col8\" class=\"data row20 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row21_col0\" class=\"data row21 col0\" >validmind.data_validation.JarqueBera</td>\n",
-       "      <td id=\"T_0502a_row21_col1\" class=\"data row21 col1\" >Jarque Bera</td>\n",
-       "      <td id=\"T_0502a_row21_col2\" class=\"data row21 col2\" >Assesses normality of dataset features in an ML model using the Jarque-Bera test....</td>\n",
-       "      <td id=\"T_0502a_row21_col3\" class=\"data row21 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row21_col4\" class=\"data row21 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row21_col5\" class=\"data row21 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row21_col6\" class=\"data row21 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row21_col7\" class=\"data row21 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_0502a_row21_col8\" class=\"data row21 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row22_col0\" class=\"data row22 col0\" >validmind.data_validation.KPSS</td>\n",
-       "      <td id=\"T_0502a_row22_col1\" class=\"data row22 col1\" >KPSS</td>\n",
-       "      <td id=\"T_0502a_row22_col2\" class=\"data row22 col2\" >Assesses the stationarity of time-series data in a machine learning model using the KPSS unit root test....</td>\n",
-       "      <td id=\"T_0502a_row22_col3\" class=\"data row22 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row22_col4\" class=\"data row22 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row22_col5\" class=\"data row22 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row22_col6\" class=\"data row22 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row22_col7\" class=\"data row22 col7\" >['time_series_data', 'stationarity', 'unit_root_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_0502a_row22_col8\" class=\"data row22 col8\" >['data_validation']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row23_col0\" class=\"data row23 col0\" >validmind.data_validation.LJungBox</td>\n",
-       "      <td id=\"T_0502a_row23_col1\" class=\"data row23 col1\" >L Jung Box</td>\n",
-       "      <td id=\"T_0502a_row23_col2\" class=\"data row23 col2\" >Assesses autocorrelations in dataset features by performing a Ljung-Box test on each feature....</td>\n",
-       "      <td id=\"T_0502a_row23_col3\" class=\"data row23 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row23_col4\" class=\"data row23 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row23_col5\" class=\"data row23 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row23_col6\" class=\"data row23 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row23_col7\" class=\"data row23 col7\" >['time_series_data', 'forecasting', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_0502a_row23_col8\" class=\"data row23 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row24_col0\" class=\"data row24 col0\" >validmind.data_validation.LaggedCorrelationHeatmap</td>\n",
-       "      <td id=\"T_0502a_row24_col1\" class=\"data row24 col1\" >Lagged Correlation Heatmap</td>\n",
-       "      <td id=\"T_0502a_row24_col2\" class=\"data row24 col2\" >Assesses and visualizes correlation between target variable and lagged independent variables in a time-series...</td>\n",
-       "      <td id=\"T_0502a_row24_col3\" class=\"data row24 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row24_col4\" class=\"data row24 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row24_col5\" class=\"data row24 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row24_col6\" class=\"data row24 col6\" >{'num_lags': {'type': 'int', 'default': 10}}</td>\n",
-       "      <td id=\"T_0502a_row24_col7\" class=\"data row24 col7\" >['time_series_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row24_col8\" class=\"data row24 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row25_col0\" class=\"data row25 col0\" >validmind.data_validation.MissingValues</td>\n",
-       "      <td id=\"T_0502a_row25_col1\" class=\"data row25 col1\" >Missing Values</td>\n",
-       "      <td id=\"T_0502a_row25_col2\" class=\"data row25 col2\" >Evaluates dataset quality by ensuring missing value ratio across all features does not exceed a set threshold....</td>\n",
-       "      <td id=\"T_0502a_row25_col3\" class=\"data row25 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row25_col4\" class=\"data row25 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row25_col5\" class=\"data row25 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row25_col6\" class=\"data row25 col6\" >{'min_threshold': {'type': 'int', 'default': 1}}</td>\n",
-       "      <td id=\"T_0502a_row25_col7\" class=\"data row25 col7\" >['tabular_data', 'data_quality']</td>\n",
-       "      <td id=\"T_0502a_row25_col8\" class=\"data row25 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row26_col0\" class=\"data row26 col0\" >validmind.data_validation.MissingValuesBarPlot</td>\n",
-       "      <td id=\"T_0502a_row26_col1\" class=\"data row26 col1\" >Missing Values Bar Plot</td>\n",
-       "      <td id=\"T_0502a_row26_col2\" class=\"data row26 col2\" >Assesses the percentage and distribution of missing values in the dataset via a bar plot, with emphasis on...</td>\n",
-       "      <td id=\"T_0502a_row26_col3\" class=\"data row26 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row26_col4\" class=\"data row26 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row26_col5\" class=\"data row26 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row26_col6\" class=\"data row26 col6\" >{'threshold': {'type': 'int', 'default': 80}, 'fig_height': {'type': 'int', 'default': 600}}</td>\n",
-       "      <td id=\"T_0502a_row26_col7\" class=\"data row26 col7\" >['tabular_data', 'data_quality', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row26_col8\" class=\"data row26 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row27_col0\" class=\"data row27 col0\" >validmind.data_validation.MutualInformation</td>\n",
-       "      <td id=\"T_0502a_row27_col1\" class=\"data row27 col1\" >Mutual Information</td>\n",
-       "      <td id=\"T_0502a_row27_col2\" class=\"data row27 col2\" >Calculates mutual information scores between features and target variable to evaluate feature relevance....</td>\n",
-       "      <td id=\"T_0502a_row27_col3\" class=\"data row27 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row27_col4\" class=\"data row27 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row27_col5\" class=\"data row27 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row27_col6\" class=\"data row27 col6\" >{'min_threshold': {'type': 'float', 'default': 0.01}, 'task': {'type': 'str', 'default': 'classification'}}</td>\n",
-       "      <td id=\"T_0502a_row27_col7\" class=\"data row27 col7\" >['feature_selection', 'data_analysis']</td>\n",
-       "      <td id=\"T_0502a_row27_col8\" class=\"data row27 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row28_col0\" class=\"data row28 col0\" >validmind.data_validation.PearsonCorrelationMatrix</td>\n",
-       "      <td id=\"T_0502a_row28_col1\" class=\"data row28 col1\" >Pearson Correlation Matrix</td>\n",
-       "      <td id=\"T_0502a_row28_col2\" class=\"data row28 col2\" >Evaluates linear dependency between numerical variables in a dataset via a Pearson Correlation coefficient heat map....</td>\n",
-       "      <td id=\"T_0502a_row28_col3\" class=\"data row28 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row28_col4\" class=\"data row28 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row28_col5\" class=\"data row28 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row28_col6\" class=\"data row28 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row28_col7\" class=\"data row28 col7\" >['tabular_data', 'numerical_data', 'correlation']</td>\n",
-       "      <td id=\"T_0502a_row28_col8\" class=\"data row28 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row29_col0\" class=\"data row29 col0\" >validmind.data_validation.PhillipsPerronArch</td>\n",
-       "      <td id=\"T_0502a_row29_col1\" class=\"data row29 col1\" >Phillips Perron Arch</td>\n",
-       "      <td id=\"T_0502a_row29_col2\" class=\"data row29 col2\" >Assesses the stationarity of time series data in each feature of the ML model using the Phillips-Perron test....</td>\n",
-       "      <td id=\"T_0502a_row29_col3\" class=\"data row29 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row29_col4\" class=\"data row29 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row29_col5\" class=\"data row29 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row29_col6\" class=\"data row29 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row29_col7\" class=\"data row29 col7\" >['time_series_data', 'forecasting', 'statistical_test', 'unit_root_test']</td>\n",
-       "      <td id=\"T_0502a_row29_col8\" class=\"data row29 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row30_col0\" class=\"data row30 col0\" >validmind.data_validation.ProtectedClassesDescription</td>\n",
-       "      <td id=\"T_0502a_row30_col1\" class=\"data row30 col1\" >Protected Classes Description</td>\n",
-       "      <td id=\"T_0502a_row30_col2\" class=\"data row30 col2\" >Visualizes the distribution of protected classes in the dataset relative to the target variable...</td>\n",
-       "      <td id=\"T_0502a_row30_col3\" class=\"data row30 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row30_col4\" class=\"data row30 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row30_col5\" class=\"data row30 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row30_col6\" class=\"data row30 col6\" >{'protected_classes': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row30_col7\" class=\"data row30 col7\" >['bias_and_fairness', 'descriptive_statistics']</td>\n",
-       "      <td id=\"T_0502a_row30_col8\" class=\"data row30 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row31_col0\" class=\"data row31 col0\" >validmind.data_validation.RollingStatsPlot</td>\n",
-       "      <td id=\"T_0502a_row31_col1\" class=\"data row31 col1\" >Rolling Stats Plot</td>\n",
-       "      <td id=\"T_0502a_row31_col2\" class=\"data row31 col2\" >Evaluates the stationarity of time series data by plotting its rolling mean and standard deviation over a specified...</td>\n",
-       "      <td id=\"T_0502a_row31_col3\" class=\"data row31 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row31_col4\" class=\"data row31 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row31_col5\" class=\"data row31 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row31_col6\" class=\"data row31 col6\" >{'window_size': {'type': 'int', 'default': 12}}</td>\n",
-       "      <td id=\"T_0502a_row31_col7\" class=\"data row31 col7\" >['time_series_data', 'visualization', 'stationarity']</td>\n",
-       "      <td id=\"T_0502a_row31_col8\" class=\"data row31 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row32_col0\" class=\"data row32 col0\" >validmind.data_validation.RunsTest</td>\n",
-       "      <td id=\"T_0502a_row32_col1\" class=\"data row32 col1\" >Runs Test</td>\n",
-       "      <td id=\"T_0502a_row32_col2\" class=\"data row32 col2\" >Executes Runs Test on ML model to detect non-random patterns in output data sequence....</td>\n",
-       "      <td id=\"T_0502a_row32_col3\" class=\"data row32 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row32_col4\" class=\"data row32 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row32_col5\" class=\"data row32 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row32_col6\" class=\"data row32 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row32_col7\" class=\"data row32 col7\" >['tabular_data', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_0502a_row32_col8\" class=\"data row32 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row33_col0\" class=\"data row33 col0\" >validmind.data_validation.ScatterPlot</td>\n",
-       "      <td id=\"T_0502a_row33_col1\" class=\"data row33 col1\" >Scatter Plot</td>\n",
-       "      <td id=\"T_0502a_row33_col2\" class=\"data row33 col2\" >Assesses visual relationships, patterns, and outliers among features in a dataset through scatter plot matrices....</td>\n",
-       "      <td id=\"T_0502a_row33_col3\" class=\"data row33 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row33_col4\" class=\"data row33 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row33_col5\" class=\"data row33 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row33_col6\" class=\"data row33 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row33_col7\" class=\"data row33 col7\" >['tabular_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row33_col8\" class=\"data row33 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row34_col0\" class=\"data row34 col0\" >validmind.data_validation.ScoreBandDefaultRates</td>\n",
-       "      <td id=\"T_0502a_row34_col1\" class=\"data row34 col1\" >Score Band Default Rates</td>\n",
-       "      <td id=\"T_0502a_row34_col2\" class=\"data row34 col2\" >Analyzes default rates and population distribution across credit score bands....</td>\n",
-       "      <td id=\"T_0502a_row34_col3\" class=\"data row34 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row34_col4\" class=\"data row34 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row34_col5\" class=\"data row34 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row34_col6\" class=\"data row34 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'score_bands': {'type': 'list', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row34_col7\" class=\"data row34 col7\" >['visualization', 'credit_risk', 'scorecard']</td>\n",
-       "      <td id=\"T_0502a_row34_col8\" class=\"data row34 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row35_col0\" class=\"data row35 col0\" >validmind.data_validation.SeasonalDecompose</td>\n",
-       "      <td id=\"T_0502a_row35_col1\" class=\"data row35 col1\" >Seasonal Decompose</td>\n",
-       "      <td id=\"T_0502a_row35_col2\" class=\"data row35 col2\" >Assesses patterns and seasonality in a time series dataset by decomposing its features into foundational components....</td>\n",
-       "      <td id=\"T_0502a_row35_col3\" class=\"data row35 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row35_col4\" class=\"data row35 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row35_col5\" class=\"data row35 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row35_col6\" class=\"data row35 col6\" >{'seasonal_model': {'type': 'str', 'default': 'additive'}}</td>\n",
-       "      <td id=\"T_0502a_row35_col7\" class=\"data row35 col7\" >['time_series_data', 'seasonality', 'statsmodels']</td>\n",
-       "      <td id=\"T_0502a_row35_col8\" class=\"data row35 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row36_col0\" class=\"data row36 col0\" >validmind.data_validation.ShapiroWilk</td>\n",
-       "      <td id=\"T_0502a_row36_col1\" class=\"data row36 col1\" >Shapiro Wilk</td>\n",
-       "      <td id=\"T_0502a_row36_col2\" class=\"data row36 col2\" >Evaluates feature-wise normality of training data using the Shapiro-Wilk test....</td>\n",
-       "      <td id=\"T_0502a_row36_col3\" class=\"data row36 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row36_col4\" class=\"data row36 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row36_col5\" class=\"data row36 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row36_col6\" class=\"data row36 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row36_col7\" class=\"data row36 col7\" >['tabular_data', 'data_distribution', 'statistical_test']</td>\n",
-       "      <td id=\"T_0502a_row36_col8\" class=\"data row36 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row37_col0\" class=\"data row37 col0\" >validmind.data_validation.Skewness</td>\n",
-       "      <td id=\"T_0502a_row37_col1\" class=\"data row37 col1\" >Skewness</td>\n",
-       "      <td id=\"T_0502a_row37_col2\" class=\"data row37 col2\" >Evaluates the skewness of numerical data in a dataset to check against a defined threshold, aiming to ensure data...</td>\n",
-       "      <td id=\"T_0502a_row37_col3\" class=\"data row37 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row37_col4\" class=\"data row37 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row37_col5\" class=\"data row37 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row37_col6\" class=\"data row37 col6\" >{'max_threshold': {'type': '_empty', 'default': 1}}</td>\n",
-       "      <td id=\"T_0502a_row37_col7\" class=\"data row37 col7\" >['data_quality', 'tabular_data']</td>\n",
-       "      <td id=\"T_0502a_row37_col8\" class=\"data row37 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row38_col0\" class=\"data row38 col0\" >validmind.data_validation.SpreadPlot</td>\n",
-       "      <td id=\"T_0502a_row38_col1\" class=\"data row38 col1\" >Spread Plot</td>\n",
-       "      <td id=\"T_0502a_row38_col2\" class=\"data row38 col2\" >Assesses potential correlations between pairs of time series variables through visualization to enhance...</td>\n",
-       "      <td id=\"T_0502a_row38_col3\" class=\"data row38 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row38_col4\" class=\"data row38 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row38_col5\" class=\"data row38 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row38_col6\" class=\"data row38 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row38_col7\" class=\"data row38 col7\" >['time_series_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row38_col8\" class=\"data row38 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row39_col0\" class=\"data row39 col0\" >validmind.data_validation.TabularCategoricalBarPlots</td>\n",
-       "      <td id=\"T_0502a_row39_col1\" class=\"data row39 col1\" >Tabular Categorical Bar Plots</td>\n",
-       "      <td id=\"T_0502a_row39_col2\" class=\"data row39 col2\" >Generates and visualizes bar plots for each category in categorical features to evaluate the dataset's composition....</td>\n",
-       "      <td id=\"T_0502a_row39_col3\" class=\"data row39 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row39_col4\" class=\"data row39 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row39_col5\" class=\"data row39 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row39_col6\" class=\"data row39 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row39_col7\" class=\"data row39 col7\" >['tabular_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row39_col8\" class=\"data row39 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row40_col0\" class=\"data row40 col0\" >validmind.data_validation.TabularDateTimeHistograms</td>\n",
-       "      <td id=\"T_0502a_row40_col1\" class=\"data row40 col1\" >Tabular Date Time Histograms</td>\n",
-       "      <td id=\"T_0502a_row40_col2\" class=\"data row40 col2\" >Generates histograms to provide graphical insight into the distribution of time intervals in a model's datetime...</td>\n",
-       "      <td id=\"T_0502a_row40_col3\" class=\"data row40 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row40_col4\" class=\"data row40 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row40_col5\" class=\"data row40 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row40_col6\" class=\"data row40 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row40_col7\" class=\"data row40 col7\" >['time_series_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row40_col8\" class=\"data row40 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row41_col0\" class=\"data row41 col0\" >validmind.data_validation.TabularDescriptionTables</td>\n",
-       "      <td id=\"T_0502a_row41_col1\" class=\"data row41 col1\" >Tabular Description Tables</td>\n",
-       "      <td id=\"T_0502a_row41_col2\" class=\"data row41 col2\" >Summarizes key descriptive statistics for numerical, categorical, and datetime variables in a dataset....</td>\n",
-       "      <td id=\"T_0502a_row41_col3\" class=\"data row41 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row41_col4\" class=\"data row41 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row41_col5\" class=\"data row41 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row41_col6\" class=\"data row41 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row41_col7\" class=\"data row41 col7\" >['tabular_data']</td>\n",
-       "      <td id=\"T_0502a_row41_col8\" class=\"data row41 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row42_col0\" class=\"data row42 col0\" >validmind.data_validation.TabularNumericalHistograms</td>\n",
-       "      <td id=\"T_0502a_row42_col1\" class=\"data row42 col1\" >Tabular Numerical Histograms</td>\n",
-       "      <td id=\"T_0502a_row42_col2\" class=\"data row42 col2\" >Generates histograms for each numerical feature in a dataset to provide visual insights into data distribution and...</td>\n",
-       "      <td id=\"T_0502a_row42_col3\" class=\"data row42 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row42_col4\" class=\"data row42 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row42_col5\" class=\"data row42 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row42_col6\" class=\"data row42 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row42_col7\" class=\"data row42 col7\" >['tabular_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row42_col8\" class=\"data row42 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row43_col0\" class=\"data row43 col0\" >validmind.data_validation.TargetRateBarPlots</td>\n",
-       "      <td id=\"T_0502a_row43_col1\" class=\"data row43 col1\" >Target Rate Bar Plots</td>\n",
-       "      <td id=\"T_0502a_row43_col2\" class=\"data row43 col2\" >Generates bar plots visualizing the default rates of categorical features for a classification machine learning...</td>\n",
-       "      <td id=\"T_0502a_row43_col3\" class=\"data row43 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row43_col4\" class=\"data row43 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row43_col5\" class=\"data row43 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row43_col6\" class=\"data row43 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row43_col7\" class=\"data row43 col7\" >['tabular_data', 'visualization', 'categorical_data']</td>\n",
-       "      <td id=\"T_0502a_row43_col8\" class=\"data row43 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row44_col0\" class=\"data row44 col0\" >validmind.data_validation.TimeSeriesDescription</td>\n",
-       "      <td id=\"T_0502a_row44_col1\" class=\"data row44 col1\" >Time Series Description</td>\n",
-       "      <td id=\"T_0502a_row44_col2\" class=\"data row44 col2\" >Generates a detailed analysis for the provided time series dataset, summarizing key statistics to identify trends,...</td>\n",
-       "      <td id=\"T_0502a_row44_col3\" class=\"data row44 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row44_col4\" class=\"data row44 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row44_col5\" class=\"data row44 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row44_col6\" class=\"data row44 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row44_col7\" class=\"data row44 col7\" >['time_series_data', 'analysis']</td>\n",
-       "      <td id=\"T_0502a_row44_col8\" class=\"data row44 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row45_col0\" class=\"data row45 col0\" >validmind.data_validation.TimeSeriesDescriptiveStatistics</td>\n",
-       "      <td id=\"T_0502a_row45_col1\" class=\"data row45 col1\" >Time Series Descriptive Statistics</td>\n",
-       "      <td id=\"T_0502a_row45_col2\" class=\"data row45 col2\" >Evaluates the descriptive statistics of a time series dataset to identify trends, patterns, and data quality issues....</td>\n",
-       "      <td id=\"T_0502a_row45_col3\" class=\"data row45 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row45_col4\" class=\"data row45 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row45_col5\" class=\"data row45 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row45_col6\" class=\"data row45 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row45_col7\" class=\"data row45 col7\" >['time_series_data', 'analysis']</td>\n",
-       "      <td id=\"T_0502a_row45_col8\" class=\"data row45 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row46_col0\" class=\"data row46 col0\" >validmind.data_validation.TimeSeriesFrequency</td>\n",
-       "      <td id=\"T_0502a_row46_col1\" class=\"data row46 col1\" >Time Series Frequency</td>\n",
-       "      <td id=\"T_0502a_row46_col2\" class=\"data row46 col2\" >Evaluates consistency of time series data frequency and generates a frequency plot....</td>\n",
-       "      <td id=\"T_0502a_row46_col3\" class=\"data row46 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row46_col4\" class=\"data row46 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row46_col5\" class=\"data row46 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row46_col6\" class=\"data row46 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row46_col7\" class=\"data row46 col7\" >['time_series_data']</td>\n",
-       "      <td id=\"T_0502a_row46_col8\" class=\"data row46 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row47_col0\" class=\"data row47 col0\" >validmind.data_validation.TimeSeriesHistogram</td>\n",
-       "      <td id=\"T_0502a_row47_col1\" class=\"data row47 col1\" >Time Series Histogram</td>\n",
-       "      <td id=\"T_0502a_row47_col2\" class=\"data row47 col2\" >Visualizes distribution of time-series data using histograms and Kernel Density Estimation (KDE) lines....</td>\n",
-       "      <td id=\"T_0502a_row47_col3\" class=\"data row47 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row47_col4\" class=\"data row47 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row47_col5\" class=\"data row47 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row47_col6\" class=\"data row47 col6\" >{'nbins': {'type': '_empty', 'default': 30}}</td>\n",
-       "      <td id=\"T_0502a_row47_col7\" class=\"data row47 col7\" >['data_validation', 'visualization', 'time_series_data']</td>\n",
-       "      <td id=\"T_0502a_row47_col8\" class=\"data row47 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row48_col0\" class=\"data row48 col0\" >validmind.data_validation.TimeSeriesLinePlot</td>\n",
-       "      <td id=\"T_0502a_row48_col1\" class=\"data row48 col1\" >Time Series Line Plot</td>\n",
-       "      <td id=\"T_0502a_row48_col2\" class=\"data row48 col2\" >Generates and analyses time-series data through line plots revealing trends, patterns, anomalies over time....</td>\n",
-       "      <td id=\"T_0502a_row48_col3\" class=\"data row48 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row48_col4\" class=\"data row48 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row48_col5\" class=\"data row48 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row48_col6\" class=\"data row48 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row48_col7\" class=\"data row48 col7\" >['time_series_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row48_col8\" class=\"data row48 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row49_col0\" class=\"data row49 col0\" >validmind.data_validation.TimeSeriesMissingValues</td>\n",
-       "      <td id=\"T_0502a_row49_col1\" class=\"data row49 col1\" >Time Series Missing Values</td>\n",
-       "      <td id=\"T_0502a_row49_col2\" class=\"data row49 col2\" >Validates time-series data quality by confirming the count of missing values is below a certain threshold....</td>\n",
-       "      <td id=\"T_0502a_row49_col3\" class=\"data row49 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row49_col4\" class=\"data row49 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row49_col5\" class=\"data row49 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row49_col6\" class=\"data row49 col6\" >{'min_threshold': {'type': 'int', 'default': 1}}</td>\n",
-       "      <td id=\"T_0502a_row49_col7\" class=\"data row49 col7\" >['time_series_data']</td>\n",
-       "      <td id=\"T_0502a_row49_col8\" class=\"data row49 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row50_col0\" class=\"data row50 col0\" >validmind.data_validation.TimeSeriesOutliers</td>\n",
-       "      <td id=\"T_0502a_row50_col1\" class=\"data row50 col1\" >Time Series Outliers</td>\n",
-       "      <td id=\"T_0502a_row50_col2\" class=\"data row50 col2\" >Identifies and visualizes outliers in time-series data using the z-score method....</td>\n",
-       "      <td id=\"T_0502a_row50_col3\" class=\"data row50 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row50_col4\" class=\"data row50 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row50_col5\" class=\"data row50 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row50_col6\" class=\"data row50 col6\" >{'zscore_threshold': {'type': 'int', 'default': 3}}</td>\n",
-       "      <td id=\"T_0502a_row50_col7\" class=\"data row50 col7\" >['time_series_data']</td>\n",
-       "      <td id=\"T_0502a_row50_col8\" class=\"data row50 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row51_col0\" class=\"data row51 col0\" >validmind.data_validation.TooManyZeroValues</td>\n",
-       "      <td id=\"T_0502a_row51_col1\" class=\"data row51 col1\" >Too Many Zero Values</td>\n",
-       "      <td id=\"T_0502a_row51_col2\" class=\"data row51 col2\" >Identifies numerical columns in a dataset that contain an excessive number of zero values, defined by a threshold...</td>\n",
-       "      <td id=\"T_0502a_row51_col3\" class=\"data row51 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row51_col4\" class=\"data row51 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row51_col5\" class=\"data row51 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row51_col6\" class=\"data row51 col6\" >{'max_percent_threshold': {'type': 'float', 'default': 0.03}}</td>\n",
-       "      <td id=\"T_0502a_row51_col7\" class=\"data row51 col7\" >['tabular_data']</td>\n",
-       "      <td id=\"T_0502a_row51_col8\" class=\"data row51 col8\" >['regression', 'classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row52_col0\" class=\"data row52 col0\" >validmind.data_validation.UniqueRows</td>\n",
-       "      <td id=\"T_0502a_row52_col1\" class=\"data row52 col1\" >Unique Rows</td>\n",
-       "      <td id=\"T_0502a_row52_col2\" class=\"data row52 col2\" >Verifies the diversity of the dataset by ensuring that the count of unique rows exceeds a prescribed threshold....</td>\n",
-       "      <td id=\"T_0502a_row52_col3\" class=\"data row52 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row52_col4\" class=\"data row52 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row52_col5\" class=\"data row52 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row52_col6\" class=\"data row52 col6\" >{'min_percent_threshold': {'type': 'float', 'default': 1}}</td>\n",
-       "      <td id=\"T_0502a_row52_col7\" class=\"data row52 col7\" >['tabular_data']</td>\n",
-       "      <td id=\"T_0502a_row52_col8\" class=\"data row52 col8\" >['regression', 'classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row53_col0\" class=\"data row53 col0\" >validmind.data_validation.WOEBinPlots</td>\n",
-       "      <td id=\"T_0502a_row53_col1\" class=\"data row53 col1\" >WOE Bin Plots</td>\n",
-       "      <td id=\"T_0502a_row53_col2\" class=\"data row53 col2\" >Generates visualizations of Weight of Evidence (WoE) and Information Value (IV) for understanding predictive power...</td>\n",
-       "      <td id=\"T_0502a_row53_col3\" class=\"data row53 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row53_col4\" class=\"data row53 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row53_col5\" class=\"data row53 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row53_col6\" class=\"data row53 col6\" >{'breaks_adj': {'type': 'list', 'default': None}, 'fig_height': {'type': 'int', 'default': 600}, 'fig_width': {'type': 'int', 'default': 500}}</td>\n",
-       "      <td id=\"T_0502a_row53_col7\" class=\"data row53 col7\" >['tabular_data', 'visualization', 'categorical_data']</td>\n",
-       "      <td id=\"T_0502a_row53_col8\" class=\"data row53 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row54_col0\" class=\"data row54 col0\" >validmind.data_validation.WOEBinTable</td>\n",
-       "      <td id=\"T_0502a_row54_col1\" class=\"data row54 col1\" >WOE Bin Table</td>\n",
-       "      <td id=\"T_0502a_row54_col2\" class=\"data row54 col2\" >Assesses the Weight of Evidence (WoE) and Information Value (IV) of each feature to evaluate its predictive power...</td>\n",
-       "      <td id=\"T_0502a_row54_col3\" class=\"data row54 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row54_col4\" class=\"data row54 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row54_col5\" class=\"data row54 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row54_col6\" class=\"data row54 col6\" >{'breaks_adj': {'type': 'list', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row54_col7\" class=\"data row54 col7\" >['tabular_data', 'categorical_data']</td>\n",
-       "      <td id=\"T_0502a_row54_col8\" class=\"data row54 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row55_col0\" class=\"data row55 col0\" >validmind.data_validation.ZivotAndrewsArch</td>\n",
-       "      <td id=\"T_0502a_row55_col1\" class=\"data row55 col1\" >Zivot Andrews Arch</td>\n",
-       "      <td id=\"T_0502a_row55_col2\" class=\"data row55 col2\" >Evaluates the order of integration and stationarity of time series data using the Zivot-Andrews unit root test....</td>\n",
-       "      <td id=\"T_0502a_row55_col3\" class=\"data row55 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row55_col4\" class=\"data row55 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row55_col5\" class=\"data row55 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row55_col6\" class=\"data row55 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row55_col7\" class=\"data row55 col7\" >['time_series_data', 'stationarity', 'unit_root_test']</td>\n",
-       "      <td id=\"T_0502a_row55_col8\" class=\"data row55 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row56_col0\" class=\"data row56 col0\" >validmind.data_validation.nlp.CommonWords</td>\n",
-       "      <td id=\"T_0502a_row56_col1\" class=\"data row56 col1\" >Common Words</td>\n",
-       "      <td id=\"T_0502a_row56_col2\" class=\"data row56 col2\" >Assesses the most frequent non-stopwords in a text column for identifying prevalent language patterns....</td>\n",
-       "      <td id=\"T_0502a_row56_col3\" class=\"data row56 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row56_col4\" class=\"data row56 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row56_col5\" class=\"data row56 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row56_col6\" class=\"data row56 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row56_col7\" class=\"data row56 col7\" >['nlp', 'text_data', 'visualization', 'frequency_analysis']</td>\n",
-       "      <td id=\"T_0502a_row56_col8\" class=\"data row56 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row57_col0\" class=\"data row57 col0\" >validmind.data_validation.nlp.Hashtags</td>\n",
-       "      <td id=\"T_0502a_row57_col1\" class=\"data row57 col1\" >Hashtags</td>\n",
-       "      <td id=\"T_0502a_row57_col2\" class=\"data row57 col2\" >Assesses hashtag frequency in a text column, highlighting usage trends and potential dataset bias or spam....</td>\n",
-       "      <td id=\"T_0502a_row57_col3\" class=\"data row57 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row57_col4\" class=\"data row57 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row57_col5\" class=\"data row57 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row57_col6\" class=\"data row57 col6\" >{'top_hashtags': {'type': 'int', 'default': 25}}</td>\n",
-       "      <td id=\"T_0502a_row57_col7\" class=\"data row57 col7\" >['nlp', 'text_data', 'visualization', 'frequency_analysis']</td>\n",
-       "      <td id=\"T_0502a_row57_col8\" class=\"data row57 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row58_col0\" class=\"data row58 col0\" >validmind.data_validation.nlp.LanguageDetection</td>\n",
-       "      <td id=\"T_0502a_row58_col1\" class=\"data row58 col1\" >Language Detection</td>\n",
-       "      <td id=\"T_0502a_row58_col2\" class=\"data row58 col2\" >Assesses the diversity of languages in a textual dataset by detecting and visualizing the distribution of languages....</td>\n",
-       "      <td id=\"T_0502a_row58_col3\" class=\"data row58 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row58_col4\" class=\"data row58 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row58_col5\" class=\"data row58 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row58_col6\" class=\"data row58 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row58_col7\" class=\"data row58 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row58_col8\" class=\"data row58 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row59_col0\" class=\"data row59 col0\" >validmind.data_validation.nlp.Mentions</td>\n",
-       "      <td id=\"T_0502a_row59_col1\" class=\"data row59 col1\" >Mentions</td>\n",
-       "      <td id=\"T_0502a_row59_col2\" class=\"data row59 col2\" >Calculates and visualizes frequencies of '@' prefixed mentions in a text-based dataset for NLP model analysis....</td>\n",
-       "      <td id=\"T_0502a_row59_col3\" class=\"data row59 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row59_col4\" class=\"data row59 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row59_col5\" class=\"data row59 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row59_col6\" class=\"data row59 col6\" >{'top_mentions': {'type': 'int', 'default': 25}}</td>\n",
-       "      <td id=\"T_0502a_row59_col7\" class=\"data row59 col7\" >['nlp', 'text_data', 'visualization', 'frequency_analysis']</td>\n",
-       "      <td id=\"T_0502a_row59_col8\" class=\"data row59 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row60_col0\" class=\"data row60 col0\" >validmind.data_validation.nlp.PolarityAndSubjectivity</td>\n",
-       "      <td id=\"T_0502a_row60_col1\" class=\"data row60 col1\" >Polarity And Subjectivity</td>\n",
-       "      <td id=\"T_0502a_row60_col2\" class=\"data row60 col2\" >Analyzes the polarity and subjectivity of text data within a given dataset to visualize the sentiment distribution....</td>\n",
-       "      <td id=\"T_0502a_row60_col3\" class=\"data row60 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row60_col4\" class=\"data row60 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row60_col5\" class=\"data row60 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row60_col6\" class=\"data row60 col6\" >{'threshold_subjectivity': {'type': '_empty', 'default': 0.5}, 'threshold_polarity': {'type': '_empty', 'default': 0}}</td>\n",
-       "      <td id=\"T_0502a_row60_col7\" class=\"data row60 col7\" >['nlp', 'text_data', 'data_validation']</td>\n",
-       "      <td id=\"T_0502a_row60_col8\" class=\"data row60 col8\" >['nlp']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row61_col0\" class=\"data row61 col0\" >validmind.data_validation.nlp.Punctuations</td>\n",
-       "      <td id=\"T_0502a_row61_col1\" class=\"data row61 col1\" >Punctuations</td>\n",
-       "      <td id=\"T_0502a_row61_col2\" class=\"data row61 col2\" >Analyzes and visualizes the frequency distribution of punctuation usage in a given text dataset....</td>\n",
-       "      <td id=\"T_0502a_row61_col3\" class=\"data row61 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row61_col4\" class=\"data row61 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row61_col5\" class=\"data row61 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row61_col6\" class=\"data row61 col6\" >{'count_mode': {'type': '_empty', 'default': 'token'}}</td>\n",
-       "      <td id=\"T_0502a_row61_col7\" class=\"data row61 col7\" >['nlp', 'text_data', 'visualization', 'frequency_analysis']</td>\n",
-       "      <td id=\"T_0502a_row61_col8\" class=\"data row61 col8\" >['text_classification', 'text_summarization', 'nlp']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row62_col0\" class=\"data row62 col0\" >validmind.data_validation.nlp.Sentiment</td>\n",
-       "      <td id=\"T_0502a_row62_col1\" class=\"data row62 col1\" >Sentiment</td>\n",
-       "      <td id=\"T_0502a_row62_col2\" class=\"data row62 col2\" >Analyzes the sentiment of text data within a dataset using the VADER sentiment analysis tool....</td>\n",
-       "      <td id=\"T_0502a_row62_col3\" class=\"data row62 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row62_col4\" class=\"data row62 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row62_col5\" class=\"data row62 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row62_col6\" class=\"data row62 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row62_col7\" class=\"data row62 col7\" >['nlp', 'text_data', 'data_validation']</td>\n",
-       "      <td id=\"T_0502a_row62_col8\" class=\"data row62 col8\" >['nlp']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row63_col0\" class=\"data row63 col0\" >validmind.data_validation.nlp.StopWords</td>\n",
-       "      <td id=\"T_0502a_row63_col1\" class=\"data row63 col1\" >Stop Words</td>\n",
-       "      <td id=\"T_0502a_row63_col2\" class=\"data row63 col2\" >Evaluates and visualizes the frequency of English stop words in a text dataset against a defined threshold....</td>\n",
-       "      <td id=\"T_0502a_row63_col3\" class=\"data row63 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row63_col4\" class=\"data row63 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row63_col5\" class=\"data row63 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row63_col6\" class=\"data row63 col6\" >{'min_percent_threshold': {'type': 'float', 'default': 0.5}, 'num_words': {'type': 'int', 'default': 25}}</td>\n",
-       "      <td id=\"T_0502a_row63_col7\" class=\"data row63 col7\" >['nlp', 'text_data', 'frequency_analysis', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row63_col8\" class=\"data row63 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row64_col0\" class=\"data row64 col0\" >validmind.data_validation.nlp.TextDescription</td>\n",
-       "      <td id=\"T_0502a_row64_col1\" class=\"data row64 col1\" >Text Description</td>\n",
-       "      <td id=\"T_0502a_row64_col2\" class=\"data row64 col2\" >Conducts comprehensive textual analysis on a dataset using NLTK to evaluate various parameters and generate...</td>\n",
-       "      <td id=\"T_0502a_row64_col3\" class=\"data row64 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row64_col4\" class=\"data row64 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row64_col5\" class=\"data row64 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row64_col6\" class=\"data row64 col6\" >{'unwanted_tokens': {'type': 'set', 'default': {'s', 'mrs', 'us', \"''\", ' ', 'ms', 'dr', 'dollar', '``', 'mr', \"'s\", \"s'\"}}, 'lang': {'type': 'str', 'default': 'english'}}</td>\n",
-       "      <td id=\"T_0502a_row64_col7\" class=\"data row64 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row64_col8\" class=\"data row64 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row65_col0\" class=\"data row65 col0\" >validmind.data_validation.nlp.Toxicity</td>\n",
-       "      <td id=\"T_0502a_row65_col1\" class=\"data row65 col1\" >Toxicity</td>\n",
-       "      <td id=\"T_0502a_row65_col2\" class=\"data row65 col2\" >Assesses the toxicity of text data within a dataset to visualize the distribution of toxicity scores....</td>\n",
-       "      <td id=\"T_0502a_row65_col3\" class=\"data row65 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row65_col4\" class=\"data row65 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row65_col5\" class=\"data row65 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row65_col6\" class=\"data row65 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row65_col7\" class=\"data row65 col7\" >['nlp', 'text_data', 'data_validation']</td>\n",
-       "      <td id=\"T_0502a_row65_col8\" class=\"data row65 col8\" >['nlp']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row66_col0\" class=\"data row66 col0\" >validmind.model_validation.BertScore</td>\n",
-       "      <td id=\"T_0502a_row66_col1\" class=\"data row66 col1\" >Bert Score</td>\n",
-       "      <td id=\"T_0502a_row66_col2\" class=\"data row66 col2\" >Assesses the quality of machine-generated text using BERTScore metrics and visualizes results through histograms...</td>\n",
-       "      <td id=\"T_0502a_row66_col3\" class=\"data row66 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row66_col4\" class=\"data row66 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row66_col5\" class=\"data row66 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row66_col6\" class=\"data row66 col6\" >{'evaluation_model': {'type': '_empty', 'default': 'distilbert-base-uncased'}}</td>\n",
-       "      <td id=\"T_0502a_row66_col7\" class=\"data row66 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row66_col8\" class=\"data row66 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row67_col0\" class=\"data row67 col0\" >validmind.model_validation.BleuScore</td>\n",
-       "      <td id=\"T_0502a_row67_col1\" class=\"data row67 col1\" >Bleu Score</td>\n",
-       "      <td id=\"T_0502a_row67_col2\" class=\"data row67 col2\" >Evaluates the quality of machine-generated text using BLEU metrics and visualizes the results through histograms...</td>\n",
-       "      <td id=\"T_0502a_row67_col3\" class=\"data row67 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row67_col4\" class=\"data row67 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row67_col5\" class=\"data row67 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row67_col6\" class=\"data row67 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row67_col7\" class=\"data row67 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row67_col8\" class=\"data row67 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row68_col0\" class=\"data row68 col0\" >validmind.model_validation.ClusterSizeDistribution</td>\n",
-       "      <td id=\"T_0502a_row68_col1\" class=\"data row68 col1\" >Cluster Size Distribution</td>\n",
-       "      <td id=\"T_0502a_row68_col2\" class=\"data row68 col2\" >Assesses the performance of clustering models by comparing the distribution of cluster sizes in model predictions...</td>\n",
-       "      <td id=\"T_0502a_row68_col3\" class=\"data row68 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row68_col4\" class=\"data row68 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row68_col5\" class=\"data row68 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row68_col6\" class=\"data row68 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row68_col7\" class=\"data row68 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row68_col8\" class=\"data row68 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row69_col0\" class=\"data row69 col0\" >validmind.model_validation.ContextualRecall</td>\n",
-       "      <td id=\"T_0502a_row69_col1\" class=\"data row69 col1\" >Contextual Recall</td>\n",
-       "      <td id=\"T_0502a_row69_col2\" class=\"data row69 col2\" >Evaluates a Natural Language Generation model's ability to generate contextually relevant and factually correct...</td>\n",
-       "      <td id=\"T_0502a_row69_col3\" class=\"data row69 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row69_col4\" class=\"data row69 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row69_col5\" class=\"data row69 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row69_col6\" class=\"data row69 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row69_col7\" class=\"data row69 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row69_col8\" class=\"data row69 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row70_col0\" class=\"data row70 col0\" >validmind.model_validation.FeaturesAUC</td>\n",
-       "      <td id=\"T_0502a_row70_col1\" class=\"data row70 col1\" >Features AUC</td>\n",
-       "      <td id=\"T_0502a_row70_col2\" class=\"data row70 col2\" >Evaluates the discriminatory power of each individual feature within a binary classification model by calculating...</td>\n",
-       "      <td id=\"T_0502a_row70_col3\" class=\"data row70 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row70_col4\" class=\"data row70 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row70_col5\" class=\"data row70 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row70_col6\" class=\"data row70 col6\" >{'fontsize': {'type': 'int', 'default': 12}, 'figure_height': {'type': 'int', 'default': 500}}</td>\n",
-       "      <td id=\"T_0502a_row70_col7\" class=\"data row70 col7\" >['feature_importance', 'AUC', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row70_col8\" class=\"data row70 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row71_col0\" class=\"data row71 col0\" >validmind.model_validation.MeteorScore</td>\n",
-       "      <td id=\"T_0502a_row71_col1\" class=\"data row71 col1\" >Meteor Score</td>\n",
-       "      <td id=\"T_0502a_row71_col2\" class=\"data row71 col2\" >Assesses the quality of machine-generated translations by comparing them to human-produced references using the...</td>\n",
-       "      <td id=\"T_0502a_row71_col3\" class=\"data row71 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row71_col4\" class=\"data row71 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row71_col5\" class=\"data row71 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row71_col6\" class=\"data row71 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row71_col7\" class=\"data row71 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row71_col8\" class=\"data row71 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row72_col0\" class=\"data row72 col0\" >validmind.model_validation.ModelMetadata</td>\n",
-       "      <td id=\"T_0502a_row72_col1\" class=\"data row72 col1\" >Model Metadata</td>\n",
-       "      <td id=\"T_0502a_row72_col2\" class=\"data row72 col2\" >Compare metadata of different models and generate a summary table with the results....</td>\n",
-       "      <td id=\"T_0502a_row72_col3\" class=\"data row72 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row72_col4\" class=\"data row72 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row72_col5\" class=\"data row72 col5\" >['model']</td>\n",
-       "      <td id=\"T_0502a_row72_col6\" class=\"data row72 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row72_col7\" class=\"data row72 col7\" >['model_training', 'metadata']</td>\n",
-       "      <td id=\"T_0502a_row72_col8\" class=\"data row72 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row73_col0\" class=\"data row73 col0\" >validmind.model_validation.ModelPredictionResiduals</td>\n",
-       "      <td id=\"T_0502a_row73_col1\" class=\"data row73 col1\" >Model Prediction Residuals</td>\n",
-       "      <td id=\"T_0502a_row73_col2\" class=\"data row73 col2\" >Assesses normality and behavior of residuals in regression models through visualization and statistical tests....</td>\n",
-       "      <td id=\"T_0502a_row73_col3\" class=\"data row73 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row73_col4\" class=\"data row73 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row73_col5\" class=\"data row73 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row73_col6\" class=\"data row73 col6\" >{'nbins': {'type': 'int', 'default': 100}, 'p_value_threshold': {'type': 'float', 'default': 0.05}, 'start_date': {'type': None, 'default': None}, 'end_date': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row73_col7\" class=\"data row73 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row73_col8\" class=\"data row73 col8\" >['residual_analysis', 'visualization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row74_col0\" class=\"data row74 col0\" >validmind.model_validation.RegardScore</td>\n",
-       "      <td id=\"T_0502a_row74_col1\" class=\"data row74 col1\" >Regard Score</td>\n",
-       "      <td id=\"T_0502a_row74_col2\" class=\"data row74 col2\" >Assesses the sentiment and potential biases in text generated by NLP models by computing and visualizing regard...</td>\n",
-       "      <td id=\"T_0502a_row74_col3\" class=\"data row74 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row74_col4\" class=\"data row74 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row74_col5\" class=\"data row74 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row74_col6\" class=\"data row74 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row74_col7\" class=\"data row74 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row74_col8\" class=\"data row74 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row75_col0\" class=\"data row75 col0\" >validmind.model_validation.RegressionResidualsPlot</td>\n",
-       "      <td id=\"T_0502a_row75_col1\" class=\"data row75 col1\" >Regression Residuals Plot</td>\n",
-       "      <td id=\"T_0502a_row75_col2\" class=\"data row75 col2\" >Evaluates regression model performance using residual distribution and actual vs. predicted plots....</td>\n",
-       "      <td id=\"T_0502a_row75_col3\" class=\"data row75 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row75_col4\" class=\"data row75 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row75_col5\" class=\"data row75 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row75_col6\" class=\"data row75 col6\" >{'bin_size': {'type': 'float', 'default': 0.1}}</td>\n",
-       "      <td id=\"T_0502a_row75_col7\" class=\"data row75 col7\" >['model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row75_col8\" class=\"data row75 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row76_col0\" class=\"data row76 col0\" >validmind.model_validation.RougeScore</td>\n",
-       "      <td id=\"T_0502a_row76_col1\" class=\"data row76 col1\" >Rouge Score</td>\n",
-       "      <td id=\"T_0502a_row76_col2\" class=\"data row76 col2\" >Assesses the quality of machine-generated text using ROUGE metrics and visualizes the results to provide...</td>\n",
-       "      <td id=\"T_0502a_row76_col3\" class=\"data row76 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row76_col4\" class=\"data row76 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row76_col5\" class=\"data row76 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row76_col6\" class=\"data row76 col6\" >{'metric': {'type': 'str', 'default': 'rouge-1'}}</td>\n",
-       "      <td id=\"T_0502a_row76_col7\" class=\"data row76 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row76_col8\" class=\"data row76 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row77_col0\" class=\"data row77 col0\" >validmind.model_validation.TimeSeriesPredictionWithCI</td>\n",
-       "      <td id=\"T_0502a_row77_col1\" class=\"data row77 col1\" >Time Series Prediction With CI</td>\n",
-       "      <td id=\"T_0502a_row77_col2\" class=\"data row77 col2\" >Assesses predictive accuracy and uncertainty in time series models, highlighting breaches beyond confidence...</td>\n",
-       "      <td id=\"T_0502a_row77_col3\" class=\"data row77 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row77_col4\" class=\"data row77 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row77_col5\" class=\"data row77 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row77_col6\" class=\"data row77 col6\" >{'confidence': {'type': 'float', 'default': 0.95}}</td>\n",
-       "      <td id=\"T_0502a_row77_col7\" class=\"data row77 col7\" >['model_predictions', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row77_col8\" class=\"data row77 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row78_col0\" class=\"data row78 col0\" >validmind.model_validation.TimeSeriesPredictionsPlot</td>\n",
-       "      <td id=\"T_0502a_row78_col1\" class=\"data row78 col1\" >Time Series Predictions Plot</td>\n",
-       "      <td id=\"T_0502a_row78_col2\" class=\"data row78 col2\" >Plot actual vs predicted values for time series data and generate a visual comparison for the model....</td>\n",
-       "      <td id=\"T_0502a_row78_col3\" class=\"data row78 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row78_col4\" class=\"data row78 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row78_col5\" class=\"data row78 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row78_col6\" class=\"data row78 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row78_col7\" class=\"data row78 col7\" >['model_predictions', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row78_col8\" class=\"data row78 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row79_col0\" class=\"data row79 col0\" >validmind.model_validation.TimeSeriesR2SquareBySegments</td>\n",
-       "      <td id=\"T_0502a_row79_col1\" class=\"data row79 col1\" >Time Series R2 Square By Segments</td>\n",
-       "      <td id=\"T_0502a_row79_col2\" class=\"data row79 col2\" >Evaluates the R-Squared values of regression models over specified time segments in time series data to assess...</td>\n",
-       "      <td id=\"T_0502a_row79_col3\" class=\"data row79 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row79_col4\" class=\"data row79 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row79_col5\" class=\"data row79 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row79_col6\" class=\"data row79 col6\" >{'segments': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row79_col7\" class=\"data row79 col7\" >['model_performance', 'sklearn']</td>\n",
-       "      <td id=\"T_0502a_row79_col8\" class=\"data row79 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row80_col0\" class=\"data row80 col0\" >validmind.model_validation.TokenDisparity</td>\n",
-       "      <td id=\"T_0502a_row80_col1\" class=\"data row80 col1\" >Token Disparity</td>\n",
-       "      <td id=\"T_0502a_row80_col2\" class=\"data row80 col2\" >Evaluates the token disparity between reference and generated texts, visualizing the results through histograms and...</td>\n",
-       "      <td id=\"T_0502a_row80_col3\" class=\"data row80 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row80_col4\" class=\"data row80 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row80_col5\" class=\"data row80 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row80_col6\" class=\"data row80 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row80_col7\" class=\"data row80 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row80_col8\" class=\"data row80 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row81_col0\" class=\"data row81 col0\" >validmind.model_validation.ToxicityScore</td>\n",
-       "      <td id=\"T_0502a_row81_col1\" class=\"data row81 col1\" >Toxicity Score</td>\n",
-       "      <td id=\"T_0502a_row81_col2\" class=\"data row81 col2\" >Assesses the toxicity levels of texts generated by NLP models to identify and mitigate harmful or offensive content....</td>\n",
-       "      <td id=\"T_0502a_row81_col3\" class=\"data row81 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row81_col4\" class=\"data row81 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row81_col5\" class=\"data row81 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row81_col6\" class=\"data row81 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row81_col7\" class=\"data row81 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row81_col8\" class=\"data row81 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row82_col0\" class=\"data row82 col0\" >validmind.model_validation.embeddings.ClusterDistribution</td>\n",
-       "      <td id=\"T_0502a_row82_col1\" class=\"data row82 col1\" >Cluster Distribution</td>\n",
-       "      <td id=\"T_0502a_row82_col2\" class=\"data row82 col2\" >Assesses the distribution of text embeddings across clusters produced by a model using KMeans clustering....</td>\n",
-       "      <td id=\"T_0502a_row82_col3\" class=\"data row82 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row82_col4\" class=\"data row82 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row82_col5\" class=\"data row82 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row82_col6\" class=\"data row82 col6\" >{'num_clusters': {'type': 'int', 'default': 5}}</td>\n",
-       "      <td id=\"T_0502a_row82_col7\" class=\"data row82 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row82_col8\" class=\"data row82 col8\" >['feature_extraction']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row83_col0\" class=\"data row83 col0\" >validmind.model_validation.embeddings.CosineSimilarityComparison</td>\n",
-       "      <td id=\"T_0502a_row83_col1\" class=\"data row83 col1\" >Cosine Similarity Comparison</td>\n",
-       "      <td id=\"T_0502a_row83_col2\" class=\"data row83 col2\" >Assesses the similarity between embeddings generated by different models using Cosine Similarity, providing both...</td>\n",
-       "      <td id=\"T_0502a_row83_col3\" class=\"data row83 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row83_col4\" class=\"data row83 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row83_col5\" class=\"data row83 col5\" >['dataset', 'models']</td>\n",
-       "      <td id=\"T_0502a_row83_col6\" class=\"data row83 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row83_col7\" class=\"data row83 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
-       "      <td id=\"T_0502a_row83_col8\" class=\"data row83 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row84_col0\" class=\"data row84 col0\" >validmind.model_validation.embeddings.CosineSimilarityDistribution</td>\n",
-       "      <td id=\"T_0502a_row84_col1\" class=\"data row84 col1\" >Cosine Similarity Distribution</td>\n",
-       "      <td id=\"T_0502a_row84_col2\" class=\"data row84 col2\" >Assesses the similarity between predicted text embeddings from a model using a Cosine Similarity distribution...</td>\n",
-       "      <td id=\"T_0502a_row84_col3\" class=\"data row84 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row84_col4\" class=\"data row84 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row84_col5\" class=\"data row84 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row84_col6\" class=\"data row84 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row84_col7\" class=\"data row84 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row84_col8\" class=\"data row84 col8\" >['feature_extraction']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row85_col0\" class=\"data row85 col0\" >validmind.model_validation.embeddings.CosineSimilarityHeatmap</td>\n",
-       "      <td id=\"T_0502a_row85_col1\" class=\"data row85 col1\" >Cosine Similarity Heatmap</td>\n",
-       "      <td id=\"T_0502a_row85_col2\" class=\"data row85 col2\" >Generates an interactive heatmap to visualize the cosine similarities among embeddings derived from a given model....</td>\n",
-       "      <td id=\"T_0502a_row85_col3\" class=\"data row85 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row85_col4\" class=\"data row85 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row85_col5\" class=\"data row85 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row85_col6\" class=\"data row85 col6\" >{'title': {'type': '_empty', 'default': 'Cosine Similarity Matrix'}, 'color': {'type': '_empty', 'default': 'Cosine Similarity'}, 'xaxis_title': {'type': '_empty', 'default': 'Index'}, 'yaxis_title': {'type': '_empty', 'default': 'Index'}, 'color_scale': {'type': '_empty', 'default': 'Blues'}}</td>\n",
-       "      <td id=\"T_0502a_row85_col7\" class=\"data row85 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
-       "      <td id=\"T_0502a_row85_col8\" class=\"data row85 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row86_col0\" class=\"data row86 col0\" >validmind.model_validation.embeddings.DescriptiveAnalytics</td>\n",
-       "      <td id=\"T_0502a_row86_col1\" class=\"data row86 col1\" >Descriptive Analytics</td>\n",
-       "      <td id=\"T_0502a_row86_col2\" class=\"data row86 col2\" >Evaluates statistical properties of text embeddings in an ML model via mean, median, and standard deviation...</td>\n",
-       "      <td id=\"T_0502a_row86_col3\" class=\"data row86 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row86_col4\" class=\"data row86 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row86_col5\" class=\"data row86 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row86_col6\" class=\"data row86 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row86_col7\" class=\"data row86 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row86_col8\" class=\"data row86 col8\" >['feature_extraction']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row87_col0\" class=\"data row87 col0\" >validmind.model_validation.embeddings.EmbeddingsVisualization2D</td>\n",
-       "      <td id=\"T_0502a_row87_col1\" class=\"data row87 col1\" >Embeddings Visualization2 D</td>\n",
-       "      <td id=\"T_0502a_row87_col2\" class=\"data row87 col2\" >Visualizes 2D representation of text embeddings generated by a model using t-SNE technique....</td>\n",
-       "      <td id=\"T_0502a_row87_col3\" class=\"data row87 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row87_col4\" class=\"data row87 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row87_col5\" class=\"data row87 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row87_col6\" class=\"data row87 col6\" >{'cluster_column': {'type': None, 'default': None}, 'perplexity': {'type': 'int', 'default': 30}}</td>\n",
-       "      <td id=\"T_0502a_row87_col7\" class=\"data row87 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row87_col8\" class=\"data row87 col8\" >['feature_extraction']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row88_col0\" class=\"data row88 col0\" >validmind.model_validation.embeddings.EuclideanDistanceComparison</td>\n",
-       "      <td id=\"T_0502a_row88_col1\" class=\"data row88 col1\" >Euclidean Distance Comparison</td>\n",
-       "      <td id=\"T_0502a_row88_col2\" class=\"data row88 col2\" >Assesses and visualizes the dissimilarity between model embeddings using Euclidean distance, providing insights...</td>\n",
-       "      <td id=\"T_0502a_row88_col3\" class=\"data row88 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row88_col4\" class=\"data row88 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row88_col5\" class=\"data row88 col5\" >['dataset', 'models']</td>\n",
-       "      <td id=\"T_0502a_row88_col6\" class=\"data row88 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row88_col7\" class=\"data row88 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
-       "      <td id=\"T_0502a_row88_col8\" class=\"data row88 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row89_col0\" class=\"data row89 col0\" >validmind.model_validation.embeddings.EuclideanDistanceHeatmap</td>\n",
-       "      <td id=\"T_0502a_row89_col1\" class=\"data row89 col1\" >Euclidean Distance Heatmap</td>\n",
-       "      <td id=\"T_0502a_row89_col2\" class=\"data row89 col2\" >Generates an interactive heatmap to visualize the Euclidean distances among embeddings derived from a given model....</td>\n",
-       "      <td id=\"T_0502a_row89_col3\" class=\"data row89 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row89_col4\" class=\"data row89 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row89_col5\" class=\"data row89 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row89_col6\" class=\"data row89 col6\" >{'title': {'type': '_empty', 'default': 'Euclidean Distance Matrix'}, 'color': {'type': '_empty', 'default': 'Euclidean Distance'}, 'xaxis_title': {'type': '_empty', 'default': 'Index'}, 'yaxis_title': {'type': '_empty', 'default': 'Index'}, 'color_scale': {'type': '_empty', 'default': 'Blues'}}</td>\n",
-       "      <td id=\"T_0502a_row89_col7\" class=\"data row89 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
-       "      <td id=\"T_0502a_row89_col8\" class=\"data row89 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row90_col0\" class=\"data row90 col0\" >validmind.model_validation.embeddings.PCAComponentsPairwisePlots</td>\n",
-       "      <td id=\"T_0502a_row90_col1\" class=\"data row90 col1\" >PCA Components Pairwise Plots</td>\n",
-       "      <td id=\"T_0502a_row90_col2\" class=\"data row90 col2\" >Generates scatter plots for pairwise combinations of principal component analysis (PCA) components of model...</td>\n",
-       "      <td id=\"T_0502a_row90_col3\" class=\"data row90 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row90_col4\" class=\"data row90 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row90_col5\" class=\"data row90 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row90_col6\" class=\"data row90 col6\" >{'n_components': {'type': 'int', 'default': 3}}</td>\n",
-       "      <td id=\"T_0502a_row90_col7\" class=\"data row90 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
-       "      <td id=\"T_0502a_row90_col8\" class=\"data row90 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row91_col0\" class=\"data row91 col0\" >validmind.model_validation.embeddings.StabilityAnalysisKeyword</td>\n",
-       "      <td id=\"T_0502a_row91_col1\" class=\"data row91 col1\" >Stability Analysis Keyword</td>\n",
-       "      <td id=\"T_0502a_row91_col2\" class=\"data row91 col2\" >Evaluates robustness of embedding models to keyword swaps in the test dataset....</td>\n",
-       "      <td id=\"T_0502a_row91_col3\" class=\"data row91 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row91_col4\" class=\"data row91 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row91_col5\" class=\"data row91 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row91_col6\" class=\"data row91 col6\" >{'keyword_dict': {'type': None, 'default': None}, 'mean_similarity_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
-       "      <td id=\"T_0502a_row91_col7\" class=\"data row91 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row91_col8\" class=\"data row91 col8\" >['feature_extraction']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row92_col0\" class=\"data row92 col0\" >validmind.model_validation.embeddings.StabilityAnalysisRandomNoise</td>\n",
-       "      <td id=\"T_0502a_row92_col1\" class=\"data row92 col1\" >Stability Analysis Random Noise</td>\n",
-       "      <td id=\"T_0502a_row92_col2\" class=\"data row92 col2\" >Assesses the robustness of text embeddings models to random noise introduced via text perturbations....</td>\n",
-       "      <td id=\"T_0502a_row92_col3\" class=\"data row92 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row92_col4\" class=\"data row92 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row92_col5\" class=\"data row92 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row92_col6\" class=\"data row92 col6\" >{'probability': {'type': 'float', 'default': 0.02}, 'mean_similarity_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
-       "      <td id=\"T_0502a_row92_col7\" class=\"data row92 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row92_col8\" class=\"data row92 col8\" >['feature_extraction']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row93_col0\" class=\"data row93 col0\" >validmind.model_validation.embeddings.StabilityAnalysisSynonyms</td>\n",
-       "      <td id=\"T_0502a_row93_col1\" class=\"data row93 col1\" >Stability Analysis Synonyms</td>\n",
-       "      <td id=\"T_0502a_row93_col2\" class=\"data row93 col2\" >Evaluates the stability of text embeddings models when words in test data are replaced by their synonyms randomly....</td>\n",
-       "      <td id=\"T_0502a_row93_col3\" class=\"data row93 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row93_col4\" class=\"data row93 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row93_col5\" class=\"data row93 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row93_col6\" class=\"data row93 col6\" >{'probability': {'type': 'float', 'default': 0.02}, 'mean_similarity_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
-       "      <td id=\"T_0502a_row93_col7\" class=\"data row93 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row93_col8\" class=\"data row93 col8\" >['feature_extraction']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row94_col0\" class=\"data row94 col0\" >validmind.model_validation.embeddings.StabilityAnalysisTranslation</td>\n",
-       "      <td id=\"T_0502a_row94_col1\" class=\"data row94 col1\" >Stability Analysis Translation</td>\n",
-       "      <td id=\"T_0502a_row94_col2\" class=\"data row94 col2\" >Evaluates robustness of text embeddings models to noise introduced by translating the original text to another...</td>\n",
-       "      <td id=\"T_0502a_row94_col3\" class=\"data row94 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row94_col4\" class=\"data row94 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row94_col5\" class=\"data row94 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row94_col6\" class=\"data row94 col6\" >{'source_lang': {'type': 'str', 'default': 'en'}, 'target_lang': {'type': 'str', 'default': 'fr'}, 'mean_similarity_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
-       "      <td id=\"T_0502a_row94_col7\" class=\"data row94 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row94_col8\" class=\"data row94 col8\" >['feature_extraction']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row95_col0\" class=\"data row95 col0\" >validmind.model_validation.embeddings.TSNEComponentsPairwisePlots</td>\n",
-       "      <td id=\"T_0502a_row95_col1\" class=\"data row95 col1\" >TSNE Components Pairwise Plots</td>\n",
-       "      <td id=\"T_0502a_row95_col2\" class=\"data row95 col2\" >Creates scatter plots for pairwise combinations of t-SNE components to visualize embeddings and highlight potential...</td>\n",
-       "      <td id=\"T_0502a_row95_col3\" class=\"data row95 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row95_col4\" class=\"data row95 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row95_col5\" class=\"data row95 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row95_col6\" class=\"data row95 col6\" >{'n_components': {'type': 'int', 'default': 2}, 'perplexity': {'type': 'int', 'default': 30}, 'title': {'type': 'str', 'default': 't-SNE'}}</td>\n",
-       "      <td id=\"T_0502a_row95_col7\" class=\"data row95 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
-       "      <td id=\"T_0502a_row95_col8\" class=\"data row95 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row96_col0\" class=\"data row96 col0\" >validmind.model_validation.ragas.AnswerCorrectness</td>\n",
-       "      <td id=\"T_0502a_row96_col1\" class=\"data row96 col1\" >Answer Correctness</td>\n",
-       "      <td id=\"T_0502a_row96_col2\" class=\"data row96 col2\" >Evaluates the correctness of answers in a dataset with respect to the provided ground...</td>\n",
-       "      <td id=\"T_0502a_row96_col3\" class=\"data row96 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row96_col4\" class=\"data row96 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row96_col5\" class=\"data row96 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row96_col6\" class=\"data row96 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'response_column': {'type': 'str', 'default': 'response'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row96_col7\" class=\"data row96 col7\" >['ragas', 'llm']</td>\n",
-       "      <td id=\"T_0502a_row96_col8\" class=\"data row96 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row97_col0\" class=\"data row97 col0\" >validmind.model_validation.ragas.AspectCritic</td>\n",
-       "      <td id=\"T_0502a_row97_col1\" class=\"data row97 col1\" >Aspect Critic</td>\n",
-       "      <td id=\"T_0502a_row97_col2\" class=\"data row97 col2\" >Evaluates generations against the following aspects: harmfulness, maliciousness,...</td>\n",
-       "      <td id=\"T_0502a_row97_col3\" class=\"data row97 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row97_col4\" class=\"data row97 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row97_col5\" class=\"data row97 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row97_col6\" class=\"data row97 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'response_column': {'type': 'str', 'default': 'response'}, 'retrieved_contexts_column': {'type': None, 'default': None}, 'aspects': {'type': None, 'default': ['coherence', 'conciseness', 'correctness', 'harmfulness', 'maliciousness']}, 'additional_aspects': {'type': None, 'default': None}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row97_col7\" class=\"data row97 col7\" >['ragas', 'llm', 'qualitative']</td>\n",
-       "      <td id=\"T_0502a_row97_col8\" class=\"data row97 col8\" >['text_summarization', 'text_generation', 'text_qa']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row98_col0\" class=\"data row98 col0\" >validmind.model_validation.ragas.ContextEntityRecall</td>\n",
-       "      <td id=\"T_0502a_row98_col1\" class=\"data row98 col1\" >Context Entity Recall</td>\n",
-       "      <td id=\"T_0502a_row98_col2\" class=\"data row98 col2\" >Evaluates the context entity recall for dataset entries and visualizes the results....</td>\n",
-       "      <td id=\"T_0502a_row98_col3\" class=\"data row98 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row98_col4\" class=\"data row98 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row98_col5\" class=\"data row98 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row98_col6\" class=\"data row98 col6\" >{'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row98_col7\" class=\"data row98 col7\" >['ragas', 'llm', 'retrieval_performance']</td>\n",
-       "      <td id=\"T_0502a_row98_col8\" class=\"data row98 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row99_col0\" class=\"data row99 col0\" >validmind.model_validation.ragas.ContextPrecision</td>\n",
-       "      <td id=\"T_0502a_row99_col1\" class=\"data row99 col1\" >Context Precision</td>\n",
-       "      <td id=\"T_0502a_row99_col2\" class=\"data row99 col2\" >Context Precision is a metric that evaluates whether all of the ground-truth...</td>\n",
-       "      <td id=\"T_0502a_row99_col3\" class=\"data row99 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row99_col4\" class=\"data row99 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row99_col5\" class=\"data row99 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row99_col6\" class=\"data row99 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row99_col7\" class=\"data row99 col7\" >['ragas', 'llm', 'retrieval_performance']</td>\n",
-       "      <td id=\"T_0502a_row99_col8\" class=\"data row99 col8\" >['text_qa', 'text_generation', 'text_summarization', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row100_col0\" class=\"data row100 col0\" >validmind.model_validation.ragas.ContextPrecisionWithoutReference</td>\n",
-       "      <td id=\"T_0502a_row100_col1\" class=\"data row100 col1\" >Context Precision Without Reference</td>\n",
-       "      <td id=\"T_0502a_row100_col2\" class=\"data row100 col2\" >Context Precision Without Reference is a metric used to evaluate the relevance of...</td>\n",
-       "      <td id=\"T_0502a_row100_col3\" class=\"data row100 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row100_col4\" class=\"data row100 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row100_col5\" class=\"data row100 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row100_col6\" class=\"data row100 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'response_column': {'type': 'str', 'default': 'response'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row100_col7\" class=\"data row100 col7\" >['ragas', 'llm', 'retrieval_performance']</td>\n",
-       "      <td id=\"T_0502a_row100_col8\" class=\"data row100 col8\" >['text_qa', 'text_generation', 'text_summarization', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row101_col0\" class=\"data row101 col0\" >validmind.model_validation.ragas.ContextRecall</td>\n",
-       "      <td id=\"T_0502a_row101_col1\" class=\"data row101 col1\" >Context Recall</td>\n",
-       "      <td id=\"T_0502a_row101_col2\" class=\"data row101 col2\" >Context recall measures the extent to which the retrieved context aligns with the...</td>\n",
-       "      <td id=\"T_0502a_row101_col3\" class=\"data row101 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row101_col4\" class=\"data row101 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row101_col5\" class=\"data row101 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row101_col6\" class=\"data row101 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row101_col7\" class=\"data row101 col7\" >['ragas', 'llm', 'retrieval_performance']</td>\n",
-       "      <td id=\"T_0502a_row101_col8\" class=\"data row101 col8\" >['text_qa', 'text_generation', 'text_summarization', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row102_col0\" class=\"data row102 col0\" >validmind.model_validation.ragas.Faithfulness</td>\n",
-       "      <td id=\"T_0502a_row102_col1\" class=\"data row102 col1\" >Faithfulness</td>\n",
-       "      <td id=\"T_0502a_row102_col2\" class=\"data row102 col2\" >Evaluates the faithfulness of the generated answers with respect to retrieved contexts....</td>\n",
-       "      <td id=\"T_0502a_row102_col3\" class=\"data row102 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row102_col4\" class=\"data row102 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row102_col5\" class=\"data row102 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row102_col6\" class=\"data row102 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'response_column': {'type': 'str', 'default': 'response'}, 'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row102_col7\" class=\"data row102 col7\" >['ragas', 'llm', 'rag_performance']</td>\n",
-       "      <td id=\"T_0502a_row102_col8\" class=\"data row102 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row103_col0\" class=\"data row103 col0\" >validmind.model_validation.ragas.NoiseSensitivity</td>\n",
-       "      <td id=\"T_0502a_row103_col1\" class=\"data row103 col1\" >Noise Sensitivity</td>\n",
-       "      <td id=\"T_0502a_row103_col2\" class=\"data row103 col2\" >Assesses the sensitivity of a Large Language Model (LLM) to noise in retrieved context by measuring how often it...</td>\n",
-       "      <td id=\"T_0502a_row103_col3\" class=\"data row103 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row103_col4\" class=\"data row103 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row103_col5\" class=\"data row103 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row103_col6\" class=\"data row103 col6\" >{'response_column': {'type': 'str', 'default': 'response'}, 'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'focus': {'type': 'str', 'default': 'relevant'}, 'user_input_column': {'type': 'str', 'default': 'user_input'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row103_col7\" class=\"data row103 col7\" >['ragas', 'llm', 'rag_performance']</td>\n",
-       "      <td id=\"T_0502a_row103_col8\" class=\"data row103 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row104_col0\" class=\"data row104 col0\" >validmind.model_validation.ragas.ResponseRelevancy</td>\n",
-       "      <td id=\"T_0502a_row104_col1\" class=\"data row104 col1\" >Response Relevancy</td>\n",
-       "      <td id=\"T_0502a_row104_col2\" class=\"data row104 col2\" >Assesses how pertinent the generated answer is to the given prompt....</td>\n",
-       "      <td id=\"T_0502a_row104_col3\" class=\"data row104 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row104_col4\" class=\"data row104 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row104_col5\" class=\"data row104 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row104_col6\" class=\"data row104 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'retrieved_contexts_column': {'type': 'str', 'default': None}, 'response_column': {'type': 'str', 'default': 'response'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row104_col7\" class=\"data row104 col7\" >['ragas', 'llm', 'rag_performance']</td>\n",
-       "      <td id=\"T_0502a_row104_col8\" class=\"data row104 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row105_col0\" class=\"data row105 col0\" >validmind.model_validation.ragas.SemanticSimilarity</td>\n",
-       "      <td id=\"T_0502a_row105_col1\" class=\"data row105 col1\" >Semantic Similarity</td>\n",
-       "      <td id=\"T_0502a_row105_col2\" class=\"data row105 col2\" >Calculates the semantic similarity between generated responses and ground truths...</td>\n",
-       "      <td id=\"T_0502a_row105_col3\" class=\"data row105 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row105_col4\" class=\"data row105 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row105_col5\" class=\"data row105 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row105_col6\" class=\"data row105 col6\" >{'response_column': {'type': 'str', 'default': 'response'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row105_col7\" class=\"data row105 col7\" >['ragas', 'llm']</td>\n",
-       "      <td id=\"T_0502a_row105_col8\" class=\"data row105 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row106_col0\" class=\"data row106 col0\" >validmind.model_validation.sklearn.AdjustedMutualInformation</td>\n",
-       "      <td id=\"T_0502a_row106_col1\" class=\"data row106 col1\" >Adjusted Mutual Information</td>\n",
-       "      <td id=\"T_0502a_row106_col2\" class=\"data row106 col2\" >Evaluates clustering model performance by measuring mutual information between true and predicted labels, adjusting...</td>\n",
-       "      <td id=\"T_0502a_row106_col3\" class=\"data row106 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row106_col4\" class=\"data row106 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row106_col5\" class=\"data row106 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row106_col6\" class=\"data row106 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row106_col7\" class=\"data row106 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
-       "      <td id=\"T_0502a_row106_col8\" class=\"data row106 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row107_col0\" class=\"data row107 col0\" >validmind.model_validation.sklearn.AdjustedRandIndex</td>\n",
-       "      <td id=\"T_0502a_row107_col1\" class=\"data row107 col1\" >Adjusted Rand Index</td>\n",
-       "      <td id=\"T_0502a_row107_col2\" class=\"data row107 col2\" >Measures the similarity between two data clusters using the Adjusted Rand Index (ARI) metric in clustering machine...</td>\n",
-       "      <td id=\"T_0502a_row107_col3\" class=\"data row107 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row107_col4\" class=\"data row107 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row107_col5\" class=\"data row107 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row107_col6\" class=\"data row107 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row107_col7\" class=\"data row107 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
-       "      <td id=\"T_0502a_row107_col8\" class=\"data row107 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row108_col0\" class=\"data row108 col0\" >validmind.model_validation.sklearn.CalibrationCurve</td>\n",
-       "      <td id=\"T_0502a_row108_col1\" class=\"data row108 col1\" >Calibration Curve</td>\n",
-       "      <td id=\"T_0502a_row108_col2\" class=\"data row108 col2\" >Evaluates the calibration of probability estimates by comparing predicted probabilities against observed...</td>\n",
-       "      <td id=\"T_0502a_row108_col3\" class=\"data row108 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row108_col4\" class=\"data row108 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row108_col5\" class=\"data row108 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row108_col6\" class=\"data row108 col6\" >{'n_bins': {'type': 'int', 'default': 10}}</td>\n",
-       "      <td id=\"T_0502a_row108_col7\" class=\"data row108 col7\" >['sklearn', 'model_performance', 'classification']</td>\n",
-       "      <td id=\"T_0502a_row108_col8\" class=\"data row108 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row109_col0\" class=\"data row109 col0\" >validmind.model_validation.sklearn.ClassifierPerformance</td>\n",
-       "      <td id=\"T_0502a_row109_col1\" class=\"data row109 col1\" >Classifier Performance</td>\n",
-       "      <td id=\"T_0502a_row109_col2\" class=\"data row109 col2\" >Evaluates performance of binary or multiclass classification models using precision, recall, F1-Score, accuracy,...</td>\n",
-       "      <td id=\"T_0502a_row109_col3\" class=\"data row109 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row109_col4\" class=\"data row109 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row109_col5\" class=\"data row109 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row109_col6\" class=\"data row109 col6\" >{'average': {'type': 'str', 'default': 'macro'}}</td>\n",
-       "      <td id=\"T_0502a_row109_col7\" class=\"data row109 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row109_col8\" class=\"data row109 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row110_col0\" class=\"data row110 col0\" >validmind.model_validation.sklearn.ClassifierThresholdOptimization</td>\n",
-       "      <td id=\"T_0502a_row110_col1\" class=\"data row110 col1\" >Classifier Threshold Optimization</td>\n",
-       "      <td id=\"T_0502a_row110_col2\" class=\"data row110 col2\" >Analyzes and visualizes different threshold optimization methods for binary classification models....</td>\n",
-       "      <td id=\"T_0502a_row110_col3\" class=\"data row110 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row110_col4\" class=\"data row110 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row110_col5\" class=\"data row110 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row110_col6\" class=\"data row110 col6\" >{'methods': {'type': None, 'default': None}, 'target_recall': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row110_col7\" class=\"data row110 col7\" >['model_validation', 'threshold_optimization', 'classification_metrics']</td>\n",
-       "      <td id=\"T_0502a_row110_col8\" class=\"data row110 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row111_col0\" class=\"data row111 col0\" >validmind.model_validation.sklearn.ClusterCosineSimilarity</td>\n",
-       "      <td id=\"T_0502a_row111_col1\" class=\"data row111 col1\" >Cluster Cosine Similarity</td>\n",
-       "      <td id=\"T_0502a_row111_col2\" class=\"data row111 col2\" >Measures the intra-cluster similarity of a clustering model using cosine similarity....</td>\n",
-       "      <td id=\"T_0502a_row111_col3\" class=\"data row111 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row111_col4\" class=\"data row111 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row111_col5\" class=\"data row111 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row111_col6\" class=\"data row111 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row111_col7\" class=\"data row111 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
-       "      <td id=\"T_0502a_row111_col8\" class=\"data row111 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row112_col0\" class=\"data row112 col0\" >validmind.model_validation.sklearn.ClusterPerformanceMetrics</td>\n",
-       "      <td id=\"T_0502a_row112_col1\" class=\"data row112 col1\" >Cluster Performance Metrics</td>\n",
-       "      <td id=\"T_0502a_row112_col2\" class=\"data row112 col2\" >Evaluates the performance of clustering machine learning models using multiple established metrics....</td>\n",
-       "      <td id=\"T_0502a_row112_col3\" class=\"data row112 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row112_col4\" class=\"data row112 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row112_col5\" class=\"data row112 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row112_col6\" class=\"data row112 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row112_col7\" class=\"data row112 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
-       "      <td id=\"T_0502a_row112_col8\" class=\"data row112 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row113_col0\" class=\"data row113 col0\" >validmind.model_validation.sklearn.CompletenessScore</td>\n",
-       "      <td id=\"T_0502a_row113_col1\" class=\"data row113 col1\" >Completeness Score</td>\n",
-       "      <td id=\"T_0502a_row113_col2\" class=\"data row113 col2\" >Evaluates a clustering model's capacity to categorize instances from a single class into the same cluster....</td>\n",
-       "      <td id=\"T_0502a_row113_col3\" class=\"data row113 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row113_col4\" class=\"data row113 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row113_col5\" class=\"data row113 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row113_col6\" class=\"data row113 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row113_col7\" class=\"data row113 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
-       "      <td id=\"T_0502a_row113_col8\" class=\"data row113 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row114_col0\" class=\"data row114 col0\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
-       "      <td id=\"T_0502a_row114_col1\" class=\"data row114 col1\" >Confusion Matrix</td>\n",
-       "      <td id=\"T_0502a_row114_col2\" class=\"data row114 col2\" >Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix...</td>\n",
-       "      <td id=\"T_0502a_row114_col3\" class=\"data row114 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row114_col4\" class=\"data row114 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row114_col5\" class=\"data row114 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row114_col6\" class=\"data row114 col6\" >{'threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_0502a_row114_col7\" class=\"data row114 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row114_col8\" class=\"data row114 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row115_col0\" class=\"data row115 col0\" >validmind.model_validation.sklearn.FeatureImportance</td>\n",
-       "      <td id=\"T_0502a_row115_col1\" class=\"data row115 col1\" >Feature Importance</td>\n",
-       "      <td id=\"T_0502a_row115_col2\" class=\"data row115 col2\" >Compute feature importance scores for a given model and generate a summary table...</td>\n",
-       "      <td id=\"T_0502a_row115_col3\" class=\"data row115 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row115_col4\" class=\"data row115 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row115_col5\" class=\"data row115 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row115_col6\" class=\"data row115 col6\" >{'num_features': {'type': 'int', 'default': 3}}</td>\n",
-       "      <td id=\"T_0502a_row115_col7\" class=\"data row115 col7\" >['model_explainability', 'sklearn']</td>\n",
-       "      <td id=\"T_0502a_row115_col8\" class=\"data row115 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row116_col0\" class=\"data row116 col0\" >validmind.model_validation.sklearn.FowlkesMallowsScore</td>\n",
-       "      <td id=\"T_0502a_row116_col1\" class=\"data row116 col1\" >Fowlkes Mallows Score</td>\n",
-       "      <td id=\"T_0502a_row116_col2\" class=\"data row116 col2\" >Evaluates the similarity between predicted and actual cluster assignments in a model using the Fowlkes-Mallows...</td>\n",
-       "      <td id=\"T_0502a_row116_col3\" class=\"data row116 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row116_col4\" class=\"data row116 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row116_col5\" class=\"data row116 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row116_col6\" class=\"data row116 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row116_col7\" class=\"data row116 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row116_col8\" class=\"data row116 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row117_col0\" class=\"data row117 col0\" >validmind.model_validation.sklearn.HomogeneityScore</td>\n",
-       "      <td id=\"T_0502a_row117_col1\" class=\"data row117 col1\" >Homogeneity Score</td>\n",
-       "      <td id=\"T_0502a_row117_col2\" class=\"data row117 col2\" >Assesses clustering homogeneity by comparing true and predicted labels, scoring from 0 (heterogeneous) to 1...</td>\n",
-       "      <td id=\"T_0502a_row117_col3\" class=\"data row117 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row117_col4\" class=\"data row117 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row117_col5\" class=\"data row117 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row117_col6\" class=\"data row117 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row117_col7\" class=\"data row117 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row117_col8\" class=\"data row117 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row118_col0\" class=\"data row118 col0\" >validmind.model_validation.sklearn.HyperParametersTuning</td>\n",
-       "      <td id=\"T_0502a_row118_col1\" class=\"data row118 col1\" >Hyper Parameters Tuning</td>\n",
-       "      <td id=\"T_0502a_row118_col2\" class=\"data row118 col2\" >Performs exhaustive grid search over specified parameter ranges to find optimal model configurations...</td>\n",
-       "      <td id=\"T_0502a_row118_col3\" class=\"data row118 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row118_col4\" class=\"data row118 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row118_col5\" class=\"data row118 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row118_col6\" class=\"data row118 col6\" >{'param_grid': {'type': 'dict', 'default': None}, 'scoring': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}, 'fit_params': {'type': 'dict', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row118_col7\" class=\"data row118 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row118_col8\" class=\"data row118 col8\" >['clustering', 'classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row119_col0\" class=\"data row119 col0\" >validmind.model_validation.sklearn.KMeansClustersOptimization</td>\n",
-       "      <td id=\"T_0502a_row119_col1\" class=\"data row119 col1\" >K Means Clusters Optimization</td>\n",
-       "      <td id=\"T_0502a_row119_col2\" class=\"data row119 col2\" >Optimizes the number of clusters in K-means models using Elbow and Silhouette methods....</td>\n",
-       "      <td id=\"T_0502a_row119_col3\" class=\"data row119 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row119_col4\" class=\"data row119 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row119_col5\" class=\"data row119 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row119_col6\" class=\"data row119 col6\" >{'n_clusters': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row119_col7\" class=\"data row119 col7\" >['sklearn', 'model_performance', 'kmeans']</td>\n",
-       "      <td id=\"T_0502a_row119_col8\" class=\"data row119 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row120_col0\" class=\"data row120 col0\" >validmind.model_validation.sklearn.MinimumAccuracy</td>\n",
-       "      <td id=\"T_0502a_row120_col1\" class=\"data row120 col1\" >Minimum Accuracy</td>\n",
-       "      <td id=\"T_0502a_row120_col2\" class=\"data row120 col2\" >Checks if the model's prediction accuracy meets or surpasses a specified threshold....</td>\n",
-       "      <td id=\"T_0502a_row120_col3\" class=\"data row120 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row120_col4\" class=\"data row120 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row120_col5\" class=\"data row120 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row120_col6\" class=\"data row120 col6\" >{'min_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
-       "      <td id=\"T_0502a_row120_col7\" class=\"data row120 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row120_col8\" class=\"data row120 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row121_col0\" class=\"data row121 col0\" >validmind.model_validation.sklearn.MinimumF1Score</td>\n",
-       "      <td id=\"T_0502a_row121_col1\" class=\"data row121 col1\" >Minimum F1 Score</td>\n",
-       "      <td id=\"T_0502a_row121_col2\" class=\"data row121 col2\" >Assesses if the model's F1 score on the validation set meets a predefined minimum threshold, ensuring balanced...</td>\n",
-       "      <td id=\"T_0502a_row121_col3\" class=\"data row121 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row121_col4\" class=\"data row121 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row121_col5\" class=\"data row121 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row121_col6\" class=\"data row121 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_0502a_row121_col7\" class=\"data row121 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row121_col8\" class=\"data row121 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row122_col0\" class=\"data row122 col0\" >validmind.model_validation.sklearn.MinimumROCAUCScore</td>\n",
-       "      <td id=\"T_0502a_row122_col1\" class=\"data row122 col1\" >Minimum ROCAUC Score</td>\n",
-       "      <td id=\"T_0502a_row122_col2\" class=\"data row122 col2\" >Validates model by checking if the ROC AUC score meets or surpasses a specified threshold....</td>\n",
-       "      <td id=\"T_0502a_row122_col3\" class=\"data row122 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row122_col4\" class=\"data row122 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row122_col5\" class=\"data row122 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row122_col6\" class=\"data row122 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_0502a_row122_col7\" class=\"data row122 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row122_col8\" class=\"data row122 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row123_col0\" class=\"data row123 col0\" >validmind.model_validation.sklearn.ModelParameters</td>\n",
-       "      <td id=\"T_0502a_row123_col1\" class=\"data row123 col1\" >Model Parameters</td>\n",
-       "      <td id=\"T_0502a_row123_col2\" class=\"data row123 col2\" >Extracts and displays model parameters in a structured format for transparency and reproducibility....</td>\n",
-       "      <td id=\"T_0502a_row123_col3\" class=\"data row123 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row123_col4\" class=\"data row123 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row123_col5\" class=\"data row123 col5\" >['model']</td>\n",
-       "      <td id=\"T_0502a_row123_col6\" class=\"data row123 col6\" >{'model_params': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row123_col7\" class=\"data row123 col7\" >['model_training', 'metadata']</td>\n",
-       "      <td id=\"T_0502a_row123_col8\" class=\"data row123 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row124_col0\" class=\"data row124 col0\" >validmind.model_validation.sklearn.ModelsPerformanceComparison</td>\n",
-       "      <td id=\"T_0502a_row124_col1\" class=\"data row124 col1\" >Models Performance Comparison</td>\n",
-       "      <td id=\"T_0502a_row124_col2\" class=\"data row124 col2\" >Evaluates and compares the performance of multiple Machine Learning models using various metrics like accuracy,...</td>\n",
-       "      <td id=\"T_0502a_row124_col3\" class=\"data row124 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row124_col4\" class=\"data row124 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row124_col5\" class=\"data row124 col5\" >['dataset', 'models']</td>\n",
-       "      <td id=\"T_0502a_row124_col6\" class=\"data row124 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row124_col7\" class=\"data row124 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'model_comparison']</td>\n",
-       "      <td id=\"T_0502a_row124_col8\" class=\"data row124 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row125_col0\" class=\"data row125 col0\" >validmind.model_validation.sklearn.OverfitDiagnosis</td>\n",
-       "      <td id=\"T_0502a_row125_col1\" class=\"data row125 col1\" >Overfit Diagnosis</td>\n",
-       "      <td id=\"T_0502a_row125_col2\" class=\"data row125 col2\" >Assesses potential overfitting in a model's predictions, identifying regions where performance between training and...</td>\n",
-       "      <td id=\"T_0502a_row125_col3\" class=\"data row125 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row125_col4\" class=\"data row125 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row125_col5\" class=\"data row125 col5\" >['model', 'datasets']</td>\n",
-       "      <td id=\"T_0502a_row125_col6\" class=\"data row125 col6\" >{'metric': {'type': 'str', 'default': None}, 'cut_off_threshold': {'type': 'float', 'default': 0.04}}</td>\n",
-       "      <td id=\"T_0502a_row125_col7\" class=\"data row125 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'linear_regression', 'model_diagnosis']</td>\n",
-       "      <td id=\"T_0502a_row125_col8\" class=\"data row125 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row126_col0\" class=\"data row126 col0\" >validmind.model_validation.sklearn.PermutationFeatureImportance</td>\n",
-       "      <td id=\"T_0502a_row126_col1\" class=\"data row126 col1\" >Permutation Feature Importance</td>\n",
-       "      <td id=\"T_0502a_row126_col2\" class=\"data row126 col2\" >Assesses the significance of each feature in a model by evaluating the impact on model performance when feature...</td>\n",
-       "      <td id=\"T_0502a_row126_col3\" class=\"data row126 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row126_col4\" class=\"data row126 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row126_col5\" class=\"data row126 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row126_col6\" class=\"data row126 col6\" >{'fontsize': {'type': None, 'default': None}, 'figure_height': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row126_col7\" class=\"data row126 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row126_col8\" class=\"data row126 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row127_col0\" class=\"data row127 col0\" >validmind.model_validation.sklearn.PopulationStabilityIndex</td>\n",
-       "      <td id=\"T_0502a_row127_col1\" class=\"data row127 col1\" >Population Stability Index</td>\n",
-       "      <td id=\"T_0502a_row127_col2\" class=\"data row127 col2\" >Assesses the Population Stability Index (PSI) to quantify the stability of an ML model's predictions across...</td>\n",
-       "      <td id=\"T_0502a_row127_col3\" class=\"data row127 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row127_col4\" class=\"data row127 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row127_col5\" class=\"data row127 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row127_col6\" class=\"data row127 col6\" >{'num_bins': {'type': 'int', 'default': 10}, 'mode': {'type': 'str', 'default': 'fixed'}}</td>\n",
-       "      <td id=\"T_0502a_row127_col7\" class=\"data row127 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row127_col8\" class=\"data row127 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row128_col0\" class=\"data row128 col0\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
-       "      <td id=\"T_0502a_row128_col1\" class=\"data row128 col1\" >Precision Recall Curve</td>\n",
-       "      <td id=\"T_0502a_row128_col2\" class=\"data row128 col2\" >Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve....</td>\n",
-       "      <td id=\"T_0502a_row128_col3\" class=\"data row128 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row128_col4\" class=\"data row128 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row128_col5\" class=\"data row128 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row128_col6\" class=\"data row128 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row128_col7\" class=\"data row128 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row128_col8\" class=\"data row128 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row129_col0\" class=\"data row129 col0\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
-       "      <td id=\"T_0502a_row129_col1\" class=\"data row129 col1\" >ROC Curve</td>\n",
-       "      <td id=\"T_0502a_row129_col2\" class=\"data row129 col2\" >Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic...</td>\n",
-       "      <td id=\"T_0502a_row129_col3\" class=\"data row129 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row129_col4\" class=\"data row129 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row129_col5\" class=\"data row129 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row129_col6\" class=\"data row129 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row129_col7\" class=\"data row129 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row129_col8\" class=\"data row129 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row130_col0\" class=\"data row130 col0\" >validmind.model_validation.sklearn.RegressionErrors</td>\n",
-       "      <td id=\"T_0502a_row130_col1\" class=\"data row130 col1\" >Regression Errors</td>\n",
-       "      <td id=\"T_0502a_row130_col2\" class=\"data row130 col2\" >Assesses the performance and error distribution of a regression model using various error metrics....</td>\n",
-       "      <td id=\"T_0502a_row130_col3\" class=\"data row130 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row130_col4\" class=\"data row130 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row130_col5\" class=\"data row130 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row130_col6\" class=\"data row130 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row130_col7\" class=\"data row130 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row130_col8\" class=\"data row130 col8\" >['regression', 'classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row131_col0\" class=\"data row131 col0\" >validmind.model_validation.sklearn.RegressionErrorsComparison</td>\n",
-       "      <td id=\"T_0502a_row131_col1\" class=\"data row131 col1\" >Regression Errors Comparison</td>\n",
-       "      <td id=\"T_0502a_row131_col2\" class=\"data row131 col2\" >Assesses multiple regression error metrics to compare model performance across different datasets, emphasizing...</td>\n",
-       "      <td id=\"T_0502a_row131_col3\" class=\"data row131 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row131_col4\" class=\"data row131 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row131_col5\" class=\"data row131 col5\" >['datasets', 'models']</td>\n",
-       "      <td id=\"T_0502a_row131_col6\" class=\"data row131 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row131_col7\" class=\"data row131 col7\" >['model_performance', 'sklearn']</td>\n",
-       "      <td id=\"T_0502a_row131_col8\" class=\"data row131 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row132_col0\" class=\"data row132 col0\" >validmind.model_validation.sklearn.RegressionPerformance</td>\n",
-       "      <td id=\"T_0502a_row132_col1\" class=\"data row132 col1\" >Regression Performance</td>\n",
-       "      <td id=\"T_0502a_row132_col2\" class=\"data row132 col2\" >Evaluates the performance of a regression model using five different metrics: MAE, MSE, RMSE, MAPE, and MBD....</td>\n",
-       "      <td id=\"T_0502a_row132_col3\" class=\"data row132 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row132_col4\" class=\"data row132 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row132_col5\" class=\"data row132 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row132_col6\" class=\"data row132 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row132_col7\" class=\"data row132 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row132_col8\" class=\"data row132 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row133_col0\" class=\"data row133 col0\" >validmind.model_validation.sklearn.RegressionR2Square</td>\n",
-       "      <td id=\"T_0502a_row133_col1\" class=\"data row133 col1\" >Regression R2 Square</td>\n",
-       "      <td id=\"T_0502a_row133_col2\" class=\"data row133 col2\" >Assesses the overall goodness-of-fit of a regression model by evaluating R-squared (R2) and Adjusted R-squared (Adj...</td>\n",
-       "      <td id=\"T_0502a_row133_col3\" class=\"data row133 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row133_col4\" class=\"data row133 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row133_col5\" class=\"data row133 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row133_col6\" class=\"data row133 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row133_col7\" class=\"data row133 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row133_col8\" class=\"data row133 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row134_col0\" class=\"data row134 col0\" >validmind.model_validation.sklearn.RegressionR2SquareComparison</td>\n",
-       "      <td id=\"T_0502a_row134_col1\" class=\"data row134 col1\" >Regression R2 Square Comparison</td>\n",
-       "      <td id=\"T_0502a_row134_col2\" class=\"data row134 col2\" >Compares R-Squared and Adjusted R-Squared values for different regression models across multiple datasets to assess...</td>\n",
-       "      <td id=\"T_0502a_row134_col3\" class=\"data row134 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row134_col4\" class=\"data row134 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row134_col5\" class=\"data row134 col5\" >['datasets', 'models']</td>\n",
-       "      <td id=\"T_0502a_row134_col6\" class=\"data row134 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row134_col7\" class=\"data row134 col7\" >['model_performance', 'sklearn']</td>\n",
-       "      <td id=\"T_0502a_row134_col8\" class=\"data row134 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row135_col0\" class=\"data row135 col0\" >validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
-       "      <td id=\"T_0502a_row135_col1\" class=\"data row135 col1\" >Robustness Diagnosis</td>\n",
-       "      <td id=\"T_0502a_row135_col2\" class=\"data row135 col2\" >Assesses the robustness of a machine learning model by evaluating performance decay under noisy conditions....</td>\n",
-       "      <td id=\"T_0502a_row135_col3\" class=\"data row135 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row135_col4\" class=\"data row135 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row135_col5\" class=\"data row135 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row135_col6\" class=\"data row135 col6\" >{'metric': {'type': 'str', 'default': None}, 'scaling_factor_std_dev_list': {'type': None, 'default': [0.1, 0.2, 0.3, 0.4, 0.5]}, 'performance_decay_threshold': {'type': 'float', 'default': 0.05}}</td>\n",
-       "      <td id=\"T_0502a_row135_col7\" class=\"data row135 col7\" >['sklearn', 'model_diagnosis', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row135_col8\" class=\"data row135 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row136_col0\" class=\"data row136 col0\" >validmind.model_validation.sklearn.SHAPGlobalImportance</td>\n",
-       "      <td id=\"T_0502a_row136_col1\" class=\"data row136 col1\" >SHAP Global Importance</td>\n",
-       "      <td id=\"T_0502a_row136_col2\" class=\"data row136 col2\" >Evaluates and visualizes global feature importance using SHAP values for model explanation and risk identification....</td>\n",
-       "      <td id=\"T_0502a_row136_col3\" class=\"data row136 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row136_col4\" class=\"data row136 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row136_col5\" class=\"data row136 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row136_col6\" class=\"data row136 col6\" >{'kernel_explainer_samples': {'type': 'int', 'default': 10}, 'tree_or_linear_explainer_samples': {'type': 'int', 'default': 200}, 'class_of_interest': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row136_col7\" class=\"data row136 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row136_col8\" class=\"data row136 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row137_col0\" class=\"data row137 col0\" >validmind.model_validation.sklearn.ScoreProbabilityAlignment</td>\n",
-       "      <td id=\"T_0502a_row137_col1\" class=\"data row137 col1\" >Score Probability Alignment</td>\n",
-       "      <td id=\"T_0502a_row137_col2\" class=\"data row137 col2\" >Analyzes the alignment between credit scores and predicted probabilities....</td>\n",
-       "      <td id=\"T_0502a_row137_col3\" class=\"data row137 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row137_col4\" class=\"data row137 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row137_col5\" class=\"data row137 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row137_col6\" class=\"data row137 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'n_bins': {'type': 'int', 'default': 10}}</td>\n",
-       "      <td id=\"T_0502a_row137_col7\" class=\"data row137 col7\" >['visualization', 'credit_risk', 'calibration']</td>\n",
-       "      <td id=\"T_0502a_row137_col8\" class=\"data row137 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row138_col0\" class=\"data row138 col0\" >validmind.model_validation.sklearn.SilhouettePlot</td>\n",
-       "      <td id=\"T_0502a_row138_col1\" class=\"data row138 col1\" >Silhouette Plot</td>\n",
-       "      <td id=\"T_0502a_row138_col2\" class=\"data row138 col2\" >Calculates and visualizes Silhouette Score, assessing the degree of data point suitability to its cluster in ML...</td>\n",
-       "      <td id=\"T_0502a_row138_col3\" class=\"data row138 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row138_col4\" class=\"data row138 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row138_col5\" class=\"data row138 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row138_col6\" class=\"data row138 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row138_col7\" class=\"data row138 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row138_col8\" class=\"data row138 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row139_col0\" class=\"data row139 col0\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
-       "      <td id=\"T_0502a_row139_col1\" class=\"data row139 col1\" >Training Test Degradation</td>\n",
-       "      <td id=\"T_0502a_row139_col2\" class=\"data row139 col2\" >Tests if model performance degradation between training and test datasets exceeds a predefined threshold....</td>\n",
-       "      <td id=\"T_0502a_row139_col3\" class=\"data row139 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row139_col4\" class=\"data row139 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row139_col5\" class=\"data row139 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row139_col6\" class=\"data row139 col6\" >{'max_threshold': {'type': 'float', 'default': 0.1}}</td>\n",
-       "      <td id=\"T_0502a_row139_col7\" class=\"data row139 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row139_col8\" class=\"data row139 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row140_col0\" class=\"data row140 col0\" >validmind.model_validation.sklearn.VMeasure</td>\n",
-       "      <td id=\"T_0502a_row140_col1\" class=\"data row140 col1\" >V Measure</td>\n",
-       "      <td id=\"T_0502a_row140_col2\" class=\"data row140 col2\" >Evaluates homogeneity and completeness of a clustering model using the V Measure Score....</td>\n",
-       "      <td id=\"T_0502a_row140_col3\" class=\"data row140 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row140_col4\" class=\"data row140 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row140_col5\" class=\"data row140 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row140_col6\" class=\"data row140 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row140_col7\" class=\"data row140 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row140_col8\" class=\"data row140 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row141_col0\" class=\"data row141 col0\" >validmind.model_validation.sklearn.WeakspotsDiagnosis</td>\n",
-       "      <td id=\"T_0502a_row141_col1\" class=\"data row141 col1\" >Weakspots Diagnosis</td>\n",
-       "      <td id=\"T_0502a_row141_col2\" class=\"data row141 col2\" >Identifies and visualizes weak spots in a machine learning model's performance across various sections of the...</td>\n",
-       "      <td id=\"T_0502a_row141_col3\" class=\"data row141 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row141_col4\" class=\"data row141 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row141_col5\" class=\"data row141 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row141_col6\" class=\"data row141 col6\" >{'features_columns': {'type': None, 'default': None}, 'metrics': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row141_col7\" class=\"data row141 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_diagnosis', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row141_col8\" class=\"data row141 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row142_col0\" class=\"data row142 col0\" >validmind.model_validation.statsmodels.AutoARIMA</td>\n",
-       "      <td id=\"T_0502a_row142_col1\" class=\"data row142 col1\" >Auto ARIMA</td>\n",
-       "      <td id=\"T_0502a_row142_col2\" class=\"data row142 col2\" >Evaluates ARIMA models for time-series forecasting, ranking them using Bayesian and Akaike Information Criteria....</td>\n",
-       "      <td id=\"T_0502a_row142_col3\" class=\"data row142 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row142_col4\" class=\"data row142 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row142_col5\" class=\"data row142 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row142_col6\" class=\"data row142 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row142_col7\" class=\"data row142 col7\" >['time_series_data', 'forecasting', 'model_selection', 'statsmodels']</td>\n",
-       "      <td id=\"T_0502a_row142_col8\" class=\"data row142 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row143_col0\" class=\"data row143 col0\" >validmind.model_validation.statsmodels.CumulativePredictionProbabilities</td>\n",
-       "      <td id=\"T_0502a_row143_col1\" class=\"data row143 col1\" >Cumulative Prediction Probabilities</td>\n",
-       "      <td id=\"T_0502a_row143_col2\" class=\"data row143 col2\" >Visualizes cumulative probabilities of positive and negative classes for both training and testing in classification models....</td>\n",
-       "      <td id=\"T_0502a_row143_col3\" class=\"data row143 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row143_col4\" class=\"data row143 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row143_col5\" class=\"data row143 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row143_col6\" class=\"data row143 col6\" >{'title': {'type': 'str', 'default': 'Cumulative Probabilities'}}</td>\n",
-       "      <td id=\"T_0502a_row143_col7\" class=\"data row143 col7\" >['visualization', 'credit_risk']</td>\n",
-       "      <td id=\"T_0502a_row143_col8\" class=\"data row143 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row144_col0\" class=\"data row144 col0\" >validmind.model_validation.statsmodels.DurbinWatsonTest</td>\n",
-       "      <td id=\"T_0502a_row144_col1\" class=\"data row144 col1\" >Durbin Watson Test</td>\n",
-       "      <td id=\"T_0502a_row144_col2\" class=\"data row144 col2\" >Assesses autocorrelation in time series data features using the Durbin-Watson statistic....</td>\n",
-       "      <td id=\"T_0502a_row144_col3\" class=\"data row144 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row144_col4\" class=\"data row144 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row144_col5\" class=\"data row144 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row144_col6\" class=\"data row144 col6\" >{'threshold': {'type': None, 'default': [1.5, 2.5]}}</td>\n",
-       "      <td id=\"T_0502a_row144_col7\" class=\"data row144 col7\" >['time_series_data', 'forecasting', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_0502a_row144_col8\" class=\"data row144 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row145_col0\" class=\"data row145 col0\" >validmind.model_validation.statsmodels.GINITable</td>\n",
-       "      <td id=\"T_0502a_row145_col1\" class=\"data row145 col1\" >GINI Table</td>\n",
-       "      <td id=\"T_0502a_row145_col2\" class=\"data row145 col2\" >Evaluates classification model performance using AUC, GINI, and KS metrics for training and test datasets....</td>\n",
-       "      <td id=\"T_0502a_row145_col3\" class=\"data row145 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row145_col4\" class=\"data row145 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row145_col5\" class=\"data row145 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row145_col6\" class=\"data row145 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row145_col7\" class=\"data row145 col7\" >['model_performance']</td>\n",
-       "      <td id=\"T_0502a_row145_col8\" class=\"data row145 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row146_col0\" class=\"data row146 col0\" >validmind.model_validation.statsmodels.KolmogorovSmirnov</td>\n",
-       "      <td id=\"T_0502a_row146_col1\" class=\"data row146 col1\" >Kolmogorov Smirnov</td>\n",
-       "      <td id=\"T_0502a_row146_col2\" class=\"data row146 col2\" >Assesses whether each feature in the dataset aligns with a normal distribution using the Kolmogorov-Smirnov test....</td>\n",
-       "      <td id=\"T_0502a_row146_col3\" class=\"data row146 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row146_col4\" class=\"data row146 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row146_col5\" class=\"data row146 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row146_col6\" class=\"data row146 col6\" >{'dist': {'type': 'str', 'default': 'norm'}}</td>\n",
-       "      <td id=\"T_0502a_row146_col7\" class=\"data row146 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_0502a_row146_col8\" class=\"data row146 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row147_col0\" class=\"data row147 col0\" >validmind.model_validation.statsmodels.Lilliefors</td>\n",
-       "      <td id=\"T_0502a_row147_col1\" class=\"data row147 col1\" >Lilliefors</td>\n",
-       "      <td id=\"T_0502a_row147_col2\" class=\"data row147 col2\" >Assesses the normality of feature distributions in an ML model's training dataset using the Lilliefors test....</td>\n",
-       "      <td id=\"T_0502a_row147_col3\" class=\"data row147 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row147_col4\" class=\"data row147 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row147_col5\" class=\"data row147 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row147_col6\" class=\"data row147 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row147_col7\" class=\"data row147 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_0502a_row147_col8\" class=\"data row147 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row148_col0\" class=\"data row148 col0\" >validmind.model_validation.statsmodels.PredictionProbabilitiesHistogram</td>\n",
-       "      <td id=\"T_0502a_row148_col1\" class=\"data row148 col1\" >Prediction Probabilities Histogram</td>\n",
-       "      <td id=\"T_0502a_row148_col2\" class=\"data row148 col2\" >Assesses the predictive probability distribution for binary classification to evaluate model performance and...</td>\n",
-       "      <td id=\"T_0502a_row148_col3\" class=\"data row148 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row148_col4\" class=\"data row148 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row148_col5\" class=\"data row148 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row148_col6\" class=\"data row148 col6\" >{'title': {'type': 'str', 'default': 'Histogram of Predictive Probabilities'}}</td>\n",
-       "      <td id=\"T_0502a_row148_col7\" class=\"data row148 col7\" >['visualization', 'credit_risk']</td>\n",
-       "      <td id=\"T_0502a_row148_col8\" class=\"data row148 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row149_col0\" class=\"data row149 col0\" >validmind.model_validation.statsmodels.RegressionCoeffs</td>\n",
-       "      <td id=\"T_0502a_row149_col1\" class=\"data row149 col1\" >Regression Coeffs</td>\n",
-       "      <td id=\"T_0502a_row149_col2\" class=\"data row149 col2\" >Assesses the significance and uncertainty of predictor variables in a regression model through visualization of...</td>\n",
-       "      <td id=\"T_0502a_row149_col3\" class=\"data row149 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row149_col4\" class=\"data row149 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row149_col5\" class=\"data row149 col5\" >['model']</td>\n",
-       "      <td id=\"T_0502a_row149_col6\" class=\"data row149 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row149_col7\" class=\"data row149 col7\" >['tabular_data', 'visualization', 'model_training']</td>\n",
-       "      <td id=\"T_0502a_row149_col8\" class=\"data row149 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row150_col0\" class=\"data row150 col0\" >validmind.model_validation.statsmodels.RegressionFeatureSignificance</td>\n",
-       "      <td id=\"T_0502a_row150_col1\" class=\"data row150 col1\" >Regression Feature Significance</td>\n",
-       "      <td id=\"T_0502a_row150_col2\" class=\"data row150 col2\" >Assesses and visualizes the statistical significance of features in a regression model....</td>\n",
-       "      <td id=\"T_0502a_row150_col3\" class=\"data row150 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row150_col4\" class=\"data row150 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row150_col5\" class=\"data row150 col5\" >['model']</td>\n",
-       "      <td id=\"T_0502a_row150_col6\" class=\"data row150 col6\" >{'fontsize': {'type': 'int', 'default': 10}, 'p_threshold': {'type': 'float', 'default': 0.05}}</td>\n",
-       "      <td id=\"T_0502a_row150_col7\" class=\"data row150 col7\" >['statistical_test', 'model_interpretation', 'visualization', 'feature_importance']</td>\n",
-       "      <td id=\"T_0502a_row150_col8\" class=\"data row150 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row151_col0\" class=\"data row151 col0\" >validmind.model_validation.statsmodels.RegressionModelForecastPlot</td>\n",
-       "      <td id=\"T_0502a_row151_col1\" class=\"data row151 col1\" >Regression Model Forecast Plot</td>\n",
-       "      <td id=\"T_0502a_row151_col2\" class=\"data row151 col2\" >Generates plots to visually compare the forecasted outcomes of a regression model against actual observed values over...</td>\n",
-       "      <td id=\"T_0502a_row151_col3\" class=\"data row151 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row151_col4\" class=\"data row151 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row151_col5\" class=\"data row151 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row151_col6\" class=\"data row151 col6\" >{'start_date': {'type': None, 'default': None}, 'end_date': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row151_col7\" class=\"data row151 col7\" >['time_series_data', 'forecasting', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row151_col8\" class=\"data row151 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row152_col0\" class=\"data row152 col0\" >validmind.model_validation.statsmodels.RegressionModelForecastPlotLevels</td>\n",
-       "      <td id=\"T_0502a_row152_col1\" class=\"data row152 col1\" >Regression Model Forecast Plot Levels</td>\n",
-       "      <td id=\"T_0502a_row152_col2\" class=\"data row152 col2\" >Assesses the alignment between forecasted and observed values in regression models through visual plots...</td>\n",
-       "      <td id=\"T_0502a_row152_col3\" class=\"data row152 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row152_col4\" class=\"data row152 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row152_col5\" class=\"data row152 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row152_col6\" class=\"data row152 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row152_col7\" class=\"data row152 col7\" >['time_series_data', 'forecasting', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row152_col8\" class=\"data row152 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row153_col0\" class=\"data row153 col0\" >validmind.model_validation.statsmodels.RegressionModelSensitivityPlot</td>\n",
-       "      <td id=\"T_0502a_row153_col1\" class=\"data row153 col1\" >Regression Model Sensitivity Plot</td>\n",
-       "      <td id=\"T_0502a_row153_col2\" class=\"data row153 col2\" >Assesses the sensitivity of a regression model to changes in independent variables by applying shocks and...</td>\n",
-       "      <td id=\"T_0502a_row153_col3\" class=\"data row153 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row153_col4\" class=\"data row153 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row153_col5\" class=\"data row153 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row153_col6\" class=\"data row153 col6\" >{'shocks': {'type': None, 'default': [0.1]}, 'transformation': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row153_col7\" class=\"data row153 col7\" >['senstivity_analysis', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row153_col8\" class=\"data row153 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row154_col0\" class=\"data row154 col0\" >validmind.model_validation.statsmodels.RegressionModelSummary</td>\n",
-       "      <td id=\"T_0502a_row154_col1\" class=\"data row154 col1\" >Regression Model Summary</td>\n",
-       "      <td id=\"T_0502a_row154_col2\" class=\"data row154 col2\" >Evaluates regression model performance using metrics including R-Squared, Adjusted R-Squared, MSE, and RMSE....</td>\n",
-       "      <td id=\"T_0502a_row154_col3\" class=\"data row154 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row154_col4\" class=\"data row154 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row154_col5\" class=\"data row154 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row154_col6\" class=\"data row154 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row154_col7\" class=\"data row154 col7\" >['model_performance', 'regression']</td>\n",
-       "      <td id=\"T_0502a_row154_col8\" class=\"data row154 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row155_col0\" class=\"data row155 col0\" >validmind.model_validation.statsmodels.RegressionPermutationFeatureImportance</td>\n",
-       "      <td id=\"T_0502a_row155_col1\" class=\"data row155 col1\" >Regression Permutation Feature Importance</td>\n",
-       "      <td id=\"T_0502a_row155_col2\" class=\"data row155 col2\" >Assesses the significance of each feature in a model by evaluating the impact on model performance when feature...</td>\n",
-       "      <td id=\"T_0502a_row155_col3\" class=\"data row155 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row155_col4\" class=\"data row155 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row155_col5\" class=\"data row155 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row155_col6\" class=\"data row155 col6\" >{'fontsize': {'type': 'int', 'default': 12}, 'figure_height': {'type': 'int', 'default': 500}}</td>\n",
-       "      <td id=\"T_0502a_row155_col7\" class=\"data row155 col7\" >['statsmodels', 'feature_importance', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row155_col8\" class=\"data row155 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row156_col0\" class=\"data row156 col0\" >validmind.model_validation.statsmodels.ScorecardHistogram</td>\n",
-       "      <td id=\"T_0502a_row156_col1\" class=\"data row156 col1\" >Scorecard Histogram</td>\n",
-       "      <td id=\"T_0502a_row156_col2\" class=\"data row156 col2\" >The Scorecard Histogram test evaluates the distribution of credit scores between default and non-default instances,...</td>\n",
-       "      <td id=\"T_0502a_row156_col3\" class=\"data row156 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row156_col4\" class=\"data row156 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row156_col5\" class=\"data row156 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_0502a_row156_col6\" class=\"data row156 col6\" >{'title': {'type': 'str', 'default': 'Histogram of Scores'}, 'score_column': {'type': 'str', 'default': 'score'}}</td>\n",
-       "      <td id=\"T_0502a_row156_col7\" class=\"data row156 col7\" >['visualization', 'credit_risk', 'logistic_regression']</td>\n",
-       "      <td id=\"T_0502a_row156_col8\" class=\"data row156 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row157_col0\" class=\"data row157 col0\" >validmind.ongoing_monitoring.CalibrationCurveDrift</td>\n",
-       "      <td id=\"T_0502a_row157_col1\" class=\"data row157 col1\" >Calibration Curve Drift</td>\n",
-       "      <td id=\"T_0502a_row157_col2\" class=\"data row157 col2\" >Evaluates changes in probability calibration between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_0502a_row157_col3\" class=\"data row157 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row157_col4\" class=\"data row157 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row157_col5\" class=\"data row157 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row157_col6\" class=\"data row157 col6\" >{'n_bins': {'type': 'int', 'default': 10}, 'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
-       "      <td id=\"T_0502a_row157_col7\" class=\"data row157 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row157_col8\" class=\"data row157 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row158_col0\" class=\"data row158 col0\" >validmind.ongoing_monitoring.ClassDiscriminationDrift</td>\n",
-       "      <td id=\"T_0502a_row158_col1\" class=\"data row158 col1\" >Class Discrimination Drift</td>\n",
-       "      <td id=\"T_0502a_row158_col2\" class=\"data row158 col2\" >Compares classification discrimination metrics between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_0502a_row158_col3\" class=\"data row158 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row158_col4\" class=\"data row158 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row158_col5\" class=\"data row158 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row158_col6\" class=\"data row158 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
-       "      <td id=\"T_0502a_row158_col7\" class=\"data row158 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row158_col8\" class=\"data row158 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row159_col0\" class=\"data row159 col0\" >validmind.ongoing_monitoring.ClassImbalanceDrift</td>\n",
-       "      <td id=\"T_0502a_row159_col1\" class=\"data row159 col1\" >Class Imbalance Drift</td>\n",
-       "      <td id=\"T_0502a_row159_col2\" class=\"data row159 col2\" >Evaluates drift in class distribution between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_0502a_row159_col3\" class=\"data row159 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row159_col4\" class=\"data row159 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row159_col5\" class=\"data row159 col5\" >['datasets']</td>\n",
-       "      <td id=\"T_0502a_row159_col6\" class=\"data row159 col6\" >{'drift_pct_threshold': {'type': 'float', 'default': 5.0}, 'title': {'type': 'str', 'default': 'Class Distribution Drift'}}</td>\n",
-       "      <td id=\"T_0502a_row159_col7\" class=\"data row159 col7\" >['tabular_data', 'binary_classification', 'multiclass_classification']</td>\n",
-       "      <td id=\"T_0502a_row159_col8\" class=\"data row159 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row160_col0\" class=\"data row160 col0\" >validmind.ongoing_monitoring.ClassificationAccuracyDrift</td>\n",
-       "      <td id=\"T_0502a_row160_col1\" class=\"data row160 col1\" >Classification Accuracy Drift</td>\n",
-       "      <td id=\"T_0502a_row160_col2\" class=\"data row160 col2\" >Compares classification accuracy metrics between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_0502a_row160_col3\" class=\"data row160 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row160_col4\" class=\"data row160 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row160_col5\" class=\"data row160 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row160_col6\" class=\"data row160 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
-       "      <td id=\"T_0502a_row160_col7\" class=\"data row160 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row160_col8\" class=\"data row160 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row161_col0\" class=\"data row161 col0\" >validmind.ongoing_monitoring.ConfusionMatrixDrift</td>\n",
-       "      <td id=\"T_0502a_row161_col1\" class=\"data row161 col1\" >Confusion Matrix Drift</td>\n",
-       "      <td id=\"T_0502a_row161_col2\" class=\"data row161 col2\" >Compares confusion matrix metrics between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_0502a_row161_col3\" class=\"data row161 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row161_col4\" class=\"data row161 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row161_col5\" class=\"data row161 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row161_col6\" class=\"data row161 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
-       "      <td id=\"T_0502a_row161_col7\" class=\"data row161 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_0502a_row161_col8\" class=\"data row161 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row162_col0\" class=\"data row162 col0\" >validmind.ongoing_monitoring.CumulativePredictionProbabilitiesDrift</td>\n",
-       "      <td id=\"T_0502a_row162_col1\" class=\"data row162 col1\" >Cumulative Prediction Probabilities Drift</td>\n",
-       "      <td id=\"T_0502a_row162_col2\" class=\"data row162 col2\" >Compares cumulative prediction probability distributions between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_0502a_row162_col3\" class=\"data row162 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row162_col4\" class=\"data row162 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row162_col5\" class=\"data row162 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row162_col6\" class=\"data row162 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row162_col7\" class=\"data row162 col7\" >['visualization', 'credit_risk']</td>\n",
-       "      <td id=\"T_0502a_row162_col8\" class=\"data row162 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row163_col0\" class=\"data row163 col0\" >validmind.ongoing_monitoring.FeatureDrift</td>\n",
-       "      <td id=\"T_0502a_row163_col1\" class=\"data row163 col1\" >Feature Drift</td>\n",
-       "      <td id=\"T_0502a_row163_col2\" class=\"data row163 col2\" >Evaluates changes in feature distribution over time to identify potential model drift....</td>\n",
-       "      <td id=\"T_0502a_row163_col3\" class=\"data row163 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row163_col4\" class=\"data row163 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row163_col5\" class=\"data row163 col5\" >['datasets']</td>\n",
-       "      <td id=\"T_0502a_row163_col6\" class=\"data row163 col6\" >{'bins': {'type': '_empty', 'default': [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9]}, 'feature_columns': {'type': '_empty', 'default': None}, 'psi_threshold': {'type': '_empty', 'default': 0.2}}</td>\n",
-       "      <td id=\"T_0502a_row163_col7\" class=\"data row163 col7\" >['visualization']</td>\n",
-       "      <td id=\"T_0502a_row163_col8\" class=\"data row163 col8\" >['monitoring']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row164_col0\" class=\"data row164 col0\" >validmind.ongoing_monitoring.PredictionAcrossEachFeature</td>\n",
-       "      <td id=\"T_0502a_row164_col1\" class=\"data row164 col1\" >Prediction Across Each Feature</td>\n",
-       "      <td id=\"T_0502a_row164_col2\" class=\"data row164 col2\" >Assesses differences in model predictions across individual features between reference and monitoring datasets...</td>\n",
-       "      <td id=\"T_0502a_row164_col3\" class=\"data row164 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row164_col4\" class=\"data row164 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row164_col5\" class=\"data row164 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row164_col6\" class=\"data row164 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row164_col7\" class=\"data row164 col7\" >['visualization']</td>\n",
-       "      <td id=\"T_0502a_row164_col8\" class=\"data row164 col8\" >['monitoring']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row165_col0\" class=\"data row165 col0\" >validmind.ongoing_monitoring.PredictionCorrelation</td>\n",
-       "      <td id=\"T_0502a_row165_col1\" class=\"data row165 col1\" >Prediction Correlation</td>\n",
-       "      <td id=\"T_0502a_row165_col2\" class=\"data row165 col2\" >Assesses correlation changes between model predictions from reference and monitoring datasets to detect potential...</td>\n",
-       "      <td id=\"T_0502a_row165_col3\" class=\"data row165 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row165_col4\" class=\"data row165 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row165_col5\" class=\"data row165 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row165_col6\" class=\"data row165 col6\" >{'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
-       "      <td id=\"T_0502a_row165_col7\" class=\"data row165 col7\" >['visualization']</td>\n",
-       "      <td id=\"T_0502a_row165_col8\" class=\"data row165 col8\" >['monitoring']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row166_col0\" class=\"data row166 col0\" >validmind.ongoing_monitoring.PredictionProbabilitiesHistogramDrift</td>\n",
-       "      <td id=\"T_0502a_row166_col1\" class=\"data row166 col1\" >Prediction Probabilities Histogram Drift</td>\n",
-       "      <td id=\"T_0502a_row166_col2\" class=\"data row166 col2\" >Compares prediction probability distributions between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_0502a_row166_col3\" class=\"data row166 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row166_col4\" class=\"data row166 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row166_col5\" class=\"data row166 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row166_col6\" class=\"data row166 col6\" >{'title': {'type': '_empty', 'default': 'Prediction Probabilities Histogram Drift'}, 'drift_pct_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
-       "      <td id=\"T_0502a_row166_col7\" class=\"data row166 col7\" >['visualization', 'credit_risk']</td>\n",
-       "      <td id=\"T_0502a_row166_col8\" class=\"data row166 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row167_col0\" class=\"data row167 col0\" >validmind.ongoing_monitoring.PredictionQuantilesAcrossFeatures</td>\n",
-       "      <td id=\"T_0502a_row167_col1\" class=\"data row167 col1\" >Prediction Quantiles Across Features</td>\n",
-       "      <td id=\"T_0502a_row167_col2\" class=\"data row167 col2\" >Assesses differences in model prediction distributions across individual features between reference...</td>\n",
-       "      <td id=\"T_0502a_row167_col3\" class=\"data row167 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row167_col4\" class=\"data row167 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row167_col5\" class=\"data row167 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row167_col6\" class=\"data row167 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row167_col7\" class=\"data row167 col7\" >['visualization']</td>\n",
-       "      <td id=\"T_0502a_row167_col8\" class=\"data row167 col8\" >['monitoring']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row168_col0\" class=\"data row168 col0\" >validmind.ongoing_monitoring.ROCCurveDrift</td>\n",
-       "      <td id=\"T_0502a_row168_col1\" class=\"data row168 col1\" >ROC Curve Drift</td>\n",
-       "      <td id=\"T_0502a_row168_col2\" class=\"data row168 col2\" >Compares ROC curves between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_0502a_row168_col3\" class=\"data row168 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row168_col4\" class=\"data row168 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row168_col5\" class=\"data row168 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row168_col6\" class=\"data row168 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row168_col7\" class=\"data row168 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_0502a_row168_col8\" class=\"data row168 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row169_col0\" class=\"data row169 col0\" >validmind.ongoing_monitoring.ScoreBandsDrift</td>\n",
-       "      <td id=\"T_0502a_row169_col1\" class=\"data row169 col1\" >Score Bands Drift</td>\n",
-       "      <td id=\"T_0502a_row169_col2\" class=\"data row169 col2\" >Analyzes drift in population distribution and default rates across score bands....</td>\n",
-       "      <td id=\"T_0502a_row169_col3\" class=\"data row169 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row169_col4\" class=\"data row169 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row169_col5\" class=\"data row169 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row169_col6\" class=\"data row169 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'score_bands': {'type': 'list', 'default': None}, 'drift_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
-       "      <td id=\"T_0502a_row169_col7\" class=\"data row169 col7\" >['visualization', 'credit_risk', 'scorecard']</td>\n",
-       "      <td id=\"T_0502a_row169_col8\" class=\"data row169 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row170_col0\" class=\"data row170 col0\" >validmind.ongoing_monitoring.ScorecardHistogramDrift</td>\n",
-       "      <td id=\"T_0502a_row170_col1\" class=\"data row170 col1\" >Scorecard Histogram Drift</td>\n",
-       "      <td id=\"T_0502a_row170_col2\" class=\"data row170 col2\" >Compares score distributions between reference and monitoring datasets for each class....</td>\n",
-       "      <td id=\"T_0502a_row170_col3\" class=\"data row170 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row170_col4\" class=\"data row170 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row170_col5\" class=\"data row170 col5\" >['datasets']</td>\n",
-       "      <td id=\"T_0502a_row170_col6\" class=\"data row170 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'title': {'type': 'str', 'default': 'Scorecard Histogram Drift'}, 'drift_pct_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
-       "      <td id=\"T_0502a_row170_col7\" class=\"data row170 col7\" >['visualization', 'credit_risk', 'logistic_regression']</td>\n",
-       "      <td id=\"T_0502a_row170_col8\" class=\"data row170 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row171_col0\" class=\"data row171 col0\" >validmind.ongoing_monitoring.TargetPredictionDistributionPlot</td>\n",
-       "      <td id=\"T_0502a_row171_col1\" class=\"data row171 col1\" >Target Prediction Distribution Plot</td>\n",
-       "      <td id=\"T_0502a_row171_col2\" class=\"data row171 col2\" >Assesses differences in prediction distributions between a reference dataset and a monitoring dataset to identify...</td>\n",
-       "      <td id=\"T_0502a_row171_col3\" class=\"data row171 col3\" >True</td>\n",
-       "      <td id=\"T_0502a_row171_col4\" class=\"data row171 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row171_col5\" class=\"data row171 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_0502a_row171_col6\" class=\"data row171 col6\" >{'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
-       "      <td id=\"T_0502a_row171_col7\" class=\"data row171 col7\" >['visualization']</td>\n",
-       "      <td id=\"T_0502a_row171_col8\" class=\"data row171 col8\" >['monitoring']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row172_col0\" class=\"data row172 col0\" >validmind.prompt_validation.Bias</td>\n",
-       "      <td id=\"T_0502a_row172_col1\" class=\"data row172 col1\" >Bias</td>\n",
-       "      <td id=\"T_0502a_row172_col2\" class=\"data row172 col2\" >Assesses potential bias in a Large Language Model by analyzing the distribution and order of exemplars in the...</td>\n",
-       "      <td id=\"T_0502a_row172_col3\" class=\"data row172 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row172_col4\" class=\"data row172 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row172_col5\" class=\"data row172 col5\" >['model']</td>\n",
-       "      <td id=\"T_0502a_row172_col6\" class=\"data row172 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row172_col7\" class=\"data row172 col7\" >['llm', 'few_shot']</td>\n",
-       "      <td id=\"T_0502a_row172_col8\" class=\"data row172 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row173_col0\" class=\"data row173 col0\" >validmind.prompt_validation.Clarity</td>\n",
-       "      <td id=\"T_0502a_row173_col1\" class=\"data row173 col1\" >Clarity</td>\n",
-       "      <td id=\"T_0502a_row173_col2\" class=\"data row173 col2\" >Evaluates and scores the clarity of prompts in a Large Language Model based on specified guidelines....</td>\n",
-       "      <td id=\"T_0502a_row173_col3\" class=\"data row173 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row173_col4\" class=\"data row173 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row173_col5\" class=\"data row173 col5\" >['model']</td>\n",
-       "      <td id=\"T_0502a_row173_col6\" class=\"data row173 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row173_col7\" class=\"data row173 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
-       "      <td id=\"T_0502a_row173_col8\" class=\"data row173 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row174_col0\" class=\"data row174 col0\" >validmind.prompt_validation.Conciseness</td>\n",
-       "      <td id=\"T_0502a_row174_col1\" class=\"data row174 col1\" >Conciseness</td>\n",
-       "      <td id=\"T_0502a_row174_col2\" class=\"data row174 col2\" >Analyzes and grades the conciseness of prompts provided to a Large Language Model....</td>\n",
-       "      <td id=\"T_0502a_row174_col3\" class=\"data row174 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row174_col4\" class=\"data row174 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row174_col5\" class=\"data row174 col5\" >['model']</td>\n",
-       "      <td id=\"T_0502a_row174_col6\" class=\"data row174 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row174_col7\" class=\"data row174 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
-       "      <td id=\"T_0502a_row174_col8\" class=\"data row174 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row175_col0\" class=\"data row175 col0\" >validmind.prompt_validation.Delimitation</td>\n",
-       "      <td id=\"T_0502a_row175_col1\" class=\"data row175 col1\" >Delimitation</td>\n",
-       "      <td id=\"T_0502a_row175_col2\" class=\"data row175 col2\" >Evaluates the proper use of delimiters in prompts provided to Large Language Models....</td>\n",
-       "      <td id=\"T_0502a_row175_col3\" class=\"data row175 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row175_col4\" class=\"data row175 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row175_col5\" class=\"data row175 col5\" >['model']</td>\n",
-       "      <td id=\"T_0502a_row175_col6\" class=\"data row175 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row175_col7\" class=\"data row175 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
-       "      <td id=\"T_0502a_row175_col8\" class=\"data row175 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row176_col0\" class=\"data row176 col0\" >validmind.prompt_validation.NegativeInstruction</td>\n",
-       "      <td id=\"T_0502a_row176_col1\" class=\"data row176 col1\" >Negative Instruction</td>\n",
-       "      <td id=\"T_0502a_row176_col2\" class=\"data row176 col2\" >Evaluates and grades the use of affirmative, proactive language over negative instructions in LLM prompts....</td>\n",
-       "      <td id=\"T_0502a_row176_col3\" class=\"data row176 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row176_col4\" class=\"data row176 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row176_col5\" class=\"data row176 col5\" >['model']</td>\n",
-       "      <td id=\"T_0502a_row176_col6\" class=\"data row176 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row176_col7\" class=\"data row176 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
-       "      <td id=\"T_0502a_row176_col8\" class=\"data row176 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row177_col0\" class=\"data row177 col0\" >validmind.prompt_validation.Robustness</td>\n",
-       "      <td id=\"T_0502a_row177_col1\" class=\"data row177 col1\" >Robustness</td>\n",
-       "      <td id=\"T_0502a_row177_col2\" class=\"data row177 col2\" >Assesses the robustness of prompts provided to a Large Language Model under varying conditions and contexts. This test...</td>\n",
-       "      <td id=\"T_0502a_row177_col3\" class=\"data row177 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row177_col4\" class=\"data row177 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row177_col5\" class=\"data row177 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row177_col6\" class=\"data row177 col6\" >{'num_tests': {'type': '_empty', 'default': 10}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row177_col7\" class=\"data row177 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
-       "      <td id=\"T_0502a_row177_col8\" class=\"data row177 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row178_col0\" class=\"data row178 col0\" >validmind.prompt_validation.Specificity</td>\n",
-       "      <td id=\"T_0502a_row178_col1\" class=\"data row178 col1\" >Specificity</td>\n",
-       "      <td id=\"T_0502a_row178_col2\" class=\"data row178 col2\" >Evaluates and scores the specificity of prompts provided to a Large Language Model (LLM), based on clarity, detail,...</td>\n",
-       "      <td id=\"T_0502a_row178_col3\" class=\"data row178 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row178_col4\" class=\"data row178 col4\" >True</td>\n",
-       "      <td id=\"T_0502a_row178_col5\" class=\"data row178 col5\" >['model']</td>\n",
-       "      <td id=\"T_0502a_row178_col6\" class=\"data row178 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_0502a_row178_col7\" class=\"data row178 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
-       "      <td id=\"T_0502a_row178_col8\" class=\"data row178 col8\" >['text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row179_col0\" class=\"data row179 col0\" >validmind.unit_metrics.classification.Accuracy</td>\n",
-       "      <td id=\"T_0502a_row179_col1\" class=\"data row179 col1\" >Accuracy</td>\n",
-       "      <td id=\"T_0502a_row179_col2\" class=\"data row179 col2\" >Calculates the accuracy of a model</td>\n",
-       "      <td id=\"T_0502a_row179_col3\" class=\"data row179 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row179_col4\" class=\"data row179 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row179_col5\" class=\"data row179 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row179_col6\" class=\"data row179 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row179_col7\" class=\"data row179 col7\" >['classification']</td>\n",
-       "      <td id=\"T_0502a_row179_col8\" class=\"data row179 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row180_col0\" class=\"data row180 col0\" >validmind.unit_metrics.classification.F1</td>\n",
-       "      <td id=\"T_0502a_row180_col1\" class=\"data row180 col1\" >F1</td>\n",
-       "      <td id=\"T_0502a_row180_col2\" class=\"data row180 col2\" >Calculates the F1 score for a classification model.</td>\n",
-       "      <td id=\"T_0502a_row180_col3\" class=\"data row180 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row180_col4\" class=\"data row180 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row180_col5\" class=\"data row180 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row180_col6\" class=\"data row180 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row180_col7\" class=\"data row180 col7\" >['classification']</td>\n",
-       "      <td id=\"T_0502a_row180_col8\" class=\"data row180 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row181_col0\" class=\"data row181 col0\" >validmind.unit_metrics.classification.Precision</td>\n",
-       "      <td id=\"T_0502a_row181_col1\" class=\"data row181 col1\" >Precision</td>\n",
-       "      <td id=\"T_0502a_row181_col2\" class=\"data row181 col2\" >Calculates the precision for a classification model.</td>\n",
-       "      <td id=\"T_0502a_row181_col3\" class=\"data row181 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row181_col4\" class=\"data row181 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row181_col5\" class=\"data row181 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row181_col6\" class=\"data row181 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row181_col7\" class=\"data row181 col7\" >['classification']</td>\n",
-       "      <td id=\"T_0502a_row181_col8\" class=\"data row181 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row182_col0\" class=\"data row182 col0\" >validmind.unit_metrics.classification.ROC_AUC</td>\n",
-       "      <td id=\"T_0502a_row182_col1\" class=\"data row182 col1\" >ROC AUC</td>\n",
-       "      <td id=\"T_0502a_row182_col2\" class=\"data row182 col2\" >Calculates the ROC AUC for a classification model.</td>\n",
-       "      <td id=\"T_0502a_row182_col3\" class=\"data row182 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row182_col4\" class=\"data row182 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row182_col5\" class=\"data row182 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row182_col6\" class=\"data row182 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row182_col7\" class=\"data row182 col7\" >['classification']</td>\n",
-       "      <td id=\"T_0502a_row182_col8\" class=\"data row182 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row183_col0\" class=\"data row183 col0\" >validmind.unit_metrics.classification.Recall</td>\n",
-       "      <td id=\"T_0502a_row183_col1\" class=\"data row183 col1\" >Recall</td>\n",
-       "      <td id=\"T_0502a_row183_col2\" class=\"data row183 col2\" >Calculates the recall for a classification model.</td>\n",
-       "      <td id=\"T_0502a_row183_col3\" class=\"data row183 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row183_col4\" class=\"data row183 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row183_col5\" class=\"data row183 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row183_col6\" class=\"data row183 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row183_col7\" class=\"data row183 col7\" >['classification']</td>\n",
-       "      <td id=\"T_0502a_row183_col8\" class=\"data row183 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row184_col0\" class=\"data row184 col0\" >validmind.unit_metrics.regression.AdjustedRSquaredScore</td>\n",
-       "      <td id=\"T_0502a_row184_col1\" class=\"data row184 col1\" >Adjusted R Squared Score</td>\n",
-       "      <td id=\"T_0502a_row184_col2\" class=\"data row184 col2\" >Calculates the adjusted R-squared score for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row184_col3\" class=\"data row184 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row184_col4\" class=\"data row184 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row184_col5\" class=\"data row184 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row184_col6\" class=\"data row184 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row184_col7\" class=\"data row184 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row184_col8\" class=\"data row184 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row185_col0\" class=\"data row185 col0\" >validmind.unit_metrics.regression.GiniCoefficient</td>\n",
-       "      <td id=\"T_0502a_row185_col1\" class=\"data row185 col1\" >Gini Coefficient</td>\n",
-       "      <td id=\"T_0502a_row185_col2\" class=\"data row185 col2\" >Calculates the Gini coefficient for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row185_col3\" class=\"data row185 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row185_col4\" class=\"data row185 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row185_col5\" class=\"data row185 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row185_col6\" class=\"data row185 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row185_col7\" class=\"data row185 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row185_col8\" class=\"data row185 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row186_col0\" class=\"data row186 col0\" >validmind.unit_metrics.regression.HuberLoss</td>\n",
-       "      <td id=\"T_0502a_row186_col1\" class=\"data row186 col1\" >Huber Loss</td>\n",
-       "      <td id=\"T_0502a_row186_col2\" class=\"data row186 col2\" >Calculates the Huber loss for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row186_col3\" class=\"data row186 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row186_col4\" class=\"data row186 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row186_col5\" class=\"data row186 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row186_col6\" class=\"data row186 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row186_col7\" class=\"data row186 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row186_col8\" class=\"data row186 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row187_col0\" class=\"data row187 col0\" >validmind.unit_metrics.regression.KolmogorovSmirnovStatistic</td>\n",
-       "      <td id=\"T_0502a_row187_col1\" class=\"data row187 col1\" >Kolmogorov Smirnov Statistic</td>\n",
-       "      <td id=\"T_0502a_row187_col2\" class=\"data row187 col2\" >Calculates the Kolmogorov-Smirnov statistic for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row187_col3\" class=\"data row187 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row187_col4\" class=\"data row187 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row187_col5\" class=\"data row187 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_0502a_row187_col6\" class=\"data row187 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row187_col7\" class=\"data row187 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row187_col8\" class=\"data row187 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row188_col0\" class=\"data row188 col0\" >validmind.unit_metrics.regression.MeanAbsoluteError</td>\n",
-       "      <td id=\"T_0502a_row188_col1\" class=\"data row188 col1\" >Mean Absolute Error</td>\n",
-       "      <td id=\"T_0502a_row188_col2\" class=\"data row188 col2\" >Calculates the mean absolute error for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row188_col3\" class=\"data row188 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row188_col4\" class=\"data row188 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row188_col5\" class=\"data row188 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row188_col6\" class=\"data row188 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row188_col7\" class=\"data row188 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row188_col8\" class=\"data row188 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row189_col0\" class=\"data row189 col0\" >validmind.unit_metrics.regression.MeanAbsolutePercentageError</td>\n",
-       "      <td id=\"T_0502a_row189_col1\" class=\"data row189 col1\" >Mean Absolute Percentage Error</td>\n",
-       "      <td id=\"T_0502a_row189_col2\" class=\"data row189 col2\" >Calculates the mean absolute percentage error for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row189_col3\" class=\"data row189 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row189_col4\" class=\"data row189 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row189_col5\" class=\"data row189 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row189_col6\" class=\"data row189 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row189_col7\" class=\"data row189 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row189_col8\" class=\"data row189 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row190_col0\" class=\"data row190 col0\" >validmind.unit_metrics.regression.MeanBiasDeviation</td>\n",
-       "      <td id=\"T_0502a_row190_col1\" class=\"data row190 col1\" >Mean Bias Deviation</td>\n",
-       "      <td id=\"T_0502a_row190_col2\" class=\"data row190 col2\" >Calculates the mean bias deviation for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row190_col3\" class=\"data row190 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row190_col4\" class=\"data row190 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row190_col5\" class=\"data row190 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row190_col6\" class=\"data row190 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row190_col7\" class=\"data row190 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row190_col8\" class=\"data row190 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row191_col0\" class=\"data row191 col0\" >validmind.unit_metrics.regression.MeanSquaredError</td>\n",
-       "      <td id=\"T_0502a_row191_col1\" class=\"data row191 col1\" >Mean Squared Error</td>\n",
-       "      <td id=\"T_0502a_row191_col2\" class=\"data row191 col2\" >Calculates the mean squared error for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row191_col3\" class=\"data row191 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row191_col4\" class=\"data row191 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row191_col5\" class=\"data row191 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row191_col6\" class=\"data row191 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row191_col7\" class=\"data row191 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row191_col8\" class=\"data row191 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row192_col0\" class=\"data row192 col0\" >validmind.unit_metrics.regression.QuantileLoss</td>\n",
-       "      <td id=\"T_0502a_row192_col1\" class=\"data row192 col1\" >Quantile Loss</td>\n",
-       "      <td id=\"T_0502a_row192_col2\" class=\"data row192 col2\" >Calculates the quantile loss for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row192_col3\" class=\"data row192 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row192_col4\" class=\"data row192 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row192_col5\" class=\"data row192 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row192_col6\" class=\"data row192 col6\" >{'quantile': {'type': '_empty', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_0502a_row192_col7\" class=\"data row192 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row192_col8\" class=\"data row192 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row193_col0\" class=\"data row193 col0\" >validmind.unit_metrics.regression.RSquaredScore</td>\n",
-       "      <td id=\"T_0502a_row193_col1\" class=\"data row193 col1\" >R Squared Score</td>\n",
-       "      <td id=\"T_0502a_row193_col2\" class=\"data row193 col2\" >Calculates the R-squared score for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row193_col3\" class=\"data row193 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row193_col4\" class=\"data row193 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row193_col5\" class=\"data row193 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row193_col6\" class=\"data row193 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row193_col7\" class=\"data row193 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row193_col8\" class=\"data row193 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_0502a_row194_col0\" class=\"data row194 col0\" >validmind.unit_metrics.regression.RootMeanSquaredError</td>\n",
-       "      <td id=\"T_0502a_row194_col1\" class=\"data row194 col1\" >Root Mean Squared Error</td>\n",
-       "      <td id=\"T_0502a_row194_col2\" class=\"data row194 col2\" >Calculates the root mean squared error for a regression model.</td>\n",
-       "      <td id=\"T_0502a_row194_col3\" class=\"data row194 col3\" >False</td>\n",
-       "      <td id=\"T_0502a_row194_col4\" class=\"data row194 col4\" >False</td>\n",
-       "      <td id=\"T_0502a_row194_col5\" class=\"data row194 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_0502a_row194_col6\" class=\"data row194 col6\" >{}</td>\n",
-       "      <td id=\"T_0502a_row194_col7\" class=\"data row194 col7\" >['regression']</td>\n",
-       "      <td id=\"T_0502a_row194_col8\" class=\"data row194 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n"
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from validmind.tests import (\n",
+        "    list_tests,\n",
+        "    list_tasks,\n",
+        "    list_tags,\n",
+        "    list_tasks_and_tags,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Use [list_tests()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to retrieve all available ValidMind tests. It returns a DataFrame that includes the following columns:\n",
+        "\n",
+        "- **ID** – A unique identifier for each test.\n",
+        "- **Name** – The test’s name.\n",
+        "- **Description** – A short summary of what the test evaluates.\n",
+        "- **Tags** – Keywords that describe what the test does or applies to.\n",
+        "- **Tasks** – The type of modeling task the test supports."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [
+        {
+          "data": {
+            "text/html": [
+              "<style type=\"text/css\">\n",
+              "#T_0502a th {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "#T_0502a_row0_col0, #T_0502a_row0_col1, #T_0502a_row0_col2, #T_0502a_row0_col3, #T_0502a_row0_col4, #T_0502a_row0_col5, #T_0502a_row0_col6, #T_0502a_row0_col7, #T_0502a_row0_col8, #T_0502a_row1_col0, #T_0502a_row1_col1, #T_0502a_row1_col2, #T_0502a_row1_col3, #T_0502a_row1_col4, #T_0502a_row1_col5, #T_0502a_row1_col6, #T_0502a_row1_col7, #T_0502a_row1_col8, #T_0502a_row2_col0, #T_0502a_row2_col1, #T_0502a_row2_col2, #T_0502a_row2_col3, #T_0502a_row2_col4, #T_0502a_row2_col5, #T_0502a_row2_col6, #T_0502a_row2_col7, #T_0502a_row2_col8, #T_0502a_row3_col0, #T_0502a_row3_col1, #T_0502a_row3_col2, #T_0502a_row3_col3, #T_0502a_row3_col4, #T_0502a_row3_col5, #T_0502a_row3_col6, #T_0502a_row3_col7, #T_0502a_row3_col8, #T_0502a_row4_col0, #T_0502a_row4_col1, #T_0502a_row4_col2, #T_0502a_row4_col3, #T_0502a_row4_col4, #T_0502a_row4_col5, #T_0502a_row4_col6, #T_0502a_row4_col7, #T_0502a_row4_col8, #T_0502a_row5_col0, #T_0502a_row5_col1, #T_0502a_row5_col2, #T_0502a_row5_col3, #T_0502a_row5_col4, #T_0502a_row5_col5, #T_0502a_row5_col6, #T_0502a_row5_col7, #T_0502a_row5_col8, #T_0502a_row6_col0, #T_0502a_row6_col1, #T_0502a_row6_col2, #T_0502a_row6_col3, #T_0502a_row6_col4, #T_0502a_row6_col5, #T_0502a_row6_col6, #T_0502a_row6_col7, #T_0502a_row6_col8, #T_0502a_row7_col0, #T_0502a_row7_col1, #T_0502a_row7_col2, #T_0502a_row7_col3, #T_0502a_row7_col4, #T_0502a_row7_col5, #T_0502a_row7_col6, #T_0502a_row7_col7, #T_0502a_row7_col8, #T_0502a_row8_col0, #T_0502a_row8_col1, #T_0502a_row8_col2, #T_0502a_row8_col3, #T_0502a_row8_col4, #T_0502a_row8_col5, #T_0502a_row8_col6, #T_0502a_row8_col7, #T_0502a_row8_col8, #T_0502a_row9_col0, #T_0502a_row9_col1, #T_0502a_row9_col2, #T_0502a_row9_col3, #T_0502a_row9_col4, #T_0502a_row9_col5, #T_0502a_row9_col6, #T_0502a_row9_col7, #T_0502a_row9_col8, #T_0502a_row10_col0, #T_0502a_row10_col1, #T_0502a_row10_col2, #T_0502a_row10_col3, #T_0502a_row10_col4, #T_0502a_row10_col5, #T_0502a_row10_col6, #T_0502a_row10_col7, 
#T_0502a_row10_col8, #T_0502a_row11_col0, #T_0502a_row11_col1, #T_0502a_row11_col2, #T_0502a_row11_col3, #T_0502a_row11_col4, #T_0502a_row11_col5, #T_0502a_row11_col6, #T_0502a_row11_col7, #T_0502a_row11_col8, #T_0502a_row12_col0, #T_0502a_row12_col1, #T_0502a_row12_col2, #T_0502a_row12_col3, #T_0502a_row12_col4, #T_0502a_row12_col5, #T_0502a_row12_col6, #T_0502a_row12_col7, #T_0502a_row12_col8, #T_0502a_row13_col0, #T_0502a_row13_col1, #T_0502a_row13_col2, #T_0502a_row13_col3, #T_0502a_row13_col4, #T_0502a_row13_col5, #T_0502a_row13_col6, #T_0502a_row13_col7, #T_0502a_row13_col8, #T_0502a_row14_col0, #T_0502a_row14_col1, #T_0502a_row14_col2, #T_0502a_row14_col3, #T_0502a_row14_col4, #T_0502a_row14_col5, #T_0502a_row14_col6, #T_0502a_row14_col7, #T_0502a_row14_col8, #T_0502a_row15_col0, #T_0502a_row15_col1, #T_0502a_row15_col2, #T_0502a_row15_col3, #T_0502a_row15_col4, #T_0502a_row15_col5, #T_0502a_row15_col6, #T_0502a_row15_col7, #T_0502a_row15_col8, #T_0502a_row16_col0, #T_0502a_row16_col1, #T_0502a_row16_col2, #T_0502a_row16_col3, #T_0502a_row16_col4, #T_0502a_row16_col5, #T_0502a_row16_col6, #T_0502a_row16_col7, #T_0502a_row16_col8, #T_0502a_row17_col0, #T_0502a_row17_col1, #T_0502a_row17_col2, #T_0502a_row17_col3, #T_0502a_row17_col4, #T_0502a_row17_col5, #T_0502a_row17_col6, #T_0502a_row17_col7, #T_0502a_row17_col8, #T_0502a_row18_col0, #T_0502a_row18_col1, #T_0502a_row18_col2, #T_0502a_row18_col3, #T_0502a_row18_col4, #T_0502a_row18_col5, #T_0502a_row18_col6, #T_0502a_row18_col7, #T_0502a_row18_col8, #T_0502a_row19_col0, #T_0502a_row19_col1, #T_0502a_row19_col2, #T_0502a_row19_col3, #T_0502a_row19_col4, #T_0502a_row19_col5, #T_0502a_row19_col6, #T_0502a_row19_col7, #T_0502a_row19_col8, #T_0502a_row20_col0, #T_0502a_row20_col1, #T_0502a_row20_col2, #T_0502a_row20_col3, #T_0502a_row20_col4, #T_0502a_row20_col5, #T_0502a_row20_col6, #T_0502a_row20_col7, #T_0502a_row20_col8, #T_0502a_row21_col0, #T_0502a_row21_col1, #T_0502a_row21_col2, #T_0502a_row21_col3, 
#T_0502a_row21_col4, #T_0502a_row21_col5, #T_0502a_row21_col6, #T_0502a_row21_col7, #T_0502a_row21_col8, #T_0502a_row22_col0, #T_0502a_row22_col1, #T_0502a_row22_col2, #T_0502a_row22_col3, #T_0502a_row22_col4, #T_0502a_row22_col5, #T_0502a_row22_col6, #T_0502a_row22_col7, #T_0502a_row22_col8, #T_0502a_row23_col0, #T_0502a_row23_col1, #T_0502a_row23_col2, #T_0502a_row23_col3, #T_0502a_row23_col4, #T_0502a_row23_col5, #T_0502a_row23_col6, #T_0502a_row23_col7, #T_0502a_row23_col8, #T_0502a_row24_col0, #T_0502a_row24_col1, #T_0502a_row24_col2, #T_0502a_row24_col3, #T_0502a_row24_col4, #T_0502a_row24_col5, #T_0502a_row24_col6, #T_0502a_row24_col7, #T_0502a_row24_col8, #T_0502a_row25_col0, #T_0502a_row25_col1, #T_0502a_row25_col2, #T_0502a_row25_col3, #T_0502a_row25_col4, #T_0502a_row25_col5, #T_0502a_row25_col6, #T_0502a_row25_col7, #T_0502a_row25_col8, #T_0502a_row26_col0, #T_0502a_row26_col1, #T_0502a_row26_col2, #T_0502a_row26_col3, #T_0502a_row26_col4, #T_0502a_row26_col5, #T_0502a_row26_col6, #T_0502a_row26_col7, #T_0502a_row26_col8, #T_0502a_row27_col0, #T_0502a_row27_col1, #T_0502a_row27_col2, #T_0502a_row27_col3, #T_0502a_row27_col4, #T_0502a_row27_col5, #T_0502a_row27_col6, #T_0502a_row27_col7, #T_0502a_row27_col8, #T_0502a_row28_col0, #T_0502a_row28_col1, #T_0502a_row28_col2, #T_0502a_row28_col3, #T_0502a_row28_col4, #T_0502a_row28_col5, #T_0502a_row28_col6, #T_0502a_row28_col7, #T_0502a_row28_col8, #T_0502a_row29_col0, #T_0502a_row29_col1, #T_0502a_row29_col2, #T_0502a_row29_col3, #T_0502a_row29_col4, #T_0502a_row29_col5, #T_0502a_row29_col6, #T_0502a_row29_col7, #T_0502a_row29_col8, #T_0502a_row30_col0, #T_0502a_row30_col1, #T_0502a_row30_col2, #T_0502a_row30_col3, #T_0502a_row30_col4, #T_0502a_row30_col5, #T_0502a_row30_col6, #T_0502a_row30_col7, #T_0502a_row30_col8, #T_0502a_row31_col0, #T_0502a_row31_col1, #T_0502a_row31_col2, #T_0502a_row31_col3, #T_0502a_row31_col4, #T_0502a_row31_col5, #T_0502a_row31_col6, #T_0502a_row31_col7, #T_0502a_row31_col8, 
#T_0502a_row32_col0, #T_0502a_row32_col1, #T_0502a_row32_col2, #T_0502a_row32_col3, #T_0502a_row32_col4, #T_0502a_row32_col5, #T_0502a_row32_col6, #T_0502a_row32_col7, #T_0502a_row32_col8, #T_0502a_row33_col0, #T_0502a_row33_col1, #T_0502a_row33_col2, #T_0502a_row33_col3, #T_0502a_row33_col4, #T_0502a_row33_col5, #T_0502a_row33_col6, #T_0502a_row33_col7, #T_0502a_row33_col8, #T_0502a_row34_col0, #T_0502a_row34_col1, #T_0502a_row34_col2, #T_0502a_row34_col3, #T_0502a_row34_col4, #T_0502a_row34_col5, #T_0502a_row34_col6, #T_0502a_row34_col7, #T_0502a_row34_col8, #T_0502a_row35_col0, #T_0502a_row35_col1, #T_0502a_row35_col2, #T_0502a_row35_col3, #T_0502a_row35_col4, #T_0502a_row35_col5, #T_0502a_row35_col6, #T_0502a_row35_col7, #T_0502a_row35_col8, #T_0502a_row36_col0, #T_0502a_row36_col1, #T_0502a_row36_col2, #T_0502a_row36_col3, #T_0502a_row36_col4, #T_0502a_row36_col5, #T_0502a_row36_col6, #T_0502a_row36_col7, #T_0502a_row36_col8, #T_0502a_row37_col0, #T_0502a_row37_col1, #T_0502a_row37_col2, #T_0502a_row37_col3, #T_0502a_row37_col4, #T_0502a_row37_col5, #T_0502a_row37_col6, #T_0502a_row37_col7, #T_0502a_row37_col8, #T_0502a_row38_col0, #T_0502a_row38_col1, #T_0502a_row38_col2, #T_0502a_row38_col3, #T_0502a_row38_col4, #T_0502a_row38_col5, #T_0502a_row38_col6, #T_0502a_row38_col7, #T_0502a_row38_col8, #T_0502a_row39_col0, #T_0502a_row39_col1, #T_0502a_row39_col2, #T_0502a_row39_col3, #T_0502a_row39_col4, #T_0502a_row39_col5, #T_0502a_row39_col6, #T_0502a_row39_col7, #T_0502a_row39_col8, #T_0502a_row40_col0, #T_0502a_row40_col1, #T_0502a_row40_col2, #T_0502a_row40_col3, #T_0502a_row40_col4, #T_0502a_row40_col5, #T_0502a_row40_col6, #T_0502a_row40_col7, #T_0502a_row40_col8, #T_0502a_row41_col0, #T_0502a_row41_col1, #T_0502a_row41_col2, #T_0502a_row41_col3, #T_0502a_row41_col4, #T_0502a_row41_col5, #T_0502a_row41_col6, #T_0502a_row41_col7, #T_0502a_row41_col8, #T_0502a_row42_col0, #T_0502a_row42_col1, #T_0502a_row42_col2, #T_0502a_row42_col3, #T_0502a_row42_col4, 
#T_0502a_row42_col5, #T_0502a_row42_col6, #T_0502a_row42_col7, #T_0502a_row42_col8, #T_0502a_row43_col0, #T_0502a_row43_col1, #T_0502a_row43_col2, #T_0502a_row43_col3, #T_0502a_row43_col4, #T_0502a_row43_col5, #T_0502a_row43_col6, #T_0502a_row43_col7, #T_0502a_row43_col8, #T_0502a_row44_col0, #T_0502a_row44_col1, #T_0502a_row44_col2, #T_0502a_row44_col3, #T_0502a_row44_col4, #T_0502a_row44_col5, #T_0502a_row44_col6, #T_0502a_row44_col7, #T_0502a_row44_col8, #T_0502a_row45_col0, #T_0502a_row45_col1, #T_0502a_row45_col2, #T_0502a_row45_col3, #T_0502a_row45_col4, #T_0502a_row45_col5, #T_0502a_row45_col6, #T_0502a_row45_col7, #T_0502a_row45_col8, #T_0502a_row46_col0, #T_0502a_row46_col1, #T_0502a_row46_col2, #T_0502a_row46_col3, #T_0502a_row46_col4, #T_0502a_row46_col5, #T_0502a_row46_col6, #T_0502a_row46_col7, #T_0502a_row46_col8, #T_0502a_row47_col0, #T_0502a_row47_col1, #T_0502a_row47_col2, #T_0502a_row47_col3, #T_0502a_row47_col4, #T_0502a_row47_col5, #T_0502a_row47_col6, #T_0502a_row47_col7, #T_0502a_row47_col8, #T_0502a_row48_col0, #T_0502a_row48_col1, #T_0502a_row48_col2, #T_0502a_row48_col3, #T_0502a_row48_col4, #T_0502a_row48_col5, #T_0502a_row48_col6, #T_0502a_row48_col7, #T_0502a_row48_col8, #T_0502a_row49_col0, #T_0502a_row49_col1, #T_0502a_row49_col2, #T_0502a_row49_col3, #T_0502a_row49_col4, #T_0502a_row49_col5, #T_0502a_row49_col6, #T_0502a_row49_col7, #T_0502a_row49_col8, #T_0502a_row50_col0, #T_0502a_row50_col1, #T_0502a_row50_col2, #T_0502a_row50_col3, #T_0502a_row50_col4, #T_0502a_row50_col5, #T_0502a_row50_col6, #T_0502a_row50_col7, #T_0502a_row50_col8, #T_0502a_row51_col0, #T_0502a_row51_col1, #T_0502a_row51_col2, #T_0502a_row51_col3, #T_0502a_row51_col4, #T_0502a_row51_col5, #T_0502a_row51_col6, #T_0502a_row51_col7, #T_0502a_row51_col8, #T_0502a_row52_col0, #T_0502a_row52_col1, #T_0502a_row52_col2, #T_0502a_row52_col3, #T_0502a_row52_col4, #T_0502a_row52_col5, #T_0502a_row52_col6, #T_0502a_row52_col7, #T_0502a_row52_col8, #T_0502a_row53_col0, 
#T_0502a_row53_col1, #T_0502a_row53_col2, #T_0502a_row53_col3, #T_0502a_row53_col4, #T_0502a_row53_col5, #T_0502a_row53_col6, #T_0502a_row53_col7, #T_0502a_row53_col8, #T_0502a_row54_col0, #T_0502a_row54_col1, #T_0502a_row54_col2, #T_0502a_row54_col3, #T_0502a_row54_col4, #T_0502a_row54_col5, #T_0502a_row54_col6, #T_0502a_row54_col7, #T_0502a_row54_col8, #T_0502a_row55_col0, #T_0502a_row55_col1, #T_0502a_row55_col2, #T_0502a_row55_col3, #T_0502a_row55_col4, #T_0502a_row55_col5, #T_0502a_row55_col6, #T_0502a_row55_col7, #T_0502a_row55_col8, #T_0502a_row56_col0, #T_0502a_row56_col1, #T_0502a_row56_col2, #T_0502a_row56_col3, #T_0502a_row56_col4, #T_0502a_row56_col5, #T_0502a_row56_col6, #T_0502a_row56_col7, #T_0502a_row56_col8, #T_0502a_row57_col0, #T_0502a_row57_col1, #T_0502a_row57_col2, #T_0502a_row57_col3, #T_0502a_row57_col4, #T_0502a_row57_col5, #T_0502a_row57_col6, #T_0502a_row57_col7, #T_0502a_row57_col8, #T_0502a_row58_col0, #T_0502a_row58_col1, #T_0502a_row58_col2, #T_0502a_row58_col3, #T_0502a_row58_col4, #T_0502a_row58_col5, #T_0502a_row58_col6, #T_0502a_row58_col7, #T_0502a_row58_col8, #T_0502a_row59_col0, #T_0502a_row59_col1, #T_0502a_row59_col2, #T_0502a_row59_col3, #T_0502a_row59_col4, #T_0502a_row59_col5, #T_0502a_row59_col6, #T_0502a_row59_col7, #T_0502a_row59_col8, #T_0502a_row60_col0, #T_0502a_row60_col1, #T_0502a_row60_col2, #T_0502a_row60_col3, #T_0502a_row60_col4, #T_0502a_row60_col5, #T_0502a_row60_col6, #T_0502a_row60_col7, #T_0502a_row60_col8, #T_0502a_row61_col0, #T_0502a_row61_col1, #T_0502a_row61_col2, #T_0502a_row61_col3, #T_0502a_row61_col4, #T_0502a_row61_col5, #T_0502a_row61_col6, #T_0502a_row61_col7, #T_0502a_row61_col8, #T_0502a_row62_col0, #T_0502a_row62_col1, #T_0502a_row62_col2, #T_0502a_row62_col3, #T_0502a_row62_col4, #T_0502a_row62_col5, #T_0502a_row62_col6, #T_0502a_row62_col7, #T_0502a_row62_col8, #T_0502a_row63_col0, #T_0502a_row63_col1, #T_0502a_row63_col2, #T_0502a_row63_col3, #T_0502a_row63_col4, #T_0502a_row63_col5, 
#T_0502a_row63_col6, #T_0502a_row63_col7, #T_0502a_row63_col8, #T_0502a_row64_col0, #T_0502a_row64_col1, #T_0502a_row64_col2, #T_0502a_row64_col3, #T_0502a_row64_col4, #T_0502a_row64_col5, #T_0502a_row64_col6, #T_0502a_row64_col7, #T_0502a_row64_col8, #T_0502a_row65_col0, #T_0502a_row65_col1, #T_0502a_row65_col2, #T_0502a_row65_col3, #T_0502a_row65_col4, #T_0502a_row65_col5, #T_0502a_row65_col6, #T_0502a_row65_col7, #T_0502a_row65_col8, #T_0502a_row66_col0, #T_0502a_row66_col1, #T_0502a_row66_col2, #T_0502a_row66_col3, #T_0502a_row66_col4, #T_0502a_row66_col5, #T_0502a_row66_col6, #T_0502a_row66_col7, #T_0502a_row66_col8, #T_0502a_row67_col0, #T_0502a_row67_col1, #T_0502a_row67_col2, #T_0502a_row67_col3, #T_0502a_row67_col4, #T_0502a_row67_col5, #T_0502a_row67_col6, #T_0502a_row67_col7, #T_0502a_row67_col8, #T_0502a_row68_col0, #T_0502a_row68_col1, #T_0502a_row68_col2, #T_0502a_row68_col3, #T_0502a_row68_col4, #T_0502a_row68_col5, #T_0502a_row68_col6, #T_0502a_row68_col7, #T_0502a_row68_col8, #T_0502a_row69_col0, #T_0502a_row69_col1, #T_0502a_row69_col2, #T_0502a_row69_col3, #T_0502a_row69_col4, #T_0502a_row69_col5, #T_0502a_row69_col6, #T_0502a_row69_col7, #T_0502a_row69_col8, #T_0502a_row70_col0, #T_0502a_row70_col1, #T_0502a_row70_col2, #T_0502a_row70_col3, #T_0502a_row70_col4, #T_0502a_row70_col5, #T_0502a_row70_col6, #T_0502a_row70_col7, #T_0502a_row70_col8, #T_0502a_row71_col0, #T_0502a_row71_col1, #T_0502a_row71_col2, #T_0502a_row71_col3, #T_0502a_row71_col4, #T_0502a_row71_col5, #T_0502a_row71_col6, #T_0502a_row71_col7, #T_0502a_row71_col8, #T_0502a_row72_col0, #T_0502a_row72_col1, #T_0502a_row72_col2, #T_0502a_row72_col3, #T_0502a_row72_col4, #T_0502a_row72_col5, #T_0502a_row72_col6, #T_0502a_row72_col7, #T_0502a_row72_col8, #T_0502a_row73_col0, #T_0502a_row73_col1, #T_0502a_row73_col2, #T_0502a_row73_col3, #T_0502a_row73_col4, #T_0502a_row73_col5, #T_0502a_row73_col6, #T_0502a_row73_col7, #T_0502a_row73_col8, #T_0502a_row74_col0, #T_0502a_row74_col1, 
#T_0502a_row74_col2, #T_0502a_row74_col3, #T_0502a_row74_col4, #T_0502a_row74_col5, #T_0502a_row74_col6, #T_0502a_row74_col7, #T_0502a_row74_col8, #T_0502a_row75_col0, #T_0502a_row75_col1, #T_0502a_row75_col2, #T_0502a_row75_col3, #T_0502a_row75_col4, #T_0502a_row75_col5, #T_0502a_row75_col6, #T_0502a_row75_col7, #T_0502a_row75_col8, #T_0502a_row76_col0, #T_0502a_row76_col1, #T_0502a_row76_col2, #T_0502a_row76_col3, #T_0502a_row76_col4, #T_0502a_row76_col5, #T_0502a_row76_col6, #T_0502a_row76_col7, #T_0502a_row76_col8, #T_0502a_row77_col0, #T_0502a_row77_col1, #T_0502a_row77_col2, #T_0502a_row77_col3, #T_0502a_row77_col4, #T_0502a_row77_col5, #T_0502a_row77_col6, #T_0502a_row77_col7, #T_0502a_row77_col8, #T_0502a_row78_col0, #T_0502a_row78_col1, #T_0502a_row78_col2, #T_0502a_row78_col3, #T_0502a_row78_col4, #T_0502a_row78_col5, #T_0502a_row78_col6, #T_0502a_row78_col7, #T_0502a_row78_col8, #T_0502a_row79_col0, #T_0502a_row79_col1, #T_0502a_row79_col2, #T_0502a_row79_col3, #T_0502a_row79_col4, #T_0502a_row79_col5, #T_0502a_row79_col6, #T_0502a_row79_col7, #T_0502a_row79_col8, #T_0502a_row80_col0, #T_0502a_row80_col1, #T_0502a_row80_col2, #T_0502a_row80_col3, #T_0502a_row80_col4, #T_0502a_row80_col5, #T_0502a_row80_col6, #T_0502a_row80_col7, #T_0502a_row80_col8, #T_0502a_row81_col0, #T_0502a_row81_col1, #T_0502a_row81_col2, #T_0502a_row81_col3, #T_0502a_row81_col4, #T_0502a_row81_col5, #T_0502a_row81_col6, #T_0502a_row81_col7, #T_0502a_row81_col8, #T_0502a_row82_col0, #T_0502a_row82_col1, #T_0502a_row82_col2, #T_0502a_row82_col3, #T_0502a_row82_col4, #T_0502a_row82_col5, #T_0502a_row82_col6, #T_0502a_row82_col7, #T_0502a_row82_col8, #T_0502a_row83_col0, #T_0502a_row83_col1, #T_0502a_row83_col2, #T_0502a_row83_col3, #T_0502a_row83_col4, #T_0502a_row83_col5, #T_0502a_row83_col6, #T_0502a_row83_col7, #T_0502a_row83_col8, #T_0502a_row84_col0, #T_0502a_row84_col1, #T_0502a_row84_col2, #T_0502a_row84_col3, #T_0502a_row84_col4, #T_0502a_row84_col5, #T_0502a_row84_col6, 
#T_0502a_row84_col7, #T_0502a_row84_col8, #T_0502a_row85_col0, #T_0502a_row85_col1, #T_0502a_row85_col2, #T_0502a_row85_col3, #T_0502a_row85_col4, #T_0502a_row85_col5, #T_0502a_row85_col6, #T_0502a_row85_col7, #T_0502a_row85_col8, #T_0502a_row86_col0, #T_0502a_row86_col1, #T_0502a_row86_col2, #T_0502a_row86_col3, #T_0502a_row86_col4, #T_0502a_row86_col5, #T_0502a_row86_col6, #T_0502a_row86_col7, #T_0502a_row86_col8, #T_0502a_row87_col0, #T_0502a_row87_col1, #T_0502a_row87_col2, #T_0502a_row87_col3, #T_0502a_row87_col4, #T_0502a_row87_col5, #T_0502a_row87_col6, #T_0502a_row87_col7, #T_0502a_row87_col8, #T_0502a_row88_col0, #T_0502a_row88_col1, #T_0502a_row88_col2, #T_0502a_row88_col3, #T_0502a_row88_col4, #T_0502a_row88_col5, #T_0502a_row88_col6, #T_0502a_row88_col7, #T_0502a_row88_col8, #T_0502a_row89_col0, #T_0502a_row89_col1, #T_0502a_row89_col2, #T_0502a_row89_col3, #T_0502a_row89_col4, #T_0502a_row89_col5, #T_0502a_row89_col6, #T_0502a_row89_col7, #T_0502a_row89_col8, #T_0502a_row90_col0, #T_0502a_row90_col1, #T_0502a_row90_col2, #T_0502a_row90_col3, #T_0502a_row90_col4, #T_0502a_row90_col5, #T_0502a_row90_col6, #T_0502a_row90_col7, #T_0502a_row90_col8, #T_0502a_row91_col0, #T_0502a_row91_col1, #T_0502a_row91_col2, #T_0502a_row91_col3, #T_0502a_row91_col4, #T_0502a_row91_col5, #T_0502a_row91_col6, #T_0502a_row91_col7, #T_0502a_row91_col8, #T_0502a_row92_col0, #T_0502a_row92_col1, #T_0502a_row92_col2, #T_0502a_row92_col3, #T_0502a_row92_col4, #T_0502a_row92_col5, #T_0502a_row92_col6, #T_0502a_row92_col7, #T_0502a_row92_col8, #T_0502a_row93_col0, #T_0502a_row93_col1, #T_0502a_row93_col2, #T_0502a_row93_col3, #T_0502a_row93_col4, #T_0502a_row93_col5, #T_0502a_row93_col6, #T_0502a_row93_col7, #T_0502a_row93_col8, #T_0502a_row94_col0, #T_0502a_row94_col1, #T_0502a_row94_col2, #T_0502a_row94_col3, #T_0502a_row94_col4, #T_0502a_row94_col5, #T_0502a_row94_col6, #T_0502a_row94_col7, #T_0502a_row94_col8, #T_0502a_row95_col0, #T_0502a_row95_col1, #T_0502a_row95_col2, 
#T_0502a_row95_col3, #T_0502a_row95_col4, #T_0502a_row95_col5, #T_0502a_row95_col6, #T_0502a_row95_col7, #T_0502a_row95_col8, #T_0502a_row96_col0, #T_0502a_row96_col1, #T_0502a_row96_col2, #T_0502a_row96_col3, #T_0502a_row96_col4, #T_0502a_row96_col5, #T_0502a_row96_col6, #T_0502a_row96_col7, #T_0502a_row96_col8, #T_0502a_row97_col0, #T_0502a_row97_col1, #T_0502a_row97_col2, #T_0502a_row97_col3, #T_0502a_row97_col4, #T_0502a_row97_col5, #T_0502a_row97_col6, #T_0502a_row97_col7, #T_0502a_row97_col8, #T_0502a_row98_col0, #T_0502a_row98_col1, #T_0502a_row98_col2, #T_0502a_row98_col3, #T_0502a_row98_col4, #T_0502a_row98_col5, #T_0502a_row98_col6, #T_0502a_row98_col7, #T_0502a_row98_col8, #T_0502a_row99_col0, #T_0502a_row99_col1, #T_0502a_row99_col2, #T_0502a_row99_col3, #T_0502a_row99_col4, #T_0502a_row99_col5, #T_0502a_row99_col6, #T_0502a_row99_col7, #T_0502a_row99_col8, #T_0502a_row100_col0, #T_0502a_row100_col1, #T_0502a_row100_col2, #T_0502a_row100_col3, #T_0502a_row100_col4, #T_0502a_row100_col5, #T_0502a_row100_col6, #T_0502a_row100_col7, #T_0502a_row100_col8, #T_0502a_row101_col0, #T_0502a_row101_col1, #T_0502a_row101_col2, #T_0502a_row101_col3, #T_0502a_row101_col4, #T_0502a_row101_col5, #T_0502a_row101_col6, #T_0502a_row101_col7, #T_0502a_row101_col8, #T_0502a_row102_col0, #T_0502a_row102_col1, #T_0502a_row102_col2, #T_0502a_row102_col3, #T_0502a_row102_col4, #T_0502a_row102_col5, #T_0502a_row102_col6, #T_0502a_row102_col7, #T_0502a_row102_col8, #T_0502a_row103_col0, #T_0502a_row103_col1, #T_0502a_row103_col2, #T_0502a_row103_col3, #T_0502a_row103_col4, #T_0502a_row103_col5, #T_0502a_row103_col6, #T_0502a_row103_col7, #T_0502a_row103_col8, #T_0502a_row104_col0, #T_0502a_row104_col1, #T_0502a_row104_col2, #T_0502a_row104_col3, #T_0502a_row104_col4, #T_0502a_row104_col5, #T_0502a_row104_col6, #T_0502a_row104_col7, #T_0502a_row104_col8, #T_0502a_row105_col0, #T_0502a_row105_col1, #T_0502a_row105_col2, #T_0502a_row105_col3, #T_0502a_row105_col4, 
#T_0502a_row105_col5, #T_0502a_row105_col6, #T_0502a_row105_col7, #T_0502a_row105_col8, #T_0502a_row106_col0, #T_0502a_row106_col1, #T_0502a_row106_col2, #T_0502a_row106_col3, #T_0502a_row106_col4, #T_0502a_row106_col5, #T_0502a_row106_col6, #T_0502a_row106_col7, #T_0502a_row106_col8, #T_0502a_row107_col0, #T_0502a_row107_col1, #T_0502a_row107_col2, #T_0502a_row107_col3, #T_0502a_row107_col4, #T_0502a_row107_col5, #T_0502a_row107_col6, #T_0502a_row107_col7, #T_0502a_row107_col8, #T_0502a_row108_col0, #T_0502a_row108_col1, #T_0502a_row108_col2, #T_0502a_row108_col3, #T_0502a_row108_col4, #T_0502a_row108_col5, #T_0502a_row108_col6, #T_0502a_row108_col7, #T_0502a_row108_col8, #T_0502a_row109_col0, #T_0502a_row109_col1, #T_0502a_row109_col2, #T_0502a_row109_col3, #T_0502a_row109_col4, #T_0502a_row109_col5, #T_0502a_row109_col6, #T_0502a_row109_col7, #T_0502a_row109_col8, #T_0502a_row110_col0, #T_0502a_row110_col1, #T_0502a_row110_col2, #T_0502a_row110_col3, #T_0502a_row110_col4, #T_0502a_row110_col5, #T_0502a_row110_col6, #T_0502a_row110_col7, #T_0502a_row110_col8, #T_0502a_row111_col0, #T_0502a_row111_col1, #T_0502a_row111_col2, #T_0502a_row111_col3, #T_0502a_row111_col4, #T_0502a_row111_col5, #T_0502a_row111_col6, #T_0502a_row111_col7, #T_0502a_row111_col8, #T_0502a_row112_col0, #T_0502a_row112_col1, #T_0502a_row112_col2, #T_0502a_row112_col3, #T_0502a_row112_col4, #T_0502a_row112_col5, #T_0502a_row112_col6, #T_0502a_row112_col7, #T_0502a_row112_col8, #T_0502a_row113_col0, #T_0502a_row113_col1, #T_0502a_row113_col2, #T_0502a_row113_col3, #T_0502a_row113_col4, #T_0502a_row113_col5, #T_0502a_row113_col6, #T_0502a_row113_col7, #T_0502a_row113_col8, #T_0502a_row114_col0, #T_0502a_row114_col1, #T_0502a_row114_col2, #T_0502a_row114_col3, #T_0502a_row114_col4, #T_0502a_row114_col5, #T_0502a_row114_col6, #T_0502a_row114_col7, #T_0502a_row114_col8, #T_0502a_row115_col0, #T_0502a_row115_col1, #T_0502a_row115_col2, #T_0502a_row115_col3, #T_0502a_row115_col4, 
#T_0502a_row115_col5, #T_0502a_row115_col6, #T_0502a_row115_col7, #T_0502a_row115_col8, #T_0502a_row116_col0, #T_0502a_row116_col1, #T_0502a_row116_col2, #T_0502a_row116_col3, #T_0502a_row116_col4, #T_0502a_row116_col5, #T_0502a_row116_col6, #T_0502a_row116_col7, #T_0502a_row116_col8, #T_0502a_row117_col0, #T_0502a_row117_col1, #T_0502a_row117_col2, #T_0502a_row117_col3, #T_0502a_row117_col4, #T_0502a_row117_col5, #T_0502a_row117_col6, #T_0502a_row117_col7, #T_0502a_row117_col8, #T_0502a_row118_col0, #T_0502a_row118_col1, #T_0502a_row118_col2, #T_0502a_row118_col3, #T_0502a_row118_col4, #T_0502a_row118_col5, #T_0502a_row118_col6, #T_0502a_row118_col7, #T_0502a_row118_col8, #T_0502a_row119_col0, #T_0502a_row119_col1, #T_0502a_row119_col2, #T_0502a_row119_col3, #T_0502a_row119_col4, #T_0502a_row119_col5, #T_0502a_row119_col6, #T_0502a_row119_col7, #T_0502a_row119_col8, #T_0502a_row120_col0, #T_0502a_row120_col1, #T_0502a_row120_col2, #T_0502a_row120_col3, #T_0502a_row120_col4, #T_0502a_row120_col5, #T_0502a_row120_col6, #T_0502a_row120_col7, #T_0502a_row120_col8, #T_0502a_row121_col0, #T_0502a_row121_col1, #T_0502a_row121_col2, #T_0502a_row121_col3, #T_0502a_row121_col4, #T_0502a_row121_col5, #T_0502a_row121_col6, #T_0502a_row121_col7, #T_0502a_row121_col8, #T_0502a_row122_col0, #T_0502a_row122_col1, #T_0502a_row122_col2, #T_0502a_row122_col3, #T_0502a_row122_col4, #T_0502a_row122_col5, #T_0502a_row122_col6, #T_0502a_row122_col7, #T_0502a_row122_col8, #T_0502a_row123_col0, #T_0502a_row123_col1, #T_0502a_row123_col2, #T_0502a_row123_col3, #T_0502a_row123_col4, #T_0502a_row123_col5, #T_0502a_row123_col6, #T_0502a_row123_col7, #T_0502a_row123_col8, #T_0502a_row124_col0, #T_0502a_row124_col1, #T_0502a_row124_col2, #T_0502a_row124_col3, #T_0502a_row124_col4, #T_0502a_row124_col5, #T_0502a_row124_col6, #T_0502a_row124_col7, #T_0502a_row124_col8, #T_0502a_row125_col0, #T_0502a_row125_col1, #T_0502a_row125_col2, #T_0502a_row125_col3, #T_0502a_row125_col4, 
#T_0502a_row125_col5, #T_0502a_row125_col6, #T_0502a_row125_col7, #T_0502a_row125_col8, #T_0502a_row126_col0, #T_0502a_row126_col1, #T_0502a_row126_col2, #T_0502a_row126_col3, #T_0502a_row126_col4, #T_0502a_row126_col5, #T_0502a_row126_col6, #T_0502a_row126_col7, #T_0502a_row126_col8, #T_0502a_row127_col0, #T_0502a_row127_col1, #T_0502a_row127_col2, #T_0502a_row127_col3, #T_0502a_row127_col4, #T_0502a_row127_col5, #T_0502a_row127_col6, #T_0502a_row127_col7, #T_0502a_row127_col8, #T_0502a_row128_col0, #T_0502a_row128_col1, #T_0502a_row128_col2, #T_0502a_row128_col3, #T_0502a_row128_col4, #T_0502a_row128_col5, #T_0502a_row128_col6, #T_0502a_row128_col7, #T_0502a_row128_col8, #T_0502a_row129_col0, #T_0502a_row129_col1, #T_0502a_row129_col2, #T_0502a_row129_col3, #T_0502a_row129_col4, #T_0502a_row129_col5, #T_0502a_row129_col6, #T_0502a_row129_col7, #T_0502a_row129_col8, #T_0502a_row130_col0, #T_0502a_row130_col1, #T_0502a_row130_col2, #T_0502a_row130_col3, #T_0502a_row130_col4, #T_0502a_row130_col5, #T_0502a_row130_col6, #T_0502a_row130_col7, #T_0502a_row130_col8, #T_0502a_row131_col0, #T_0502a_row131_col1, #T_0502a_row131_col2, #T_0502a_row131_col3, #T_0502a_row131_col4, #T_0502a_row131_col5, #T_0502a_row131_col6, #T_0502a_row131_col7, #T_0502a_row131_col8, #T_0502a_row132_col0, #T_0502a_row132_col1, #T_0502a_row132_col2, #T_0502a_row132_col3, #T_0502a_row132_col4, #T_0502a_row132_col5, #T_0502a_row132_col6, #T_0502a_row132_col7, #T_0502a_row132_col8, #T_0502a_row133_col0, #T_0502a_row133_col1, #T_0502a_row133_col2, #T_0502a_row133_col3, #T_0502a_row133_col4, #T_0502a_row133_col5, #T_0502a_row133_col6, #T_0502a_row133_col7, #T_0502a_row133_col8, #T_0502a_row134_col0, #T_0502a_row134_col1, #T_0502a_row134_col2, #T_0502a_row134_col3, #T_0502a_row134_col4, #T_0502a_row134_col5, #T_0502a_row134_col6, #T_0502a_row134_col7, #T_0502a_row134_col8, #T_0502a_row135_col0, #T_0502a_row135_col1, #T_0502a_row135_col2, #T_0502a_row135_col3, #T_0502a_row135_col4, 
#T_0502a_row135_col5, #T_0502a_row135_col6, #T_0502a_row135_col7, #T_0502a_row135_col8, #T_0502a_row136_col0, #T_0502a_row136_col1, #T_0502a_row136_col2, #T_0502a_row136_col3, #T_0502a_row136_col4, #T_0502a_row136_col5, #T_0502a_row136_col6, #T_0502a_row136_col7, #T_0502a_row136_col8, #T_0502a_row137_col0, #T_0502a_row137_col1, #T_0502a_row137_col2, #T_0502a_row137_col3, #T_0502a_row137_col4, #T_0502a_row137_col5, #T_0502a_row137_col6, #T_0502a_row137_col7, #T_0502a_row137_col8, #T_0502a_row138_col0, #T_0502a_row138_col1, #T_0502a_row138_col2, #T_0502a_row138_col3, #T_0502a_row138_col4, #T_0502a_row138_col5, #T_0502a_row138_col6, #T_0502a_row138_col7, #T_0502a_row138_col8, #T_0502a_row139_col0, #T_0502a_row139_col1, #T_0502a_row139_col2, #T_0502a_row139_col3, #T_0502a_row139_col4, #T_0502a_row139_col5, #T_0502a_row139_col6, #T_0502a_row139_col7, #T_0502a_row139_col8, #T_0502a_row140_col0, #T_0502a_row140_col1, #T_0502a_row140_col2, #T_0502a_row140_col3, #T_0502a_row140_col4, #T_0502a_row140_col5, #T_0502a_row140_col6, #T_0502a_row140_col7, #T_0502a_row140_col8, #T_0502a_row141_col0, #T_0502a_row141_col1, #T_0502a_row141_col2, #T_0502a_row141_col3, #T_0502a_row141_col4, #T_0502a_row141_col5, #T_0502a_row141_col6, #T_0502a_row141_col7, #T_0502a_row141_col8, #T_0502a_row142_col0, #T_0502a_row142_col1, #T_0502a_row142_col2, #T_0502a_row142_col3, #T_0502a_row142_col4, #T_0502a_row142_col5, #T_0502a_row142_col6, #T_0502a_row142_col7, #T_0502a_row142_col8, #T_0502a_row143_col0, #T_0502a_row143_col1, #T_0502a_row143_col2, #T_0502a_row143_col3, #T_0502a_row143_col4, #T_0502a_row143_col5, #T_0502a_row143_col6, #T_0502a_row143_col7, #T_0502a_row143_col8, #T_0502a_row144_col0, #T_0502a_row144_col1, #T_0502a_row144_col2, #T_0502a_row144_col3, #T_0502a_row144_col4, #T_0502a_row144_col5, #T_0502a_row144_col6, #T_0502a_row144_col7, #T_0502a_row144_col8, #T_0502a_row145_col0, #T_0502a_row145_col1, #T_0502a_row145_col2, #T_0502a_row145_col3, #T_0502a_row145_col4, 
#T_0502a_row145_col5, #T_0502a_row145_col6, #T_0502a_row145_col7, #T_0502a_row145_col8, #T_0502a_row146_col0, #T_0502a_row146_col1, #T_0502a_row146_col2, #T_0502a_row146_col3, #T_0502a_row146_col4, #T_0502a_row146_col5, #T_0502a_row146_col6, #T_0502a_row146_col7, #T_0502a_row146_col8, #T_0502a_row147_col0, #T_0502a_row147_col1, #T_0502a_row147_col2, #T_0502a_row147_col3, #T_0502a_row147_col4, #T_0502a_row147_col5, #T_0502a_row147_col6, #T_0502a_row147_col7, #T_0502a_row147_col8, #T_0502a_row148_col0, #T_0502a_row148_col1, #T_0502a_row148_col2, #T_0502a_row148_col3, #T_0502a_row148_col4, #T_0502a_row148_col5, #T_0502a_row148_col6, #T_0502a_row148_col7, #T_0502a_row148_col8, #T_0502a_row149_col0, #T_0502a_row149_col1, #T_0502a_row149_col2, #T_0502a_row149_col3, #T_0502a_row149_col4, #T_0502a_row149_col5, #T_0502a_row149_col6, #T_0502a_row149_col7, #T_0502a_row149_col8, #T_0502a_row150_col0, #T_0502a_row150_col1, #T_0502a_row150_col2, #T_0502a_row150_col3, #T_0502a_row150_col4, #T_0502a_row150_col5, #T_0502a_row150_col6, #T_0502a_row150_col7, #T_0502a_row150_col8, #T_0502a_row151_col0, #T_0502a_row151_col1, #T_0502a_row151_col2, #T_0502a_row151_col3, #T_0502a_row151_col4, #T_0502a_row151_col5, #T_0502a_row151_col6, #T_0502a_row151_col7, #T_0502a_row151_col8, #T_0502a_row152_col0, #T_0502a_row152_col1, #T_0502a_row152_col2, #T_0502a_row152_col3, #T_0502a_row152_col4, #T_0502a_row152_col5, #T_0502a_row152_col6, #T_0502a_row152_col7, #T_0502a_row152_col8, #T_0502a_row153_col0, #T_0502a_row153_col1, #T_0502a_row153_col2, #T_0502a_row153_col3, #T_0502a_row153_col4, #T_0502a_row153_col5, #T_0502a_row153_col6, #T_0502a_row153_col7, #T_0502a_row153_col8, #T_0502a_row154_col0, #T_0502a_row154_col1, #T_0502a_row154_col2, #T_0502a_row154_col3, #T_0502a_row154_col4, #T_0502a_row154_col5, #T_0502a_row154_col6, #T_0502a_row154_col7, #T_0502a_row154_col8, #T_0502a_row155_col0, #T_0502a_row155_col1, #T_0502a_row155_col2, #T_0502a_row155_col3, #T_0502a_row155_col4, 
#T_0502a_row155_col5, #T_0502a_row155_col6, #T_0502a_row155_col7, #T_0502a_row155_col8, #T_0502a_row156_col0, #T_0502a_row156_col1, #T_0502a_row156_col2, #T_0502a_row156_col3, #T_0502a_row156_col4, #T_0502a_row156_col5, #T_0502a_row156_col6, #T_0502a_row156_col7, #T_0502a_row156_col8, #T_0502a_row157_col0, #T_0502a_row157_col1, #T_0502a_row157_col2, #T_0502a_row157_col3, #T_0502a_row157_col4, #T_0502a_row157_col5, #T_0502a_row157_col6, #T_0502a_row157_col7, #T_0502a_row157_col8, #T_0502a_row158_col0, #T_0502a_row158_col1, #T_0502a_row158_col2, #T_0502a_row158_col3, #T_0502a_row158_col4, #T_0502a_row158_col5, #T_0502a_row158_col6, #T_0502a_row158_col7, #T_0502a_row158_col8, #T_0502a_row159_col0, #T_0502a_row159_col1, #T_0502a_row159_col2, #T_0502a_row159_col3, #T_0502a_row159_col4, #T_0502a_row159_col5, #T_0502a_row159_col6, #T_0502a_row159_col7, #T_0502a_row159_col8, #T_0502a_row160_col0, #T_0502a_row160_col1, #T_0502a_row160_col2, #T_0502a_row160_col3, #T_0502a_row160_col4, #T_0502a_row160_col5, #T_0502a_row160_col6, #T_0502a_row160_col7, #T_0502a_row160_col8, #T_0502a_row161_col0, #T_0502a_row161_col1, #T_0502a_row161_col2, #T_0502a_row161_col3, #T_0502a_row161_col4, #T_0502a_row161_col5, #T_0502a_row161_col6, #T_0502a_row161_col7, #T_0502a_row161_col8, #T_0502a_row162_col0, #T_0502a_row162_col1, #T_0502a_row162_col2, #T_0502a_row162_col3, #T_0502a_row162_col4, #T_0502a_row162_col5, #T_0502a_row162_col6, #T_0502a_row162_col7, #T_0502a_row162_col8, #T_0502a_row163_col0, #T_0502a_row163_col1, #T_0502a_row163_col2, #T_0502a_row163_col3, #T_0502a_row163_col4, #T_0502a_row163_col5, #T_0502a_row163_col6, #T_0502a_row163_col7, #T_0502a_row163_col8, #T_0502a_row164_col0, #T_0502a_row164_col1, #T_0502a_row164_col2, #T_0502a_row164_col3, #T_0502a_row164_col4, #T_0502a_row164_col5, #T_0502a_row164_col6, #T_0502a_row164_col7, #T_0502a_row164_col8, #T_0502a_row165_col0, #T_0502a_row165_col1, #T_0502a_row165_col2, #T_0502a_row165_col3, #T_0502a_row165_col4, 
#T_0502a_row165_col5, #T_0502a_row165_col6, #T_0502a_row165_col7, #T_0502a_row165_col8, #T_0502a_row166_col0, #T_0502a_row166_col1, #T_0502a_row166_col2, #T_0502a_row166_col3, #T_0502a_row166_col4, #T_0502a_row166_col5, #T_0502a_row166_col6, #T_0502a_row166_col7, #T_0502a_row166_col8, #T_0502a_row167_col0, #T_0502a_row167_col1, #T_0502a_row167_col2, #T_0502a_row167_col3, #T_0502a_row167_col4, #T_0502a_row167_col5, #T_0502a_row167_col6, #T_0502a_row167_col7, #T_0502a_row167_col8, #T_0502a_row168_col0, #T_0502a_row168_col1, #T_0502a_row168_col2, #T_0502a_row168_col3, #T_0502a_row168_col4, #T_0502a_row168_col5, #T_0502a_row168_col6, #T_0502a_row168_col7, #T_0502a_row168_col8, #T_0502a_row169_col0, #T_0502a_row169_col1, #T_0502a_row169_col2, #T_0502a_row169_col3, #T_0502a_row169_col4, #T_0502a_row169_col5, #T_0502a_row169_col6, #T_0502a_row169_col7, #T_0502a_row169_col8, #T_0502a_row170_col0, #T_0502a_row170_col1, #T_0502a_row170_col2, #T_0502a_row170_col3, #T_0502a_row170_col4, #T_0502a_row170_col5, #T_0502a_row170_col6, #T_0502a_row170_col7, #T_0502a_row170_col8, #T_0502a_row171_col0, #T_0502a_row171_col1, #T_0502a_row171_col2, #T_0502a_row171_col3, #T_0502a_row171_col4, #T_0502a_row171_col5, #T_0502a_row171_col6, #T_0502a_row171_col7, #T_0502a_row171_col8, #T_0502a_row172_col0, #T_0502a_row172_col1, #T_0502a_row172_col2, #T_0502a_row172_col3, #T_0502a_row172_col4, #T_0502a_row172_col5, #T_0502a_row172_col6, #T_0502a_row172_col7, #T_0502a_row172_col8, #T_0502a_row173_col0, #T_0502a_row173_col1, #T_0502a_row173_col2, #T_0502a_row173_col3, #T_0502a_row173_col4, #T_0502a_row173_col5, #T_0502a_row173_col6, #T_0502a_row173_col7, #T_0502a_row173_col8, #T_0502a_row174_col0, #T_0502a_row174_col1, #T_0502a_row174_col2, #T_0502a_row174_col3, #T_0502a_row174_col4, #T_0502a_row174_col5, #T_0502a_row174_col6, #T_0502a_row174_col7, #T_0502a_row174_col8, #T_0502a_row175_col0, #T_0502a_row175_col1, #T_0502a_row175_col2, #T_0502a_row175_col3, #T_0502a_row175_col4, 
#T_0502a_row175_col5, #T_0502a_row175_col6, #T_0502a_row175_col7, #T_0502a_row175_col8, #T_0502a_row176_col0, #T_0502a_row176_col1, #T_0502a_row176_col2, #T_0502a_row176_col3, #T_0502a_row176_col4, #T_0502a_row176_col5, #T_0502a_row176_col6, #T_0502a_row176_col7, #T_0502a_row176_col8, #T_0502a_row177_col0, #T_0502a_row177_col1, #T_0502a_row177_col2, #T_0502a_row177_col3, #T_0502a_row177_col4, #T_0502a_row177_col5, #T_0502a_row177_col6, #T_0502a_row177_col7, #T_0502a_row177_col8, #T_0502a_row178_col0, #T_0502a_row178_col1, #T_0502a_row178_col2, #T_0502a_row178_col3, #T_0502a_row178_col4, #T_0502a_row178_col5, #T_0502a_row178_col6, #T_0502a_row178_col7, #T_0502a_row178_col8, #T_0502a_row179_col0, #T_0502a_row179_col1, #T_0502a_row179_col2, #T_0502a_row179_col3, #T_0502a_row179_col4, #T_0502a_row179_col5, #T_0502a_row179_col6, #T_0502a_row179_col7, #T_0502a_row179_col8, #T_0502a_row180_col0, #T_0502a_row180_col1, #T_0502a_row180_col2, #T_0502a_row180_col3, #T_0502a_row180_col4, #T_0502a_row180_col5, #T_0502a_row180_col6, #T_0502a_row180_col7, #T_0502a_row180_col8, #T_0502a_row181_col0, #T_0502a_row181_col1, #T_0502a_row181_col2, #T_0502a_row181_col3, #T_0502a_row181_col4, #T_0502a_row181_col5, #T_0502a_row181_col6, #T_0502a_row181_col7, #T_0502a_row181_col8, #T_0502a_row182_col0, #T_0502a_row182_col1, #T_0502a_row182_col2, #T_0502a_row182_col3, #T_0502a_row182_col4, #T_0502a_row182_col5, #T_0502a_row182_col6, #T_0502a_row182_col7, #T_0502a_row182_col8, #T_0502a_row183_col0, #T_0502a_row183_col1, #T_0502a_row183_col2, #T_0502a_row183_col3, #T_0502a_row183_col4, #T_0502a_row183_col5, #T_0502a_row183_col6, #T_0502a_row183_col7, #T_0502a_row183_col8, #T_0502a_row184_col0, #T_0502a_row184_col1, #T_0502a_row184_col2, #T_0502a_row184_col3, #T_0502a_row184_col4, #T_0502a_row184_col5, #T_0502a_row184_col6, #T_0502a_row184_col7, #T_0502a_row184_col8, #T_0502a_row185_col0, #T_0502a_row185_col1, #T_0502a_row185_col2, #T_0502a_row185_col3, #T_0502a_row185_col4, 
#T_0502a_row185_col5, #T_0502a_row185_col6, #T_0502a_row185_col7, #T_0502a_row185_col8, #T_0502a_row186_col0, #T_0502a_row186_col1, #T_0502a_row186_col2, #T_0502a_row186_col3, #T_0502a_row186_col4, #T_0502a_row186_col5, #T_0502a_row186_col6, #T_0502a_row186_col7, #T_0502a_row186_col8, #T_0502a_row187_col0, #T_0502a_row187_col1, #T_0502a_row187_col2, #T_0502a_row187_col3, #T_0502a_row187_col4, #T_0502a_row187_col5, #T_0502a_row187_col6, #T_0502a_row187_col7, #T_0502a_row187_col8, #T_0502a_row188_col0, #T_0502a_row188_col1, #T_0502a_row188_col2, #T_0502a_row188_col3, #T_0502a_row188_col4, #T_0502a_row188_col5, #T_0502a_row188_col6, #T_0502a_row188_col7, #T_0502a_row188_col8, #T_0502a_row189_col0, #T_0502a_row189_col1, #T_0502a_row189_col2, #T_0502a_row189_col3, #T_0502a_row189_col4, #T_0502a_row189_col5, #T_0502a_row189_col6, #T_0502a_row189_col7, #T_0502a_row189_col8, #T_0502a_row190_col0, #T_0502a_row190_col1, #T_0502a_row190_col2, #T_0502a_row190_col3, #T_0502a_row190_col4, #T_0502a_row190_col5, #T_0502a_row190_col6, #T_0502a_row190_col7, #T_0502a_row190_col8, #T_0502a_row191_col0, #T_0502a_row191_col1, #T_0502a_row191_col2, #T_0502a_row191_col3, #T_0502a_row191_col4, #T_0502a_row191_col5, #T_0502a_row191_col6, #T_0502a_row191_col7, #T_0502a_row191_col8, #T_0502a_row192_col0, #T_0502a_row192_col1, #T_0502a_row192_col2, #T_0502a_row192_col3, #T_0502a_row192_col4, #T_0502a_row192_col5, #T_0502a_row192_col6, #T_0502a_row192_col7, #T_0502a_row192_col8, #T_0502a_row193_col0, #T_0502a_row193_col1, #T_0502a_row193_col2, #T_0502a_row193_col3, #T_0502a_row193_col4, #T_0502a_row193_col5, #T_0502a_row193_col6, #T_0502a_row193_col7, #T_0502a_row193_col8, #T_0502a_row194_col0, #T_0502a_row194_col1, #T_0502a_row194_col2, #T_0502a_row194_col3, #T_0502a_row194_col4, #T_0502a_row194_col5, #T_0502a_row194_col6, #T_0502a_row194_col7, #T_0502a_row194_col8 {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "</style>\n",
+              "<table id=\"T_0502a\">\n",
+              "  <thead>\n",
+              "    <tr>\n",
+              "      <th id=\"T_0502a_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
+              "      <th id=\"T_0502a_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
+              "      <th id=\"T_0502a_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
+              "      <th id=\"T_0502a_level0_col3\" class=\"col_heading level0 col3\" >Has Figure</th>\n",
+              "      <th id=\"T_0502a_level0_col4\" class=\"col_heading level0 col4\" >Has Table</th>\n",
+              "      <th id=\"T_0502a_level0_col5\" class=\"col_heading level0 col5\" >Required Inputs</th>\n",
+              "      <th id=\"T_0502a_level0_col6\" class=\"col_heading level0 col6\" >Params</th>\n",
+              "      <th id=\"T_0502a_level0_col7\" class=\"col_heading level0 col7\" >Tags</th>\n",
+              "      <th id=\"T_0502a_level0_col8\" class=\"col_heading level0 col8\" >Tasks</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row0_col0\" class=\"data row0 col0\" >validmind.data_validation.ACFandPACFPlot</td>\n",
+              "      <td id=\"T_0502a_row0_col1\" class=\"data row0 col1\" >AC Fand PACF Plot</td>\n",
+              "      <td id=\"T_0502a_row0_col2\" class=\"data row0 col2\" >Analyzes time series data using Autocorrelation Function (ACF) and Partial Autocorrelation Function (PACF) plots to...</td>\n",
+              "      <td id=\"T_0502a_row0_col3\" class=\"data row0 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row0_col4\" class=\"data row0 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row0_col5\" class=\"data row0 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row0_col6\" class=\"data row0 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row0_col7\" class=\"data row0 col7\" >['time_series_data', 'forecasting', 'statistical_test', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row0_col8\" class=\"data row0 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row1_col0\" class=\"data row1 col0\" >validmind.data_validation.ADF</td>\n",
+              "      <td id=\"T_0502a_row1_col1\" class=\"data row1 col1\" >ADF</td>\n",
+              "      <td id=\"T_0502a_row1_col2\" class=\"data row1 col2\" >Assesses the stationarity of a time series dataset using the Augmented Dickey-Fuller (ADF) test....</td>\n",
+              "      <td id=\"T_0502a_row1_col3\" class=\"data row1 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row1_col4\" class=\"data row1 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row1_col5\" class=\"data row1 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row1_col6\" class=\"data row1 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row1_col7\" class=\"data row1 col7\" >['time_series_data', 'statsmodels', 'forecasting', 'statistical_test', 'stationarity']</td>\n",
+              "      <td id=\"T_0502a_row1_col8\" class=\"data row1 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row2_col0\" class=\"data row2 col0\" >validmind.data_validation.AutoAR</td>\n",
+              "      <td id=\"T_0502a_row2_col1\" class=\"data row2 col1\" >Auto AR</td>\n",
+              "      <td id=\"T_0502a_row2_col2\" class=\"data row2 col2\" >Automatically identifies the optimal Autoregressive (AR) order for a time series using BIC and AIC criteria....</td>\n",
+              "      <td id=\"T_0502a_row2_col3\" class=\"data row2 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row2_col4\" class=\"data row2 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row2_col5\" class=\"data row2 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row2_col6\" class=\"data row2 col6\" >{'max_ar_order': {'type': 'int', 'default': 3}}</td>\n",
+              "      <td id=\"T_0502a_row2_col7\" class=\"data row2 col7\" >['time_series_data', 'statsmodels', 'forecasting', 'statistical_test']</td>\n",
+              "      <td id=\"T_0502a_row2_col8\" class=\"data row2 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row3_col0\" class=\"data row3 col0\" >validmind.data_validation.AutoMA</td>\n",
+              "      <td id=\"T_0502a_row3_col1\" class=\"data row3 col1\" >Auto MA</td>\n",
+              "      <td id=\"T_0502a_row3_col2\" class=\"data row3 col2\" >Automatically selects the optimal Moving Average (MA) order for each variable in a time series dataset based on...</td>\n",
+              "      <td id=\"T_0502a_row3_col3\" class=\"data row3 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row3_col4\" class=\"data row3 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row3_col5\" class=\"data row3 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row3_col6\" class=\"data row3 col6\" >{'max_ma_order': {'type': 'int', 'default': 3}}</td>\n",
+              "      <td id=\"T_0502a_row3_col7\" class=\"data row3 col7\" >['time_series_data', 'statsmodels', 'forecasting', 'statistical_test']</td>\n",
+              "      <td id=\"T_0502a_row3_col8\" class=\"data row3 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row4_col0\" class=\"data row4 col0\" >validmind.data_validation.AutoStationarity</td>\n",
+              "      <td id=\"T_0502a_row4_col1\" class=\"data row4 col1\" >Auto Stationarity</td>\n",
+              "      <td id=\"T_0502a_row4_col2\" class=\"data row4 col2\" >Automates Augmented Dickey-Fuller test to assess stationarity across multiple time series in a DataFrame....</td>\n",
+              "      <td id=\"T_0502a_row4_col3\" class=\"data row4 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row4_col4\" class=\"data row4 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row4_col5\" class=\"data row4 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row4_col6\" class=\"data row4 col6\" >{'max_order': {'type': 'int', 'default': 5}, 'threshold': {'type': 'float', 'default': 0.05}}</td>\n",
+              "      <td id=\"T_0502a_row4_col7\" class=\"data row4 col7\" >['time_series_data', 'statsmodels', 'forecasting', 'statistical_test']</td>\n",
+              "      <td id=\"T_0502a_row4_col8\" class=\"data row4 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row5_col0\" class=\"data row5 col0\" >validmind.data_validation.BivariateScatterPlots</td>\n",
+              "      <td id=\"T_0502a_row5_col1\" class=\"data row5 col1\" >Bivariate Scatter Plots</td>\n",
+              "      <td id=\"T_0502a_row5_col2\" class=\"data row5 col2\" >Generates bivariate scatterplots to visually inspect relationships between pairs of numerical predictor variables...</td>\n",
+              "      <td id=\"T_0502a_row5_col3\" class=\"data row5 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row5_col4\" class=\"data row5 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row5_col5\" class=\"data row5 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row5_col6\" class=\"data row5 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row5_col7\" class=\"data row5 col7\" >['tabular_data', 'numerical_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row5_col8\" class=\"data row5 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row6_col0\" class=\"data row6 col0\" >validmind.data_validation.BoxPierce</td>\n",
+              "      <td id=\"T_0502a_row6_col1\" class=\"data row6 col1\" >Box Pierce</td>\n",
+              "      <td id=\"T_0502a_row6_col2\" class=\"data row6 col2\" >Detects autocorrelation in time-series data through the Box-Pierce test to validate model performance....</td>\n",
+              "      <td id=\"T_0502a_row6_col3\" class=\"data row6 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row6_col4\" class=\"data row6 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row6_col5\" class=\"data row6 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row6_col6\" class=\"data row6 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row6_col7\" class=\"data row6 col7\" >['time_series_data', 'forecasting', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_0502a_row6_col8\" class=\"data row6 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row7_col0\" class=\"data row7 col0\" >validmind.data_validation.ChiSquaredFeaturesTable</td>\n",
+              "      <td id=\"T_0502a_row7_col1\" class=\"data row7 col1\" >Chi Squared Features Table</td>\n",
+              "      <td id=\"T_0502a_row7_col2\" class=\"data row7 col2\" >Assesses the statistical association between categorical features and a target variable using the Chi-Squared test....</td>\n",
+              "      <td id=\"T_0502a_row7_col3\" class=\"data row7 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row7_col4\" class=\"data row7 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row7_col5\" class=\"data row7 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row7_col6\" class=\"data row7 col6\" >{'p_threshold': {'type': '_empty', 'default': 0.05}}</td>\n",
+              "      <td id=\"T_0502a_row7_col7\" class=\"data row7 col7\" >['tabular_data', 'categorical_data', 'statistical_test']</td>\n",
+              "      <td id=\"T_0502a_row7_col8\" class=\"data row7 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row8_col0\" class=\"data row8 col0\" >validmind.data_validation.ClassImbalance</td>\n",
+              "      <td id=\"T_0502a_row8_col1\" class=\"data row8 col1\" >Class Imbalance</td>\n",
+              "      <td id=\"T_0502a_row8_col2\" class=\"data row8 col2\" >Evaluates and quantifies class distribution imbalance in a dataset used by a machine learning model....</td>\n",
+              "      <td id=\"T_0502a_row8_col3\" class=\"data row8 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row8_col4\" class=\"data row8 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row8_col5\" class=\"data row8 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row8_col6\" class=\"data row8 col6\" >{'min_percent_threshold': {'type': 'int', 'default': 10}}</td>\n",
+              "      <td id=\"T_0502a_row8_col7\" class=\"data row8 col7\" >['tabular_data', 'binary_classification', 'multiclass_classification', 'data_quality']</td>\n",
+              "      <td id=\"T_0502a_row8_col8\" class=\"data row8 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row9_col0\" class=\"data row9 col0\" >validmind.data_validation.DatasetDescription</td>\n",
+              "      <td id=\"T_0502a_row9_col1\" class=\"data row9 col1\" >Dataset Description</td>\n",
+              "      <td id=\"T_0502a_row9_col2\" class=\"data row9 col2\" >Provides comprehensive analysis and statistical summaries of each column in a machine learning model's dataset....</td>\n",
+              "      <td id=\"T_0502a_row9_col3\" class=\"data row9 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row9_col4\" class=\"data row9 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row9_col5\" class=\"data row9 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row9_col6\" class=\"data row9 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row9_col7\" class=\"data row9 col7\" >['tabular_data', 'time_series_data', 'text_data']</td>\n",
+              "      <td id=\"T_0502a_row9_col8\" class=\"data row9 col8\" >['classification', 'regression', 'text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row10_col0\" class=\"data row10 col0\" >validmind.data_validation.DatasetSplit</td>\n",
+              "      <td id=\"T_0502a_row10_col1\" class=\"data row10 col1\" >Dataset Split</td>\n",
+              "      <td id=\"T_0502a_row10_col2\" class=\"data row10 col2\" >Evaluates and visualizes the distribution proportions among training, testing, and validation datasets of an ML...</td>\n",
+              "      <td id=\"T_0502a_row10_col3\" class=\"data row10 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row10_col4\" class=\"data row10 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row10_col5\" class=\"data row10 col5\" >['datasets']</td>\n",
+              "      <td id=\"T_0502a_row10_col6\" class=\"data row10 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row10_col7\" class=\"data row10 col7\" >['tabular_data', 'time_series_data', 'text_data']</td>\n",
+              "      <td id=\"T_0502a_row10_col8\" class=\"data row10 col8\" >['classification', 'regression', 'text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row11_col0\" class=\"data row11 col0\" >validmind.data_validation.DescriptiveStatistics</td>\n",
+              "      <td id=\"T_0502a_row11_col1\" class=\"data row11 col1\" >Descriptive Statistics</td>\n",
+              "      <td id=\"T_0502a_row11_col2\" class=\"data row11 col2\" >Performs a detailed descriptive statistical analysis of both numerical and categorical data within a model's...</td>\n",
+              "      <td id=\"T_0502a_row11_col3\" class=\"data row11 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row11_col4\" class=\"data row11 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row11_col5\" class=\"data row11 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row11_col6\" class=\"data row11 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row11_col7\" class=\"data row11 col7\" >['tabular_data', 'time_series_data', 'data_quality']</td>\n",
+              "      <td id=\"T_0502a_row11_col8\" class=\"data row11 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row12_col0\" class=\"data row12 col0\" >validmind.data_validation.DickeyFullerGLS</td>\n",
+              "      <td id=\"T_0502a_row12_col1\" class=\"data row12 col1\" >Dickey Fuller GLS</td>\n",
+              "      <td id=\"T_0502a_row12_col2\" class=\"data row12 col2\" >Assesses stationarity in time series data using the Dickey-Fuller GLS test to determine the order of integration....</td>\n",
+              "      <td id=\"T_0502a_row12_col3\" class=\"data row12 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row12_col4\" class=\"data row12 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row12_col5\" class=\"data row12 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row12_col6\" class=\"data row12 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row12_col7\" class=\"data row12 col7\" >['time_series_data', 'forecasting', 'unit_root_test']</td>\n",
+              "      <td id=\"T_0502a_row12_col8\" class=\"data row12 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row13_col0\" class=\"data row13 col0\" >validmind.data_validation.Duplicates</td>\n",
+              "      <td id=\"T_0502a_row13_col1\" class=\"data row13 col1\" >Duplicates</td>\n",
+              "      <td id=\"T_0502a_row13_col2\" class=\"data row13 col2\" >Tests dataset for duplicate entries, ensuring model reliability via data quality verification....</td>\n",
+              "      <td id=\"T_0502a_row13_col3\" class=\"data row13 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row13_col4\" class=\"data row13 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row13_col5\" class=\"data row13 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row13_col6\" class=\"data row13 col6\" >{'min_threshold': {'type': '_empty', 'default': 1}}</td>\n",
+              "      <td id=\"T_0502a_row13_col7\" class=\"data row13 col7\" >['tabular_data', 'data_quality', 'text_data']</td>\n",
+              "      <td id=\"T_0502a_row13_col8\" class=\"data row13 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row14_col0\" class=\"data row14 col0\" >validmind.data_validation.EngleGrangerCoint</td>\n",
+              "      <td id=\"T_0502a_row14_col1\" class=\"data row14 col1\" >Engle Granger Coint</td>\n",
+              "      <td id=\"T_0502a_row14_col2\" class=\"data row14 col2\" >Assesses the degree of co-movement between pairs of time series data using the Engle-Granger cointegration test....</td>\n",
+              "      <td id=\"T_0502a_row14_col3\" class=\"data row14 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row14_col4\" class=\"data row14 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row14_col5\" class=\"data row14 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row14_col6\" class=\"data row14 col6\" >{'threshold': {'type': 'float', 'default': 0.05}}</td>\n",
+              "      <td id=\"T_0502a_row14_col7\" class=\"data row14 col7\" >['time_series_data', 'statistical_test', 'forecasting']</td>\n",
+              "      <td id=\"T_0502a_row14_col8\" class=\"data row14 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row15_col0\" class=\"data row15 col0\" >validmind.data_validation.FeatureTargetCorrelationPlot</td>\n",
+              "      <td id=\"T_0502a_row15_col1\" class=\"data row15 col1\" >Feature Target Correlation Plot</td>\n",
+              "      <td id=\"T_0502a_row15_col2\" class=\"data row15 col2\" >Visualizes the correlation between input features and the model's target output in a color-coded horizontal bar...</td>\n",
+              "      <td id=\"T_0502a_row15_col3\" class=\"data row15 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row15_col4\" class=\"data row15 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row15_col5\" class=\"data row15 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row15_col6\" class=\"data row15 col6\" >{'fig_height': {'type': '_empty', 'default': 600}}</td>\n",
+              "      <td id=\"T_0502a_row15_col7\" class=\"data row15 col7\" >['tabular_data', 'visualization', 'correlation']</td>\n",
+              "      <td id=\"T_0502a_row15_col8\" class=\"data row15 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row16_col0\" class=\"data row16 col0\" >validmind.data_validation.HighCardinality</td>\n",
+              "      <td id=\"T_0502a_row16_col1\" class=\"data row16 col1\" >High Cardinality</td>\n",
+              "      <td id=\"T_0502a_row16_col2\" class=\"data row16 col2\" >Assesses the number of unique values in categorical columns to detect high cardinality and potential overfitting....</td>\n",
+              "      <td id=\"T_0502a_row16_col3\" class=\"data row16 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row16_col4\" class=\"data row16 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row16_col5\" class=\"data row16 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row16_col6\" class=\"data row16 col6\" >{'num_threshold': {'type': 'int', 'default': 100}, 'percent_threshold': {'type': 'float', 'default': 0.1}, 'threshold_type': {'type': 'str', 'default': 'percent'}}</td>\n",
+              "      <td id=\"T_0502a_row16_col7\" class=\"data row16 col7\" >['tabular_data', 'data_quality', 'categorical_data']</td>\n",
+              "      <td id=\"T_0502a_row16_col8\" class=\"data row16 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row17_col0\" class=\"data row17 col0\" >validmind.data_validation.HighPearsonCorrelation</td>\n",
+              "      <td id=\"T_0502a_row17_col1\" class=\"data row17 col1\" >High Pearson Correlation</td>\n",
+              "      <td id=\"T_0502a_row17_col2\" class=\"data row17 col2\" >Identifies highly correlated feature pairs in a dataset suggesting feature redundancy or multicollinearity....</td>\n",
+              "      <td id=\"T_0502a_row17_col3\" class=\"data row17 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row17_col4\" class=\"data row17 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row17_col5\" class=\"data row17 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row17_col6\" class=\"data row17 col6\" >{'max_threshold': {'type': 'float', 'default': 0.3}, 'top_n_correlations': {'type': 'int', 'default': 10}, 'feature_columns': {'type': 'list', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row17_col7\" class=\"data row17 col7\" >['tabular_data', 'data_quality', 'correlation']</td>\n",
+              "      <td id=\"T_0502a_row17_col8\" class=\"data row17 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row18_col0\" class=\"data row18 col0\" >validmind.data_validation.IQROutliersBarPlot</td>\n",
+              "      <td id=\"T_0502a_row18_col1\" class=\"data row18 col1\" >IQR Outliers Bar Plot</td>\n",
+              "      <td id=\"T_0502a_row18_col2\" class=\"data row18 col2\" >Visualizes outlier distribution across percentiles in numerical data using the Interquartile Range (IQR) method....</td>\n",
+              "      <td id=\"T_0502a_row18_col3\" class=\"data row18 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row18_col4\" class=\"data row18 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row18_col5\" class=\"data row18 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row18_col6\" class=\"data row18 col6\" >{'threshold': {'type': 'float', 'default': 1.5}, 'fig_width': {'type': 'int', 'default': 800}}</td>\n",
+              "      <td id=\"T_0502a_row18_col7\" class=\"data row18 col7\" >['tabular_data', 'visualization', 'numerical_data']</td>\n",
+              "      <td id=\"T_0502a_row18_col8\" class=\"data row18 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row19_col0\" class=\"data row19 col0\" >validmind.data_validation.IQROutliersTable</td>\n",
+              "      <td id=\"T_0502a_row19_col1\" class=\"data row19 col1\" >IQR Outliers Table</td>\n",
+              "      <td id=\"T_0502a_row19_col2\" class=\"data row19 col2\" >Determines and summarizes outliers in numerical features using the Interquartile Range method....</td>\n",
+              "      <td id=\"T_0502a_row19_col3\" class=\"data row19 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row19_col4\" class=\"data row19 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row19_col5\" class=\"data row19 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row19_col6\" class=\"data row19 col6\" >{'threshold': {'type': 'float', 'default': 1.5}}</td>\n",
+              "      <td id=\"T_0502a_row19_col7\" class=\"data row19 col7\" >['tabular_data', 'numerical_data']</td>\n",
+              "      <td id=\"T_0502a_row19_col8\" class=\"data row19 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row20_col0\" class=\"data row20 col0\" >validmind.data_validation.IsolationForestOutliers</td>\n",
+              "      <td id=\"T_0502a_row20_col1\" class=\"data row20 col1\" >Isolation Forest Outliers</td>\n",
+              "      <td id=\"T_0502a_row20_col2\" class=\"data row20 col2\" >Detects outliers in a dataset using the Isolation Forest algorithm and visualizes results through scatter plots....</td>\n",
+              "      <td id=\"T_0502a_row20_col3\" class=\"data row20 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row20_col4\" class=\"data row20 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row20_col5\" class=\"data row20 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row20_col6\" class=\"data row20 col6\" >{'random_state': {'type': 'int', 'default': 0}, 'contamination': {'type': 'float', 'default': 0.1}, 'feature_columns': {'type': 'list', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row20_col7\" class=\"data row20 col7\" >['tabular_data', 'anomaly_detection']</td>\n",
+              "      <td id=\"T_0502a_row20_col8\" class=\"data row20 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row21_col0\" class=\"data row21 col0\" >validmind.data_validation.JarqueBera</td>\n",
+              "      <td id=\"T_0502a_row21_col1\" class=\"data row21 col1\" >Jarque Bera</td>\n",
+              "      <td id=\"T_0502a_row21_col2\" class=\"data row21 col2\" >Assesses normality of dataset features in an ML model using the Jarque-Bera test....</td>\n",
+              "      <td id=\"T_0502a_row21_col3\" class=\"data row21 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row21_col4\" class=\"data row21 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row21_col5\" class=\"data row21 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row21_col6\" class=\"data row21 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row21_col7\" class=\"data row21 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_0502a_row21_col8\" class=\"data row21 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row22_col0\" class=\"data row22 col0\" >validmind.data_validation.KPSS</td>\n",
+              "      <td id=\"T_0502a_row22_col1\" class=\"data row22 col1\" >KPSS</td>\n",
+              "      <td id=\"T_0502a_row22_col2\" class=\"data row22 col2\" >Assesses the stationarity of time-series data in a machine learning model using the KPSS unit root test....</td>\n",
+              "      <td id=\"T_0502a_row22_col3\" class=\"data row22 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row22_col4\" class=\"data row22 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row22_col5\" class=\"data row22 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row22_col6\" class=\"data row22 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row22_col7\" class=\"data row22 col7\" >['time_series_data', 'stationarity', 'unit_root_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_0502a_row22_col8\" class=\"data row22 col8\" >['data_validation']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row23_col0\" class=\"data row23 col0\" >validmind.data_validation.LJungBox</td>\n",
+              "      <td id=\"T_0502a_row23_col1\" class=\"data row23 col1\" >L Jung Box</td>\n",
+              "      <td id=\"T_0502a_row23_col2\" class=\"data row23 col2\" >Assesses autocorrelations in dataset features by performing a Ljung-Box test on each feature....</td>\n",
+              "      <td id=\"T_0502a_row23_col3\" class=\"data row23 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row23_col4\" class=\"data row23 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row23_col5\" class=\"data row23 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row23_col6\" class=\"data row23 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row23_col7\" class=\"data row23 col7\" >['time_series_data', 'forecasting', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_0502a_row23_col8\" class=\"data row23 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row24_col0\" class=\"data row24 col0\" >validmind.data_validation.LaggedCorrelationHeatmap</td>\n",
+              "      <td id=\"T_0502a_row24_col1\" class=\"data row24 col1\" >Lagged Correlation Heatmap</td>\n",
+              "      <td id=\"T_0502a_row24_col2\" class=\"data row24 col2\" >Assesses and visualizes correlation between target variable and lagged independent variables in a time-series...</td>\n",
+              "      <td id=\"T_0502a_row24_col3\" class=\"data row24 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row24_col4\" class=\"data row24 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row24_col5\" class=\"data row24 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row24_col6\" class=\"data row24 col6\" >{'num_lags': {'type': 'int', 'default': 10}}</td>\n",
+              "      <td id=\"T_0502a_row24_col7\" class=\"data row24 col7\" >['time_series_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row24_col8\" class=\"data row24 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row25_col0\" class=\"data row25 col0\" >validmind.data_validation.MissingValues</td>\n",
+              "      <td id=\"T_0502a_row25_col1\" class=\"data row25 col1\" >Missing Values</td>\n",
+              "      <td id=\"T_0502a_row25_col2\" class=\"data row25 col2\" >Evaluates dataset quality by ensuring missing value ratio across all features does not exceed a set threshold....</td>\n",
+              "      <td id=\"T_0502a_row25_col3\" class=\"data row25 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row25_col4\" class=\"data row25 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row25_col5\" class=\"data row25 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row25_col6\" class=\"data row25 col6\" >{'min_threshold': {'type': 'int', 'default': 1}}</td>\n",
+              "      <td id=\"T_0502a_row25_col7\" class=\"data row25 col7\" >['tabular_data', 'data_quality']</td>\n",
+              "      <td id=\"T_0502a_row25_col8\" class=\"data row25 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row26_col0\" class=\"data row26 col0\" >validmind.data_validation.MissingValuesBarPlot</td>\n",
+              "      <td id=\"T_0502a_row26_col1\" class=\"data row26 col1\" >Missing Values Bar Plot</td>\n",
+              "      <td id=\"T_0502a_row26_col2\" class=\"data row26 col2\" >Assesses the percentage and distribution of missing values in the dataset via a bar plot, with emphasis on...</td>\n",
+              "      <td id=\"T_0502a_row26_col3\" class=\"data row26 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row26_col4\" class=\"data row26 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row26_col5\" class=\"data row26 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row26_col6\" class=\"data row26 col6\" >{'threshold': {'type': 'int', 'default': 80}, 'fig_height': {'type': 'int', 'default': 600}}</td>\n",
+              "      <td id=\"T_0502a_row26_col7\" class=\"data row26 col7\" >['tabular_data', 'data_quality', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row26_col8\" class=\"data row26 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row27_col0\" class=\"data row27 col0\" >validmind.data_validation.MutualInformation</td>\n",
+              "      <td id=\"T_0502a_row27_col1\" class=\"data row27 col1\" >Mutual Information</td>\n",
+              "      <td id=\"T_0502a_row27_col2\" class=\"data row27 col2\" >Calculates mutual information scores between features and target variable to evaluate feature relevance....</td>\n",
+              "      <td id=\"T_0502a_row27_col3\" class=\"data row27 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row27_col4\" class=\"data row27 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row27_col5\" class=\"data row27 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row27_col6\" class=\"data row27 col6\" >{'min_threshold': {'type': 'float', 'default': 0.01}, 'task': {'type': 'str', 'default': 'classification'}}</td>\n",
+              "      <td id=\"T_0502a_row27_col7\" class=\"data row27 col7\" >['feature_selection', 'data_analysis']</td>\n",
+              "      <td id=\"T_0502a_row27_col8\" class=\"data row27 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row28_col0\" class=\"data row28 col0\" >validmind.data_validation.PearsonCorrelationMatrix</td>\n",
+              "      <td id=\"T_0502a_row28_col1\" class=\"data row28 col1\" >Pearson Correlation Matrix</td>\n",
+              "      <td id=\"T_0502a_row28_col2\" class=\"data row28 col2\" >Evaluates linear dependency between numerical variables in a dataset via a Pearson Correlation coefficient heat map....</td>\n",
+              "      <td id=\"T_0502a_row28_col3\" class=\"data row28 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row28_col4\" class=\"data row28 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row28_col5\" class=\"data row28 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row28_col6\" class=\"data row28 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row28_col7\" class=\"data row28 col7\" >['tabular_data', 'numerical_data', 'correlation']</td>\n",
+              "      <td id=\"T_0502a_row28_col8\" class=\"data row28 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row29_col0\" class=\"data row29 col0\" >validmind.data_validation.PhillipsPerronArch</td>\n",
+              "      <td id=\"T_0502a_row29_col1\" class=\"data row29 col1\" >Phillips Perron Arch</td>\n",
+              "      <td id=\"T_0502a_row29_col2\" class=\"data row29 col2\" >Assesses the stationarity of time series data in each feature of the ML model using the Phillips-Perron test....</td>\n",
+              "      <td id=\"T_0502a_row29_col3\" class=\"data row29 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row29_col4\" class=\"data row29 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row29_col5\" class=\"data row29 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row29_col6\" class=\"data row29 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row29_col7\" class=\"data row29 col7\" >['time_series_data', 'forecasting', 'statistical_test', 'unit_root_test']</td>\n",
+              "      <td id=\"T_0502a_row29_col8\" class=\"data row29 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row30_col0\" class=\"data row30 col0\" >validmind.data_validation.ProtectedClassesDescription</td>\n",
+              "      <td id=\"T_0502a_row30_col1\" class=\"data row30 col1\" >Protected Classes Description</td>\n",
+              "      <td id=\"T_0502a_row30_col2\" class=\"data row30 col2\" >Visualizes the distribution of protected classes in the dataset relative to the target variable...</td>\n",
+              "      <td id=\"T_0502a_row30_col3\" class=\"data row30 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row30_col4\" class=\"data row30 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row30_col5\" class=\"data row30 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row30_col6\" class=\"data row30 col6\" >{'protected_classes': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row30_col7\" class=\"data row30 col7\" >['bias_and_fairness', 'descriptive_statistics']</td>\n",
+              "      <td id=\"T_0502a_row30_col8\" class=\"data row30 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row31_col0\" class=\"data row31 col0\" >validmind.data_validation.RollingStatsPlot</td>\n",
+              "      <td id=\"T_0502a_row31_col1\" class=\"data row31 col1\" >Rolling Stats Plot</td>\n",
+              "      <td id=\"T_0502a_row31_col2\" class=\"data row31 col2\" >Evaluates the stationarity of time series data by plotting its rolling mean and standard deviation over a specified...</td>\n",
+              "      <td id=\"T_0502a_row31_col3\" class=\"data row31 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row31_col4\" class=\"data row31 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row31_col5\" class=\"data row31 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row31_col6\" class=\"data row31 col6\" >{'window_size': {'type': 'int', 'default': 12}}</td>\n",
+              "      <td id=\"T_0502a_row31_col7\" class=\"data row31 col7\" >['time_series_data', 'visualization', 'stationarity']</td>\n",
+              "      <td id=\"T_0502a_row31_col8\" class=\"data row31 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row32_col0\" class=\"data row32 col0\" >validmind.data_validation.RunsTest</td>\n",
+              "      <td id=\"T_0502a_row32_col1\" class=\"data row32 col1\" >Runs Test</td>\n",
+              "      <td id=\"T_0502a_row32_col2\" class=\"data row32 col2\" >Executes Runs Test on ML model to detect non-random patterns in output data sequence....</td>\n",
+              "      <td id=\"T_0502a_row32_col3\" class=\"data row32 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row32_col4\" class=\"data row32 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row32_col5\" class=\"data row32 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row32_col6\" class=\"data row32 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row32_col7\" class=\"data row32 col7\" >['tabular_data', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_0502a_row32_col8\" class=\"data row32 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row33_col0\" class=\"data row33 col0\" >validmind.data_validation.ScatterPlot</td>\n",
+              "      <td id=\"T_0502a_row33_col1\" class=\"data row33 col1\" >Scatter Plot</td>\n",
+              "      <td id=\"T_0502a_row33_col2\" class=\"data row33 col2\" >Assesses visual relationships, patterns, and outliers among features in a dataset through scatter plot matrices....</td>\n",
+              "      <td id=\"T_0502a_row33_col3\" class=\"data row33 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row33_col4\" class=\"data row33 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row33_col5\" class=\"data row33 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row33_col6\" class=\"data row33 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row33_col7\" class=\"data row33 col7\" >['tabular_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row33_col8\" class=\"data row33 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row34_col0\" class=\"data row34 col0\" >validmind.data_validation.ScoreBandDefaultRates</td>\n",
+              "      <td id=\"T_0502a_row34_col1\" class=\"data row34 col1\" >Score Band Default Rates</td>\n",
+              "      <td id=\"T_0502a_row34_col2\" class=\"data row34 col2\" >Analyzes default rates and population distribution across credit score bands....</td>\n",
+              "      <td id=\"T_0502a_row34_col3\" class=\"data row34 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row34_col4\" class=\"data row34 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row34_col5\" class=\"data row34 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row34_col6\" class=\"data row34 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'score_bands': {'type': 'list', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row34_col7\" class=\"data row34 col7\" >['visualization', 'credit_risk', 'scorecard']</td>\n",
+              "      <td id=\"T_0502a_row34_col8\" class=\"data row34 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row35_col0\" class=\"data row35 col0\" >validmind.data_validation.SeasonalDecompose</td>\n",
+              "      <td id=\"T_0502a_row35_col1\" class=\"data row35 col1\" >Seasonal Decompose</td>\n",
+              "      <td id=\"T_0502a_row35_col2\" class=\"data row35 col2\" >Assesses patterns and seasonality in a time series dataset by decomposing its features into foundational components....</td>\n",
+              "      <td id=\"T_0502a_row35_col3\" class=\"data row35 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row35_col4\" class=\"data row35 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row35_col5\" class=\"data row35 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row35_col6\" class=\"data row35 col6\" >{'seasonal_model': {'type': 'str', 'default': 'additive'}}</td>\n",
+              "      <td id=\"T_0502a_row35_col7\" class=\"data row35 col7\" >['time_series_data', 'seasonality', 'statsmodels']</td>\n",
+              "      <td id=\"T_0502a_row35_col8\" class=\"data row35 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row36_col0\" class=\"data row36 col0\" >validmind.data_validation.ShapiroWilk</td>\n",
+              "      <td id=\"T_0502a_row36_col1\" class=\"data row36 col1\" >Shapiro Wilk</td>\n",
+              "      <td id=\"T_0502a_row36_col2\" class=\"data row36 col2\" >Evaluates feature-wise normality of training data using the Shapiro-Wilk test....</td>\n",
+              "      <td id=\"T_0502a_row36_col3\" class=\"data row36 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row36_col4\" class=\"data row36 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row36_col5\" class=\"data row36 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row36_col6\" class=\"data row36 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row36_col7\" class=\"data row36 col7\" >['tabular_data', 'data_distribution', 'statistical_test']</td>\n",
+              "      <td id=\"T_0502a_row36_col8\" class=\"data row36 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row37_col0\" class=\"data row37 col0\" >validmind.data_validation.Skewness</td>\n",
+              "      <td id=\"T_0502a_row37_col1\" class=\"data row37 col1\" >Skewness</td>\n",
+              "      <td id=\"T_0502a_row37_col2\" class=\"data row37 col2\" >Evaluates the skewness of numerical data in a dataset to check against a defined threshold, aiming to ensure data...</td>\n",
+              "      <td id=\"T_0502a_row37_col3\" class=\"data row37 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row37_col4\" class=\"data row37 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row37_col5\" class=\"data row37 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row37_col6\" class=\"data row37 col6\" >{'max_threshold': {'type': '_empty', 'default': 1}}</td>\n",
+              "      <td id=\"T_0502a_row37_col7\" class=\"data row37 col7\" >['data_quality', 'tabular_data']</td>\n",
+              "      <td id=\"T_0502a_row37_col8\" class=\"data row37 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row38_col0\" class=\"data row38 col0\" >validmind.data_validation.SpreadPlot</td>\n",
+              "      <td id=\"T_0502a_row38_col1\" class=\"data row38 col1\" >Spread Plot</td>\n",
+              "      <td id=\"T_0502a_row38_col2\" class=\"data row38 col2\" >Assesses potential correlations between pairs of time series variables through visualization to enhance...</td>\n",
+              "      <td id=\"T_0502a_row38_col3\" class=\"data row38 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row38_col4\" class=\"data row38 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row38_col5\" class=\"data row38 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row38_col6\" class=\"data row38 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row38_col7\" class=\"data row38 col7\" >['time_series_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row38_col8\" class=\"data row38 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row39_col0\" class=\"data row39 col0\" >validmind.data_validation.TabularCategoricalBarPlots</td>\n",
+              "      <td id=\"T_0502a_row39_col1\" class=\"data row39 col1\" >Tabular Categorical Bar Plots</td>\n",
+              "      <td id=\"T_0502a_row39_col2\" class=\"data row39 col2\" >Generates and visualizes bar plots for each category in categorical features to evaluate the dataset's composition....</td>\n",
+              "      <td id=\"T_0502a_row39_col3\" class=\"data row39 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row39_col4\" class=\"data row39 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row39_col5\" class=\"data row39 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row39_col6\" class=\"data row39 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row39_col7\" class=\"data row39 col7\" >['tabular_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row39_col8\" class=\"data row39 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row40_col0\" class=\"data row40 col0\" >validmind.data_validation.TabularDateTimeHistograms</td>\n",
+              "      <td id=\"T_0502a_row40_col1\" class=\"data row40 col1\" >Tabular Date Time Histograms</td>\n",
+              "      <td id=\"T_0502a_row40_col2\" class=\"data row40 col2\" >Generates histograms to provide graphical insight into the distribution of time intervals in a model's datetime...</td>\n",
+              "      <td id=\"T_0502a_row40_col3\" class=\"data row40 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row40_col4\" class=\"data row40 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row40_col5\" class=\"data row40 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row40_col6\" class=\"data row40 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row40_col7\" class=\"data row40 col7\" >['time_series_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row40_col8\" class=\"data row40 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row41_col0\" class=\"data row41 col0\" >validmind.data_validation.TabularDescriptionTables</td>\n",
+              "      <td id=\"T_0502a_row41_col1\" class=\"data row41 col1\" >Tabular Description Tables</td>\n",
+              "      <td id=\"T_0502a_row41_col2\" class=\"data row41 col2\" >Summarizes key descriptive statistics for numerical, categorical, and datetime variables in a dataset....</td>\n",
+              "      <td id=\"T_0502a_row41_col3\" class=\"data row41 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row41_col4\" class=\"data row41 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row41_col5\" class=\"data row41 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row41_col6\" class=\"data row41 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row41_col7\" class=\"data row41 col7\" >['tabular_data']</td>\n",
+              "      <td id=\"T_0502a_row41_col8\" class=\"data row41 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row42_col0\" class=\"data row42 col0\" >validmind.data_validation.TabularNumericalHistograms</td>\n",
+              "      <td id=\"T_0502a_row42_col1\" class=\"data row42 col1\" >Tabular Numerical Histograms</td>\n",
+              "      <td id=\"T_0502a_row42_col2\" class=\"data row42 col2\" >Generates histograms for each numerical feature in a dataset to provide visual insights into data distribution and...</td>\n",
+              "      <td id=\"T_0502a_row42_col3\" class=\"data row42 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row42_col4\" class=\"data row42 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row42_col5\" class=\"data row42 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row42_col6\" class=\"data row42 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row42_col7\" class=\"data row42 col7\" >['tabular_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row42_col8\" class=\"data row42 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row43_col0\" class=\"data row43 col0\" >validmind.data_validation.TargetRateBarPlots</td>\n",
+              "      <td id=\"T_0502a_row43_col1\" class=\"data row43 col1\" >Target Rate Bar Plots</td>\n",
+              "      <td id=\"T_0502a_row43_col2\" class=\"data row43 col2\" >Generates bar plots visualizing the default rates of categorical features for a classification machine learning...</td>\n",
+              "      <td id=\"T_0502a_row43_col3\" class=\"data row43 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row43_col4\" class=\"data row43 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row43_col5\" class=\"data row43 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row43_col6\" class=\"data row43 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row43_col7\" class=\"data row43 col7\" >['tabular_data', 'visualization', 'categorical_data']</td>\n",
+              "      <td id=\"T_0502a_row43_col8\" class=\"data row43 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row44_col0\" class=\"data row44 col0\" >validmind.data_validation.TimeSeriesDescription</td>\n",
+              "      <td id=\"T_0502a_row44_col1\" class=\"data row44 col1\" >Time Series Description</td>\n",
+              "      <td id=\"T_0502a_row44_col2\" class=\"data row44 col2\" >Generates a detailed analysis for the provided time series dataset, summarizing key statistics to identify trends,...</td>\n",
+              "      <td id=\"T_0502a_row44_col3\" class=\"data row44 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row44_col4\" class=\"data row44 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row44_col5\" class=\"data row44 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row44_col6\" class=\"data row44 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row44_col7\" class=\"data row44 col7\" >['time_series_data', 'analysis']</td>\n",
+              "      <td id=\"T_0502a_row44_col8\" class=\"data row44 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row45_col0\" class=\"data row45 col0\" >validmind.data_validation.TimeSeriesDescriptiveStatistics</td>\n",
+              "      <td id=\"T_0502a_row45_col1\" class=\"data row45 col1\" >Time Series Descriptive Statistics</td>\n",
+              "      <td id=\"T_0502a_row45_col2\" class=\"data row45 col2\" >Evaluates the descriptive statistics of a time series dataset to identify trends, patterns, and data quality issues....</td>\n",
+              "      <td id=\"T_0502a_row45_col3\" class=\"data row45 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row45_col4\" class=\"data row45 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row45_col5\" class=\"data row45 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row45_col6\" class=\"data row45 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row45_col7\" class=\"data row45 col7\" >['time_series_data', 'analysis']</td>\n",
+              "      <td id=\"T_0502a_row45_col8\" class=\"data row45 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row46_col0\" class=\"data row46 col0\" >validmind.data_validation.TimeSeriesFrequency</td>\n",
+              "      <td id=\"T_0502a_row46_col1\" class=\"data row46 col1\" >Time Series Frequency</td>\n",
+              "      <td id=\"T_0502a_row46_col2\" class=\"data row46 col2\" >Evaluates consistency of time series data frequency and generates a frequency plot....</td>\n",
+              "      <td id=\"T_0502a_row46_col3\" class=\"data row46 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row46_col4\" class=\"data row46 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row46_col5\" class=\"data row46 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row46_col6\" class=\"data row46 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row46_col7\" class=\"data row46 col7\" >['time_series_data']</td>\n",
+              "      <td id=\"T_0502a_row46_col8\" class=\"data row46 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row47_col0\" class=\"data row47 col0\" >validmind.data_validation.TimeSeriesHistogram</td>\n",
+              "      <td id=\"T_0502a_row47_col1\" class=\"data row47 col1\" >Time Series Histogram</td>\n",
+              "      <td id=\"T_0502a_row47_col2\" class=\"data row47 col2\" >Visualizes distribution of time-series data using histograms and Kernel Density Estimation (KDE) lines....</td>\n",
+              "      <td id=\"T_0502a_row47_col3\" class=\"data row47 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row47_col4\" class=\"data row47 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row47_col5\" class=\"data row47 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row47_col6\" class=\"data row47 col6\" >{'nbins': {'type': '_empty', 'default': 30}}</td>\n",
+              "      <td id=\"T_0502a_row47_col7\" class=\"data row47 col7\" >['data_validation', 'visualization', 'time_series_data']</td>\n",
+              "      <td id=\"T_0502a_row47_col8\" class=\"data row47 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row48_col0\" class=\"data row48 col0\" >validmind.data_validation.TimeSeriesLinePlot</td>\n",
+              "      <td id=\"T_0502a_row48_col1\" class=\"data row48 col1\" >Time Series Line Plot</td>\n",
+              "      <td id=\"T_0502a_row48_col2\" class=\"data row48 col2\" >Generates and analyses time-series data through line plots revealing trends, patterns, anomalies over time....</td>\n",
+              "      <td id=\"T_0502a_row48_col3\" class=\"data row48 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row48_col4\" class=\"data row48 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row48_col5\" class=\"data row48 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row48_col6\" class=\"data row48 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row48_col7\" class=\"data row48 col7\" >['time_series_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row48_col8\" class=\"data row48 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row49_col0\" class=\"data row49 col0\" >validmind.data_validation.TimeSeriesMissingValues</td>\n",
+              "      <td id=\"T_0502a_row49_col1\" class=\"data row49 col1\" >Time Series Missing Values</td>\n",
+              "      <td id=\"T_0502a_row49_col2\" class=\"data row49 col2\" >Validates time-series data quality by confirming the count of missing values is below a certain threshold....</td>\n",
+              "      <td id=\"T_0502a_row49_col3\" class=\"data row49 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row49_col4\" class=\"data row49 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row49_col5\" class=\"data row49 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row49_col6\" class=\"data row49 col6\" >{'min_threshold': {'type': 'int', 'default': 1}}</td>\n",
+              "      <td id=\"T_0502a_row49_col7\" class=\"data row49 col7\" >['time_series_data']</td>\n",
+              "      <td id=\"T_0502a_row49_col8\" class=\"data row49 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row50_col0\" class=\"data row50 col0\" >validmind.data_validation.TimeSeriesOutliers</td>\n",
+              "      <td id=\"T_0502a_row50_col1\" class=\"data row50 col1\" >Time Series Outliers</td>\n",
+              "      <td id=\"T_0502a_row50_col2\" class=\"data row50 col2\" >Identifies and visualizes outliers in time-series data using the z-score method....</td>\n",
+              "      <td id=\"T_0502a_row50_col3\" class=\"data row50 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row50_col4\" class=\"data row50 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row50_col5\" class=\"data row50 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row50_col6\" class=\"data row50 col6\" >{'zscore_threshold': {'type': 'int', 'default': 3}}</td>\n",
+              "      <td id=\"T_0502a_row50_col7\" class=\"data row50 col7\" >['time_series_data']</td>\n",
+              "      <td id=\"T_0502a_row50_col8\" class=\"data row50 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row51_col0\" class=\"data row51 col0\" >validmind.data_validation.TooManyZeroValues</td>\n",
+              "      <td id=\"T_0502a_row51_col1\" class=\"data row51 col1\" >Too Many Zero Values</td>\n",
+              "      <td id=\"T_0502a_row51_col2\" class=\"data row51 col2\" >Identifies numerical columns in a dataset that contain an excessive number of zero values, defined by a threshold...</td>\n",
+              "      <td id=\"T_0502a_row51_col3\" class=\"data row51 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row51_col4\" class=\"data row51 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row51_col5\" class=\"data row51 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row51_col6\" class=\"data row51 col6\" >{'max_percent_threshold': {'type': 'float', 'default': 0.03}}</td>\n",
+              "      <td id=\"T_0502a_row51_col7\" class=\"data row51 col7\" >['tabular_data']</td>\n",
+              "      <td id=\"T_0502a_row51_col8\" class=\"data row51 col8\" >['regression', 'classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row52_col0\" class=\"data row52 col0\" >validmind.data_validation.UniqueRows</td>\n",
+              "      <td id=\"T_0502a_row52_col1\" class=\"data row52 col1\" >Unique Rows</td>\n",
+              "      <td id=\"T_0502a_row52_col2\" class=\"data row52 col2\" >Verifies the diversity of the dataset by ensuring that the count of unique rows exceeds a prescribed threshold....</td>\n",
+              "      <td id=\"T_0502a_row52_col3\" class=\"data row52 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row52_col4\" class=\"data row52 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row52_col5\" class=\"data row52 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row52_col6\" class=\"data row52 col6\" >{'min_percent_threshold': {'type': 'float', 'default': 1}}</td>\n",
+              "      <td id=\"T_0502a_row52_col7\" class=\"data row52 col7\" >['tabular_data']</td>\n",
+              "      <td id=\"T_0502a_row52_col8\" class=\"data row52 col8\" >['regression', 'classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row53_col0\" class=\"data row53 col0\" >validmind.data_validation.WOEBinPlots</td>\n",
+              "      <td id=\"T_0502a_row53_col1\" class=\"data row53 col1\" >WOE Bin Plots</td>\n",
+              "      <td id=\"T_0502a_row53_col2\" class=\"data row53 col2\" >Generates visualizations of Weight of Evidence (WoE) and Information Value (IV) for understanding predictive power...</td>\n",
+              "      <td id=\"T_0502a_row53_col3\" class=\"data row53 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row53_col4\" class=\"data row53 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row53_col5\" class=\"data row53 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row53_col6\" class=\"data row53 col6\" >{'breaks_adj': {'type': 'list', 'default': None}, 'fig_height': {'type': 'int', 'default': 600}, 'fig_width': {'type': 'int', 'default': 500}}</td>\n",
+              "      <td id=\"T_0502a_row53_col7\" class=\"data row53 col7\" >['tabular_data', 'visualization', 'categorical_data']</td>\n",
+              "      <td id=\"T_0502a_row53_col8\" class=\"data row53 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row54_col0\" class=\"data row54 col0\" >validmind.data_validation.WOEBinTable</td>\n",
+              "      <td id=\"T_0502a_row54_col1\" class=\"data row54 col1\" >WOE Bin Table</td>\n",
+              "      <td id=\"T_0502a_row54_col2\" class=\"data row54 col2\" >Assesses the Weight of Evidence (WoE) and Information Value (IV) of each feature to evaluate its predictive power...</td>\n",
+              "      <td id=\"T_0502a_row54_col3\" class=\"data row54 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row54_col4\" class=\"data row54 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row54_col5\" class=\"data row54 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row54_col6\" class=\"data row54 col6\" >{'breaks_adj': {'type': 'list', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row54_col7\" class=\"data row54 col7\" >['tabular_data', 'categorical_data']</td>\n",
+              "      <td id=\"T_0502a_row54_col8\" class=\"data row54 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row55_col0\" class=\"data row55 col0\" >validmind.data_validation.ZivotAndrewsArch</td>\n",
+              "      <td id=\"T_0502a_row55_col1\" class=\"data row55 col1\" >Zivot Andrews Arch</td>\n",
+              "      <td id=\"T_0502a_row55_col2\" class=\"data row55 col2\" >Evaluates the order of integration and stationarity of time series data using the Zivot-Andrews unit root test....</td>\n",
+              "      <td id=\"T_0502a_row55_col3\" class=\"data row55 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row55_col4\" class=\"data row55 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row55_col5\" class=\"data row55 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row55_col6\" class=\"data row55 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row55_col7\" class=\"data row55 col7\" >['time_series_data', 'stationarity', 'unit_root_test']</td>\n",
+              "      <td id=\"T_0502a_row55_col8\" class=\"data row55 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row56_col0\" class=\"data row56 col0\" >validmind.data_validation.nlp.CommonWords</td>\n",
+              "      <td id=\"T_0502a_row56_col1\" class=\"data row56 col1\" >Common Words</td>\n",
+              "      <td id=\"T_0502a_row56_col2\" class=\"data row56 col2\" >Assesses the most frequent non-stopwords in a text column for identifying prevalent language patterns....</td>\n",
+              "      <td id=\"T_0502a_row56_col3\" class=\"data row56 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row56_col4\" class=\"data row56 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row56_col5\" class=\"data row56 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row56_col6\" class=\"data row56 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row56_col7\" class=\"data row56 col7\" >['nlp', 'text_data', 'visualization', 'frequency_analysis']</td>\n",
+              "      <td id=\"T_0502a_row56_col8\" class=\"data row56 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row57_col0\" class=\"data row57 col0\" >validmind.data_validation.nlp.Hashtags</td>\n",
+              "      <td id=\"T_0502a_row57_col1\" class=\"data row57 col1\" >Hashtags</td>\n",
+              "      <td id=\"T_0502a_row57_col2\" class=\"data row57 col2\" >Assesses hashtag frequency in a text column, highlighting usage trends and potential dataset bias or spam....</td>\n",
+              "      <td id=\"T_0502a_row57_col3\" class=\"data row57 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row57_col4\" class=\"data row57 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row57_col5\" class=\"data row57 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row57_col6\" class=\"data row57 col6\" >{'top_hashtags': {'type': 'int', 'default': 25}}</td>\n",
+              "      <td id=\"T_0502a_row57_col7\" class=\"data row57 col7\" >['nlp', 'text_data', 'visualization', 'frequency_analysis']</td>\n",
+              "      <td id=\"T_0502a_row57_col8\" class=\"data row57 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row58_col0\" class=\"data row58 col0\" >validmind.data_validation.nlp.LanguageDetection</td>\n",
+              "      <td id=\"T_0502a_row58_col1\" class=\"data row58 col1\" >Language Detection</td>\n",
+              "      <td id=\"T_0502a_row58_col2\" class=\"data row58 col2\" >Assesses the diversity of languages in a textual dataset by detecting and visualizing the distribution of languages....</td>\n",
+              "      <td id=\"T_0502a_row58_col3\" class=\"data row58 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row58_col4\" class=\"data row58 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row58_col5\" class=\"data row58 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row58_col6\" class=\"data row58 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row58_col7\" class=\"data row58 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row58_col8\" class=\"data row58 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row59_col0\" class=\"data row59 col0\" >validmind.data_validation.nlp.Mentions</td>\n",
+              "      <td id=\"T_0502a_row59_col1\" class=\"data row59 col1\" >Mentions</td>\n",
+              "      <td id=\"T_0502a_row59_col2\" class=\"data row59 col2\" >Calculates and visualizes frequencies of '@' prefixed mentions in a text-based dataset for NLP model analysis....</td>\n",
+              "      <td id=\"T_0502a_row59_col3\" class=\"data row59 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row59_col4\" class=\"data row59 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row59_col5\" class=\"data row59 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row59_col6\" class=\"data row59 col6\" >{'top_mentions': {'type': 'int', 'default': 25}}</td>\n",
+              "      <td id=\"T_0502a_row59_col7\" class=\"data row59 col7\" >['nlp', 'text_data', 'visualization', 'frequency_analysis']</td>\n",
+              "      <td id=\"T_0502a_row59_col8\" class=\"data row59 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row60_col0\" class=\"data row60 col0\" >validmind.data_validation.nlp.PolarityAndSubjectivity</td>\n",
+              "      <td id=\"T_0502a_row60_col1\" class=\"data row60 col1\" >Polarity And Subjectivity</td>\n",
+              "      <td id=\"T_0502a_row60_col2\" class=\"data row60 col2\" >Analyzes the polarity and subjectivity of text data within a given dataset to visualize the sentiment distribution....</td>\n",
+              "      <td id=\"T_0502a_row60_col3\" class=\"data row60 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row60_col4\" class=\"data row60 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row60_col5\" class=\"data row60 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row60_col6\" class=\"data row60 col6\" >{'threshold_subjectivity': {'type': '_empty', 'default': 0.5}, 'threshold_polarity': {'type': '_empty', 'default': 0}}</td>\n",
+              "      <td id=\"T_0502a_row60_col7\" class=\"data row60 col7\" >['nlp', 'text_data', 'data_validation']</td>\n",
+              "      <td id=\"T_0502a_row60_col8\" class=\"data row60 col8\" >['nlp']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row61_col0\" class=\"data row61 col0\" >validmind.data_validation.nlp.Punctuations</td>\n",
+              "      <td id=\"T_0502a_row61_col1\" class=\"data row61 col1\" >Punctuations</td>\n",
+              "      <td id=\"T_0502a_row61_col2\" class=\"data row61 col2\" >Analyzes and visualizes the frequency distribution of punctuation usage in a given text dataset....</td>\n",
+              "      <td id=\"T_0502a_row61_col3\" class=\"data row61 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row61_col4\" class=\"data row61 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row61_col5\" class=\"data row61 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row61_col6\" class=\"data row61 col6\" >{'count_mode': {'type': '_empty', 'default': 'token'}}</td>\n",
+              "      <td id=\"T_0502a_row61_col7\" class=\"data row61 col7\" >['nlp', 'text_data', 'visualization', 'frequency_analysis']</td>\n",
+              "      <td id=\"T_0502a_row61_col8\" class=\"data row61 col8\" >['text_classification', 'text_summarization', 'nlp']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row62_col0\" class=\"data row62 col0\" >validmind.data_validation.nlp.Sentiment</td>\n",
+              "      <td id=\"T_0502a_row62_col1\" class=\"data row62 col1\" >Sentiment</td>\n",
+              "      <td id=\"T_0502a_row62_col2\" class=\"data row62 col2\" >Analyzes the sentiment of text data within a dataset using the VADER sentiment analysis tool....</td>\n",
+              "      <td id=\"T_0502a_row62_col3\" class=\"data row62 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row62_col4\" class=\"data row62 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row62_col5\" class=\"data row62 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row62_col6\" class=\"data row62 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row62_col7\" class=\"data row62 col7\" >['nlp', 'text_data', 'data_validation']</td>\n",
+              "      <td id=\"T_0502a_row62_col8\" class=\"data row62 col8\" >['nlp']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row63_col0\" class=\"data row63 col0\" >validmind.data_validation.nlp.StopWords</td>\n",
+              "      <td id=\"T_0502a_row63_col1\" class=\"data row63 col1\" >Stop Words</td>\n",
+              "      <td id=\"T_0502a_row63_col2\" class=\"data row63 col2\" >Evaluates and visualizes the frequency of English stop words in a text dataset against a defined threshold....</td>\n",
+              "      <td id=\"T_0502a_row63_col3\" class=\"data row63 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row63_col4\" class=\"data row63 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row63_col5\" class=\"data row63 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row63_col6\" class=\"data row63 col6\" >{'min_percent_threshold': {'type': 'float', 'default': 0.5}, 'num_words': {'type': 'int', 'default': 25}}</td>\n",
+              "      <td id=\"T_0502a_row63_col7\" class=\"data row63 col7\" >['nlp', 'text_data', 'frequency_analysis', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row63_col8\" class=\"data row63 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row64_col0\" class=\"data row64 col0\" >validmind.data_validation.nlp.TextDescription</td>\n",
+              "      <td id=\"T_0502a_row64_col1\" class=\"data row64 col1\" >Text Description</td>\n",
+              "      <td id=\"T_0502a_row64_col2\" class=\"data row64 col2\" >Conducts comprehensive textual analysis on a dataset using NLTK to evaluate various parameters and generate...</td>\n",
+              "      <td id=\"T_0502a_row64_col3\" class=\"data row64 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row64_col4\" class=\"data row64 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row64_col5\" class=\"data row64 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row64_col6\" class=\"data row64 col6\" >{'unwanted_tokens': {'type': 'set', 'default': {'s', 'mrs', 'us', \"''\", ' ', 'ms', 'dr', 'dollar', '``', 'mr', \"'s\", \"s'\"}}, 'lang': {'type': 'str', 'default': 'english'}}</td>\n",
+              "      <td id=\"T_0502a_row64_col7\" class=\"data row64 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row64_col8\" class=\"data row64 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row65_col0\" class=\"data row65 col0\" >validmind.data_validation.nlp.Toxicity</td>\n",
+              "      <td id=\"T_0502a_row65_col1\" class=\"data row65 col1\" >Toxicity</td>\n",
+              "      <td id=\"T_0502a_row65_col2\" class=\"data row65 col2\" >Assesses the toxicity of text data within a dataset to visualize the distribution of toxicity scores....</td>\n",
+              "      <td id=\"T_0502a_row65_col3\" class=\"data row65 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row65_col4\" class=\"data row65 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row65_col5\" class=\"data row65 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row65_col6\" class=\"data row65 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row65_col7\" class=\"data row65 col7\" >['nlp', 'text_data', 'data_validation']</td>\n",
+              "      <td id=\"T_0502a_row65_col8\" class=\"data row65 col8\" >['nlp']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row66_col0\" class=\"data row66 col0\" >validmind.model_validation.BertScore</td>\n",
+              "      <td id=\"T_0502a_row66_col1\" class=\"data row66 col1\" >Bert Score</td>\n",
+              "      <td id=\"T_0502a_row66_col2\" class=\"data row66 col2\" >Assesses the quality of machine-generated text using BERTScore metrics and visualizes results through histograms...</td>\n",
+              "      <td id=\"T_0502a_row66_col3\" class=\"data row66 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row66_col4\" class=\"data row66 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row66_col5\" class=\"data row66 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row66_col6\" class=\"data row66 col6\" >{'evaluation_model': {'type': '_empty', 'default': 'distilbert-base-uncased'}}</td>\n",
+              "      <td id=\"T_0502a_row66_col7\" class=\"data row66 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row66_col8\" class=\"data row66 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row67_col0\" class=\"data row67 col0\" >validmind.model_validation.BleuScore</td>\n",
+              "      <td id=\"T_0502a_row67_col1\" class=\"data row67 col1\" >Bleu Score</td>\n",
+              "      <td id=\"T_0502a_row67_col2\" class=\"data row67 col2\" >Evaluates the quality of machine-generated text using BLEU metrics and visualizes the results through histograms...</td>\n",
+              "      <td id=\"T_0502a_row67_col3\" class=\"data row67 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row67_col4\" class=\"data row67 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row67_col5\" class=\"data row67 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row67_col6\" class=\"data row67 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row67_col7\" class=\"data row67 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row67_col8\" class=\"data row67 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row68_col0\" class=\"data row68 col0\" >validmind.model_validation.ClusterSizeDistribution</td>\n",
+              "      <td id=\"T_0502a_row68_col1\" class=\"data row68 col1\" >Cluster Size Distribution</td>\n",
+              "      <td id=\"T_0502a_row68_col2\" class=\"data row68 col2\" >Assesses the performance of clustering models by comparing the distribution of cluster sizes in model predictions...</td>\n",
+              "      <td id=\"T_0502a_row68_col3\" class=\"data row68 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row68_col4\" class=\"data row68 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row68_col5\" class=\"data row68 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row68_col6\" class=\"data row68 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row68_col7\" class=\"data row68 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row68_col8\" class=\"data row68 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row69_col0\" class=\"data row69 col0\" >validmind.model_validation.ContextualRecall</td>\n",
+              "      <td id=\"T_0502a_row69_col1\" class=\"data row69 col1\" >Contextual Recall</td>\n",
+              "      <td id=\"T_0502a_row69_col2\" class=\"data row69 col2\" >Evaluates a Natural Language Generation model's ability to generate contextually relevant and factually correct...</td>\n",
+              "      <td id=\"T_0502a_row69_col3\" class=\"data row69 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row69_col4\" class=\"data row69 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row69_col5\" class=\"data row69 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row69_col6\" class=\"data row69 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row69_col7\" class=\"data row69 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row69_col8\" class=\"data row69 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row70_col0\" class=\"data row70 col0\" >validmind.model_validation.FeaturesAUC</td>\n",
+              "      <td id=\"T_0502a_row70_col1\" class=\"data row70 col1\" >Features AUC</td>\n",
+              "      <td id=\"T_0502a_row70_col2\" class=\"data row70 col2\" >Evaluates the discriminatory power of each individual feature within a binary classification model by calculating...</td>\n",
+              "      <td id=\"T_0502a_row70_col3\" class=\"data row70 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row70_col4\" class=\"data row70 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row70_col5\" class=\"data row70 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row70_col6\" class=\"data row70 col6\" >{'fontsize': {'type': 'int', 'default': 12}, 'figure_height': {'type': 'int', 'default': 500}}</td>\n",
+              "      <td id=\"T_0502a_row70_col7\" class=\"data row70 col7\" >['feature_importance', 'AUC', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row70_col8\" class=\"data row70 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row71_col0\" class=\"data row71 col0\" >validmind.model_validation.MeteorScore</td>\n",
+              "      <td id=\"T_0502a_row71_col1\" class=\"data row71 col1\" >Meteor Score</td>\n",
+              "      <td id=\"T_0502a_row71_col2\" class=\"data row71 col2\" >Assesses the quality of machine-generated translations by comparing them to human-produced references using the...</td>\n",
+              "      <td id=\"T_0502a_row71_col3\" class=\"data row71 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row71_col4\" class=\"data row71 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row71_col5\" class=\"data row71 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row71_col6\" class=\"data row71 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row71_col7\" class=\"data row71 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row71_col8\" class=\"data row71 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row72_col0\" class=\"data row72 col0\" >validmind.model_validation.ModelMetadata</td>\n",
+              "      <td id=\"T_0502a_row72_col1\" class=\"data row72 col1\" >Model Metadata</td>\n",
+              "      <td id=\"T_0502a_row72_col2\" class=\"data row72 col2\" >Compare metadata of different models and generate a summary table with the results....</td>\n",
+              "      <td id=\"T_0502a_row72_col3\" class=\"data row72 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row72_col4\" class=\"data row72 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row72_col5\" class=\"data row72 col5\" >['model']</td>\n",
+              "      <td id=\"T_0502a_row72_col6\" class=\"data row72 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row72_col7\" class=\"data row72 col7\" >['model_training', 'metadata']</td>\n",
+              "      <td id=\"T_0502a_row72_col8\" class=\"data row72 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row73_col0\" class=\"data row73 col0\" >validmind.model_validation.ModelPredictionResiduals</td>\n",
+              "      <td id=\"T_0502a_row73_col1\" class=\"data row73 col1\" >Model Prediction Residuals</td>\n",
+              "      <td id=\"T_0502a_row73_col2\" class=\"data row73 col2\" >Assesses normality and behavior of residuals in regression models through visualization and statistical tests....</td>\n",
+              "      <td id=\"T_0502a_row73_col3\" class=\"data row73 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row73_col4\" class=\"data row73 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row73_col5\" class=\"data row73 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row73_col6\" class=\"data row73 col6\" >{'nbins': {'type': 'int', 'default': 100}, 'p_value_threshold': {'type': 'float', 'default': 0.05}, 'start_date': {'type': None, 'default': None}, 'end_date': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row73_col7\" class=\"data row73 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row73_col8\" class=\"data row73 col8\" >['residual_analysis', 'visualization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row74_col0\" class=\"data row74 col0\" >validmind.model_validation.RegardScore</td>\n",
+              "      <td id=\"T_0502a_row74_col1\" class=\"data row74 col1\" >Regard Score</td>\n",
+              "      <td id=\"T_0502a_row74_col2\" class=\"data row74 col2\" >Assesses the sentiment and potential biases in text generated by NLP models by computing and visualizing regard...</td>\n",
+              "      <td id=\"T_0502a_row74_col3\" class=\"data row74 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row74_col4\" class=\"data row74 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row74_col5\" class=\"data row74 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row74_col6\" class=\"data row74 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row74_col7\" class=\"data row74 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row74_col8\" class=\"data row74 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row75_col0\" class=\"data row75 col0\" >validmind.model_validation.RegressionResidualsPlot</td>\n",
+              "      <td id=\"T_0502a_row75_col1\" class=\"data row75 col1\" >Regression Residuals Plot</td>\n",
+              "      <td id=\"T_0502a_row75_col2\" class=\"data row75 col2\" >Evaluates regression model performance using residual distribution and actual vs. predicted plots....</td>\n",
+              "      <td id=\"T_0502a_row75_col3\" class=\"data row75 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row75_col4\" class=\"data row75 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row75_col5\" class=\"data row75 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row75_col6\" class=\"data row75 col6\" >{'bin_size': {'type': 'float', 'default': 0.1}}</td>\n",
+              "      <td id=\"T_0502a_row75_col7\" class=\"data row75 col7\" >['model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row75_col8\" class=\"data row75 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row76_col0\" class=\"data row76 col0\" >validmind.model_validation.RougeScore</td>\n",
+              "      <td id=\"T_0502a_row76_col1\" class=\"data row76 col1\" >Rouge Score</td>\n",
+              "      <td id=\"T_0502a_row76_col2\" class=\"data row76 col2\" >Assesses the quality of machine-generated text using ROUGE metrics and visualizes the results to provide...</td>\n",
+              "      <td id=\"T_0502a_row76_col3\" class=\"data row76 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row76_col4\" class=\"data row76 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row76_col5\" class=\"data row76 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row76_col6\" class=\"data row76 col6\" >{'metric': {'type': 'str', 'default': 'rouge-1'}}</td>\n",
+              "      <td id=\"T_0502a_row76_col7\" class=\"data row76 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row76_col8\" class=\"data row76 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row77_col0\" class=\"data row77 col0\" >validmind.model_validation.TimeSeriesPredictionWithCI</td>\n",
+              "      <td id=\"T_0502a_row77_col1\" class=\"data row77 col1\" >Time Series Prediction With CI</td>\n",
+              "      <td id=\"T_0502a_row77_col2\" class=\"data row77 col2\" >Assesses predictive accuracy and uncertainty in time series models, highlighting breaches beyond confidence...</td>\n",
+              "      <td id=\"T_0502a_row77_col3\" class=\"data row77 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row77_col4\" class=\"data row77 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row77_col5\" class=\"data row77 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row77_col6\" class=\"data row77 col6\" >{'confidence': {'type': 'float', 'default': 0.95}}</td>\n",
+              "      <td id=\"T_0502a_row77_col7\" class=\"data row77 col7\" >['model_predictions', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row77_col8\" class=\"data row77 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row78_col0\" class=\"data row78 col0\" >validmind.model_validation.TimeSeriesPredictionsPlot</td>\n",
+              "      <td id=\"T_0502a_row78_col1\" class=\"data row78 col1\" >Time Series Predictions Plot</td>\n",
+              "      <td id=\"T_0502a_row78_col2\" class=\"data row78 col2\" >Plot actual vs predicted values for time series data and generate a visual comparison for the model....</td>\n",
+              "      <td id=\"T_0502a_row78_col3\" class=\"data row78 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row78_col4\" class=\"data row78 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row78_col5\" class=\"data row78 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row78_col6\" class=\"data row78 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row78_col7\" class=\"data row78 col7\" >['model_predictions', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row78_col8\" class=\"data row78 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row79_col0\" class=\"data row79 col0\" >validmind.model_validation.TimeSeriesR2SquareBySegments</td>\n",
+              "      <td id=\"T_0502a_row79_col1\" class=\"data row79 col1\" >Time Series R2 Square By Segments</td>\n",
+              "      <td id=\"T_0502a_row79_col2\" class=\"data row79 col2\" >Evaluates the R-Squared values of regression models over specified time segments in time series data to assess...</td>\n",
+              "      <td id=\"T_0502a_row79_col3\" class=\"data row79 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row79_col4\" class=\"data row79 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row79_col5\" class=\"data row79 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row79_col6\" class=\"data row79 col6\" >{'segments': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row79_col7\" class=\"data row79 col7\" >['model_performance', 'sklearn']</td>\n",
+              "      <td id=\"T_0502a_row79_col8\" class=\"data row79 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row80_col0\" class=\"data row80 col0\" >validmind.model_validation.TokenDisparity</td>\n",
+              "      <td id=\"T_0502a_row80_col1\" class=\"data row80 col1\" >Token Disparity</td>\n",
+              "      <td id=\"T_0502a_row80_col2\" class=\"data row80 col2\" >Evaluates the token disparity between reference and generated texts, visualizing the results through histograms and...</td>\n",
+              "      <td id=\"T_0502a_row80_col3\" class=\"data row80 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row80_col4\" class=\"data row80 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row80_col5\" class=\"data row80 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row80_col6\" class=\"data row80 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row80_col7\" class=\"data row80 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row80_col8\" class=\"data row80 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row81_col0\" class=\"data row81 col0\" >validmind.model_validation.ToxicityScore</td>\n",
+              "      <td id=\"T_0502a_row81_col1\" class=\"data row81 col1\" >Toxicity Score</td>\n",
+              "      <td id=\"T_0502a_row81_col2\" class=\"data row81 col2\" >Assesses the toxicity levels of texts generated by NLP models to identify and mitigate harmful or offensive content....</td>\n",
+              "      <td id=\"T_0502a_row81_col3\" class=\"data row81 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row81_col4\" class=\"data row81 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row81_col5\" class=\"data row81 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row81_col6\" class=\"data row81 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row81_col7\" class=\"data row81 col7\" >['nlp', 'text_data', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row81_col8\" class=\"data row81 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row82_col0\" class=\"data row82 col0\" >validmind.model_validation.embeddings.ClusterDistribution</td>\n",
+              "      <td id=\"T_0502a_row82_col1\" class=\"data row82 col1\" >Cluster Distribution</td>\n",
+              "      <td id=\"T_0502a_row82_col2\" class=\"data row82 col2\" >Assesses the distribution of text embeddings across clusters produced by a model using KMeans clustering....</td>\n",
+              "      <td id=\"T_0502a_row82_col3\" class=\"data row82 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row82_col4\" class=\"data row82 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row82_col5\" class=\"data row82 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row82_col6\" class=\"data row82 col6\" >{'num_clusters': {'type': 'int', 'default': 5}}</td>\n",
+              "      <td id=\"T_0502a_row82_col7\" class=\"data row82 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row82_col8\" class=\"data row82 col8\" >['feature_extraction']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row83_col0\" class=\"data row83 col0\" >validmind.model_validation.embeddings.CosineSimilarityComparison</td>\n",
+              "      <td id=\"T_0502a_row83_col1\" class=\"data row83 col1\" >Cosine Similarity Comparison</td>\n",
+              "      <td id=\"T_0502a_row83_col2\" class=\"data row83 col2\" >Assesses the similarity between embeddings generated by different models using Cosine Similarity, providing both...</td>\n",
+              "      <td id=\"T_0502a_row83_col3\" class=\"data row83 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row83_col4\" class=\"data row83 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row83_col5\" class=\"data row83 col5\" >['dataset', 'models']</td>\n",
+              "      <td id=\"T_0502a_row83_col6\" class=\"data row83 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row83_col7\" class=\"data row83 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
+              "      <td id=\"T_0502a_row83_col8\" class=\"data row83 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row84_col0\" class=\"data row84 col0\" >validmind.model_validation.embeddings.CosineSimilarityDistribution</td>\n",
+              "      <td id=\"T_0502a_row84_col1\" class=\"data row84 col1\" >Cosine Similarity Distribution</td>\n",
+              "      <td id=\"T_0502a_row84_col2\" class=\"data row84 col2\" >Assesses the similarity between predicted text embeddings from a model using a Cosine Similarity distribution...</td>\n",
+              "      <td id=\"T_0502a_row84_col3\" class=\"data row84 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row84_col4\" class=\"data row84 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row84_col5\" class=\"data row84 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row84_col6\" class=\"data row84 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row84_col7\" class=\"data row84 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row84_col8\" class=\"data row84 col8\" >['feature_extraction']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row85_col0\" class=\"data row85 col0\" >validmind.model_validation.embeddings.CosineSimilarityHeatmap</td>\n",
+              "      <td id=\"T_0502a_row85_col1\" class=\"data row85 col1\" >Cosine Similarity Heatmap</td>\n",
+              "      <td id=\"T_0502a_row85_col2\" class=\"data row85 col2\" >Generates an interactive heatmap to visualize the cosine similarities among embeddings derived from a given model....</td>\n",
+              "      <td id=\"T_0502a_row85_col3\" class=\"data row85 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row85_col4\" class=\"data row85 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row85_col5\" class=\"data row85 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row85_col6\" class=\"data row85 col6\" >{'title': {'type': '_empty', 'default': 'Cosine Similarity Matrix'}, 'color': {'type': '_empty', 'default': 'Cosine Similarity'}, 'xaxis_title': {'type': '_empty', 'default': 'Index'}, 'yaxis_title': {'type': '_empty', 'default': 'Index'}, 'color_scale': {'type': '_empty', 'default': 'Blues'}}</td>\n",
+              "      <td id=\"T_0502a_row85_col7\" class=\"data row85 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
+              "      <td id=\"T_0502a_row85_col8\" class=\"data row85 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row86_col0\" class=\"data row86 col0\" >validmind.model_validation.embeddings.DescriptiveAnalytics</td>\n",
+              "      <td id=\"T_0502a_row86_col1\" class=\"data row86 col1\" >Descriptive Analytics</td>\n",
+              "      <td id=\"T_0502a_row86_col2\" class=\"data row86 col2\" >Evaluates statistical properties of text embeddings in an ML model via mean, median, and standard deviation...</td>\n",
+              "      <td id=\"T_0502a_row86_col3\" class=\"data row86 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row86_col4\" class=\"data row86 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row86_col5\" class=\"data row86 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row86_col6\" class=\"data row86 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row86_col7\" class=\"data row86 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row86_col8\" class=\"data row86 col8\" >['feature_extraction']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row87_col0\" class=\"data row87 col0\" >validmind.model_validation.embeddings.EmbeddingsVisualization2D</td>\n",
+              "      <td id=\"T_0502a_row87_col1\" class=\"data row87 col1\" >Embeddings Visualization2 D</td>\n",
+              "      <td id=\"T_0502a_row87_col2\" class=\"data row87 col2\" >Visualizes 2D representation of text embeddings generated by a model using t-SNE technique....</td>\n",
+              "      <td id=\"T_0502a_row87_col3\" class=\"data row87 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row87_col4\" class=\"data row87 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row87_col5\" class=\"data row87 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row87_col6\" class=\"data row87 col6\" >{'cluster_column': {'type': None, 'default': None}, 'perplexity': {'type': 'int', 'default': 30}}</td>\n",
+              "      <td id=\"T_0502a_row87_col7\" class=\"data row87 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row87_col8\" class=\"data row87 col8\" >['feature_extraction']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row88_col0\" class=\"data row88 col0\" >validmind.model_validation.embeddings.EuclideanDistanceComparison</td>\n",
+              "      <td id=\"T_0502a_row88_col1\" class=\"data row88 col1\" >Euclidean Distance Comparison</td>\n",
+              "      <td id=\"T_0502a_row88_col2\" class=\"data row88 col2\" >Assesses and visualizes the dissimilarity between model embeddings using Euclidean distance, providing insights...</td>\n",
+              "      <td id=\"T_0502a_row88_col3\" class=\"data row88 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row88_col4\" class=\"data row88 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row88_col5\" class=\"data row88 col5\" >['dataset', 'models']</td>\n",
+              "      <td id=\"T_0502a_row88_col6\" class=\"data row88 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row88_col7\" class=\"data row88 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
+              "      <td id=\"T_0502a_row88_col8\" class=\"data row88 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row89_col0\" class=\"data row89 col0\" >validmind.model_validation.embeddings.EuclideanDistanceHeatmap</td>\n",
+              "      <td id=\"T_0502a_row89_col1\" class=\"data row89 col1\" >Euclidean Distance Heatmap</td>\n",
+              "      <td id=\"T_0502a_row89_col2\" class=\"data row89 col2\" >Generates an interactive heatmap to visualize the Euclidean distances among embeddings derived from a given model....</td>\n",
+              "      <td id=\"T_0502a_row89_col3\" class=\"data row89 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row89_col4\" class=\"data row89 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row89_col5\" class=\"data row89 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row89_col6\" class=\"data row89 col6\" >{'title': {'type': '_empty', 'default': 'Euclidean Distance Matrix'}, 'color': {'type': '_empty', 'default': 'Euclidean Distance'}, 'xaxis_title': {'type': '_empty', 'default': 'Index'}, 'yaxis_title': {'type': '_empty', 'default': 'Index'}, 'color_scale': {'type': '_empty', 'default': 'Blues'}}</td>\n",
+              "      <td id=\"T_0502a_row89_col7\" class=\"data row89 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
+              "      <td id=\"T_0502a_row89_col8\" class=\"data row89 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row90_col0\" class=\"data row90 col0\" >validmind.model_validation.embeddings.PCAComponentsPairwisePlots</td>\n",
+              "      <td id=\"T_0502a_row90_col1\" class=\"data row90 col1\" >PCA Components Pairwise Plots</td>\n",
+              "      <td id=\"T_0502a_row90_col2\" class=\"data row90 col2\" >Generates scatter plots for pairwise combinations of principal component analysis (PCA) components of model...</td>\n",
+              "      <td id=\"T_0502a_row90_col3\" class=\"data row90 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row90_col4\" class=\"data row90 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row90_col5\" class=\"data row90 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row90_col6\" class=\"data row90 col6\" >{'n_components': {'type': 'int', 'default': 3}}</td>\n",
+              "      <td id=\"T_0502a_row90_col7\" class=\"data row90 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
+              "      <td id=\"T_0502a_row90_col8\" class=\"data row90 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row91_col0\" class=\"data row91 col0\" >validmind.model_validation.embeddings.StabilityAnalysisKeyword</td>\n",
+              "      <td id=\"T_0502a_row91_col1\" class=\"data row91 col1\" >Stability Analysis Keyword</td>\n",
+              "      <td id=\"T_0502a_row91_col2\" class=\"data row91 col2\" >Evaluates robustness of embedding models to keyword swaps in the test dataset....</td>\n",
+              "      <td id=\"T_0502a_row91_col3\" class=\"data row91 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row91_col4\" class=\"data row91 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row91_col5\" class=\"data row91 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row91_col6\" class=\"data row91 col6\" >{'keyword_dict': {'type': None, 'default': None}, 'mean_similarity_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
+              "      <td id=\"T_0502a_row91_col7\" class=\"data row91 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row91_col8\" class=\"data row91 col8\" >['feature_extraction']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row92_col0\" class=\"data row92 col0\" >validmind.model_validation.embeddings.StabilityAnalysisRandomNoise</td>\n",
+              "      <td id=\"T_0502a_row92_col1\" class=\"data row92 col1\" >Stability Analysis Random Noise</td>\n",
+              "      <td id=\"T_0502a_row92_col2\" class=\"data row92 col2\" >Assesses the robustness of text embeddings models to random noise introduced via text perturbations....</td>\n",
+              "      <td id=\"T_0502a_row92_col3\" class=\"data row92 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row92_col4\" class=\"data row92 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row92_col5\" class=\"data row92 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row92_col6\" class=\"data row92 col6\" >{'probability': {'type': 'float', 'default': 0.02}, 'mean_similarity_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
+              "      <td id=\"T_0502a_row92_col7\" class=\"data row92 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row92_col8\" class=\"data row92 col8\" >['feature_extraction']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row93_col0\" class=\"data row93 col0\" >validmind.model_validation.embeddings.StabilityAnalysisSynonyms</td>\n",
+              "      <td id=\"T_0502a_row93_col1\" class=\"data row93 col1\" >Stability Analysis Synonyms</td>\n",
+              "      <td id=\"T_0502a_row93_col2\" class=\"data row93 col2\" >Evaluates the stability of text embeddings models when words in test data are replaced by their synonyms randomly....</td>\n",
+              "      <td id=\"T_0502a_row93_col3\" class=\"data row93 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row93_col4\" class=\"data row93 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row93_col5\" class=\"data row93 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row93_col6\" class=\"data row93 col6\" >{'probability': {'type': 'float', 'default': 0.02}, 'mean_similarity_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
+              "      <td id=\"T_0502a_row93_col7\" class=\"data row93 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row93_col8\" class=\"data row93 col8\" >['feature_extraction']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row94_col0\" class=\"data row94 col0\" >validmind.model_validation.embeddings.StabilityAnalysisTranslation</td>\n",
+              "      <td id=\"T_0502a_row94_col1\" class=\"data row94 col1\" >Stability Analysis Translation</td>\n",
+              "      <td id=\"T_0502a_row94_col2\" class=\"data row94 col2\" >Evaluates robustness of text embeddings models to noise introduced by translating the original text to another...</td>\n",
+              "      <td id=\"T_0502a_row94_col3\" class=\"data row94 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row94_col4\" class=\"data row94 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row94_col5\" class=\"data row94 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row94_col6\" class=\"data row94 col6\" >{'source_lang': {'type': 'str', 'default': 'en'}, 'target_lang': {'type': 'str', 'default': 'fr'}, 'mean_similarity_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
+              "      <td id=\"T_0502a_row94_col7\" class=\"data row94 col7\" >['llm', 'text_data', 'embeddings', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row94_col8\" class=\"data row94 col8\" >['feature_extraction']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row95_col0\" class=\"data row95 col0\" >validmind.model_validation.embeddings.TSNEComponentsPairwisePlots</td>\n",
+              "      <td id=\"T_0502a_row95_col1\" class=\"data row95 col1\" >TSNE Components Pairwise Plots</td>\n",
+              "      <td id=\"T_0502a_row95_col2\" class=\"data row95 col2\" >Creates scatter plots for pairwise combinations of t-SNE components to visualize embeddings and highlight potential...</td>\n",
+              "      <td id=\"T_0502a_row95_col3\" class=\"data row95 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row95_col4\" class=\"data row95 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row95_col5\" class=\"data row95 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row95_col6\" class=\"data row95 col6\" >{'n_components': {'type': 'int', 'default': 2}, 'perplexity': {'type': 'int', 'default': 30}, 'title': {'type': 'str', 'default': 't-SNE'}}</td>\n",
+              "      <td id=\"T_0502a_row95_col7\" class=\"data row95 col7\" >['visualization', 'dimensionality_reduction', 'embeddings']</td>\n",
+              "      <td id=\"T_0502a_row95_col8\" class=\"data row95 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row96_col0\" class=\"data row96 col0\" >validmind.model_validation.ragas.AnswerCorrectness</td>\n",
+              "      <td id=\"T_0502a_row96_col1\" class=\"data row96 col1\" >Answer Correctness</td>\n",
+              "      <td id=\"T_0502a_row96_col2\" class=\"data row96 col2\" >Evaluates the correctness of answers in a dataset with respect to the provided ground...</td>\n",
+              "      <td id=\"T_0502a_row96_col3\" class=\"data row96 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row96_col4\" class=\"data row96 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row96_col5\" class=\"data row96 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row96_col6\" class=\"data row96 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'response_column': {'type': 'str', 'default': 'response'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row96_col7\" class=\"data row96 col7\" >['ragas', 'llm']</td>\n",
+              "      <td id=\"T_0502a_row96_col8\" class=\"data row96 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row97_col0\" class=\"data row97 col0\" >validmind.model_validation.ragas.AspectCritic</td>\n",
+              "      <td id=\"T_0502a_row97_col1\" class=\"data row97 col1\" >Aspect Critic</td>\n",
+              "      <td id=\"T_0502a_row97_col2\" class=\"data row97 col2\" >Evaluates generations against the following aspects: harmfulness, maliciousness,...</td>\n",
+              "      <td id=\"T_0502a_row97_col3\" class=\"data row97 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row97_col4\" class=\"data row97 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row97_col5\" class=\"data row97 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row97_col6\" class=\"data row97 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'response_column': {'type': 'str', 'default': 'response'}, 'retrieved_contexts_column': {'type': None, 'default': None}, 'aspects': {'type': None, 'default': ['coherence', 'conciseness', 'correctness', 'harmfulness', 'maliciousness']}, 'additional_aspects': {'type': None, 'default': None}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row97_col7\" class=\"data row97 col7\" >['ragas', 'llm', 'qualitative']</td>\n",
+              "      <td id=\"T_0502a_row97_col8\" class=\"data row97 col8\" >['text_summarization', 'text_generation', 'text_qa']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row98_col0\" class=\"data row98 col0\" >validmind.model_validation.ragas.ContextEntityRecall</td>\n",
+              "      <td id=\"T_0502a_row98_col1\" class=\"data row98 col1\" >Context Entity Recall</td>\n",
+              "      <td id=\"T_0502a_row98_col2\" class=\"data row98 col2\" >Evaluates the context entity recall for dataset entries and visualizes the results....</td>\n",
+              "      <td id=\"T_0502a_row98_col3\" class=\"data row98 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row98_col4\" class=\"data row98 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row98_col5\" class=\"data row98 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row98_col6\" class=\"data row98 col6\" >{'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row98_col7\" class=\"data row98 col7\" >['ragas', 'llm', 'retrieval_performance']</td>\n",
+              "      <td id=\"T_0502a_row98_col8\" class=\"data row98 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row99_col0\" class=\"data row99 col0\" >validmind.model_validation.ragas.ContextPrecision</td>\n",
+              "      <td id=\"T_0502a_row99_col1\" class=\"data row99 col1\" >Context Precision</td>\n",
+              "      <td id=\"T_0502a_row99_col2\" class=\"data row99 col2\" >Context Precision is a metric that evaluates whether all of the ground-truth...</td>\n",
+              "      <td id=\"T_0502a_row99_col3\" class=\"data row99 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row99_col4\" class=\"data row99 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row99_col5\" class=\"data row99 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row99_col6\" class=\"data row99 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row99_col7\" class=\"data row99 col7\" >['ragas', 'llm', 'retrieval_performance']</td>\n",
+              "      <td id=\"T_0502a_row99_col8\" class=\"data row99 col8\" >['text_qa', 'text_generation', 'text_summarization', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row100_col0\" class=\"data row100 col0\" >validmind.model_validation.ragas.ContextPrecisionWithoutReference</td>\n",
+              "      <td id=\"T_0502a_row100_col1\" class=\"data row100 col1\" >Context Precision Without Reference</td>\n",
+              "      <td id=\"T_0502a_row100_col2\" class=\"data row100 col2\" >Context Precision Without Reference is a metric used to evaluate the relevance of...</td>\n",
+              "      <td id=\"T_0502a_row100_col3\" class=\"data row100 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row100_col4\" class=\"data row100 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row100_col5\" class=\"data row100 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row100_col6\" class=\"data row100 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'response_column': {'type': 'str', 'default': 'response'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row100_col7\" class=\"data row100 col7\" >['ragas', 'llm', 'retrieval_performance']</td>\n",
+              "      <td id=\"T_0502a_row100_col8\" class=\"data row100 col8\" >['text_qa', 'text_generation', 'text_summarization', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row101_col0\" class=\"data row101 col0\" >validmind.model_validation.ragas.ContextRecall</td>\n",
+              "      <td id=\"T_0502a_row101_col1\" class=\"data row101 col1\" >Context Recall</td>\n",
+              "      <td id=\"T_0502a_row101_col2\" class=\"data row101 col2\" >Context recall measures the extent to which the retrieved context aligns with the...</td>\n",
+              "      <td id=\"T_0502a_row101_col3\" class=\"data row101 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row101_col4\" class=\"data row101 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row101_col5\" class=\"data row101 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row101_col6\" class=\"data row101 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row101_col7\" class=\"data row101 col7\" >['ragas', 'llm', 'retrieval_performance']</td>\n",
+              "      <td id=\"T_0502a_row101_col8\" class=\"data row101 col8\" >['text_qa', 'text_generation', 'text_summarization', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row102_col0\" class=\"data row102 col0\" >validmind.model_validation.ragas.Faithfulness</td>\n",
+              "      <td id=\"T_0502a_row102_col1\" class=\"data row102 col1\" >Faithfulness</td>\n",
+              "      <td id=\"T_0502a_row102_col2\" class=\"data row102 col2\" >Evaluates the faithfulness of the generated answers with respect to retrieved contexts....</td>\n",
+              "      <td id=\"T_0502a_row102_col3\" class=\"data row102 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row102_col4\" class=\"data row102 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row102_col5\" class=\"data row102 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row102_col6\" class=\"data row102 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'response_column': {'type': 'str', 'default': 'response'}, 'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row102_col7\" class=\"data row102 col7\" >['ragas', 'llm', 'rag_performance']</td>\n",
+              "      <td id=\"T_0502a_row102_col8\" class=\"data row102 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row103_col0\" class=\"data row103 col0\" >validmind.model_validation.ragas.NoiseSensitivity</td>\n",
+              "      <td id=\"T_0502a_row103_col1\" class=\"data row103 col1\" >Noise Sensitivity</td>\n",
+              "      <td id=\"T_0502a_row103_col2\" class=\"data row103 col2\" >Assesses the sensitivity of a Large Language Model (LLM) to noise in retrieved context by measuring how often it...</td>\n",
+              "      <td id=\"T_0502a_row103_col3\" class=\"data row103 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row103_col4\" class=\"data row103 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row103_col5\" class=\"data row103 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row103_col6\" class=\"data row103 col6\" >{'response_column': {'type': 'str', 'default': 'response'}, 'retrieved_contexts_column': {'type': 'str', 'default': 'retrieved_contexts'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'focus': {'type': 'str', 'default': 'relevant'}, 'user_input_column': {'type': 'str', 'default': 'user_input'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row103_col7\" class=\"data row103 col7\" >['ragas', 'llm', 'rag_performance']</td>\n",
+              "      <td id=\"T_0502a_row103_col8\" class=\"data row103 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row104_col0\" class=\"data row104 col0\" >validmind.model_validation.ragas.ResponseRelevancy</td>\n",
+              "      <td id=\"T_0502a_row104_col1\" class=\"data row104 col1\" >Response Relevancy</td>\n",
+              "      <td id=\"T_0502a_row104_col2\" class=\"data row104 col2\" >Assesses how pertinent the generated answer is to the given prompt....</td>\n",
+              "      <td id=\"T_0502a_row104_col3\" class=\"data row104 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row104_col4\" class=\"data row104 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row104_col5\" class=\"data row104 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row104_col6\" class=\"data row104 col6\" >{'user_input_column': {'type': 'str', 'default': 'user_input'}, 'retrieved_contexts_column': {'type': 'str', 'default': None}, 'response_column': {'type': 'str', 'default': 'response'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row104_col7\" class=\"data row104 col7\" >['ragas', 'llm', 'rag_performance']</td>\n",
+              "      <td id=\"T_0502a_row104_col8\" class=\"data row104 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row105_col0\" class=\"data row105 col0\" >validmind.model_validation.ragas.SemanticSimilarity</td>\n",
+              "      <td id=\"T_0502a_row105_col1\" class=\"data row105 col1\" >Semantic Similarity</td>\n",
+              "      <td id=\"T_0502a_row105_col2\" class=\"data row105 col2\" >Calculates the semantic similarity between generated responses and ground truths...</td>\n",
+              "      <td id=\"T_0502a_row105_col3\" class=\"data row105 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row105_col4\" class=\"data row105 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row105_col5\" class=\"data row105 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row105_col6\" class=\"data row105 col6\" >{'response_column': {'type': 'str', 'default': 'response'}, 'reference_column': {'type': 'str', 'default': 'reference'}, 'judge_llm': {'type': '_empty', 'default': None}, 'judge_embeddings': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row105_col7\" class=\"data row105 col7\" >['ragas', 'llm']</td>\n",
+              "      <td id=\"T_0502a_row105_col8\" class=\"data row105 col8\" >['text_qa', 'text_generation', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row106_col0\" class=\"data row106 col0\" >validmind.model_validation.sklearn.AdjustedMutualInformation</td>\n",
+              "      <td id=\"T_0502a_row106_col1\" class=\"data row106 col1\" >Adjusted Mutual Information</td>\n",
+              "      <td id=\"T_0502a_row106_col2\" class=\"data row106 col2\" >Evaluates clustering model performance by measuring mutual information between true and predicted labels, adjusting...</td>\n",
+              "      <td id=\"T_0502a_row106_col3\" class=\"data row106 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row106_col4\" class=\"data row106 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row106_col5\" class=\"data row106 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row106_col6\" class=\"data row106 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row106_col7\" class=\"data row106 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
+              "      <td id=\"T_0502a_row106_col8\" class=\"data row106 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row107_col0\" class=\"data row107 col0\" >validmind.model_validation.sklearn.AdjustedRandIndex</td>\n",
+              "      <td id=\"T_0502a_row107_col1\" class=\"data row107 col1\" >Adjusted Rand Index</td>\n",
+              "      <td id=\"T_0502a_row107_col2\" class=\"data row107 col2\" >Measures the similarity between two data clusters using the Adjusted Rand Index (ARI) metric in clustering machine...</td>\n",
+              "      <td id=\"T_0502a_row107_col3\" class=\"data row107 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row107_col4\" class=\"data row107 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row107_col5\" class=\"data row107 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row107_col6\" class=\"data row107 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row107_col7\" class=\"data row107 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
+              "      <td id=\"T_0502a_row107_col8\" class=\"data row107 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row108_col0\" class=\"data row108 col0\" >validmind.model_validation.sklearn.CalibrationCurve</td>\n",
+              "      <td id=\"T_0502a_row108_col1\" class=\"data row108 col1\" >Calibration Curve</td>\n",
+              "      <td id=\"T_0502a_row108_col2\" class=\"data row108 col2\" >Evaluates the calibration of probability estimates by comparing predicted probabilities against observed...</td>\n",
+              "      <td id=\"T_0502a_row108_col3\" class=\"data row108 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row108_col4\" class=\"data row108 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row108_col5\" class=\"data row108 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row108_col6\" class=\"data row108 col6\" >{'n_bins': {'type': 'int', 'default': 10}}</td>\n",
+              "      <td id=\"T_0502a_row108_col7\" class=\"data row108 col7\" >['sklearn', 'model_performance', 'classification']</td>\n",
+              "      <td id=\"T_0502a_row108_col8\" class=\"data row108 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row109_col0\" class=\"data row109 col0\" >validmind.model_validation.sklearn.ClassifierPerformance</td>\n",
+              "      <td id=\"T_0502a_row109_col1\" class=\"data row109 col1\" >Classifier Performance</td>\n",
+              "      <td id=\"T_0502a_row109_col2\" class=\"data row109 col2\" >Evaluates performance of binary or multiclass classification models using precision, recall, F1-Score, accuracy,...</td>\n",
+              "      <td id=\"T_0502a_row109_col3\" class=\"data row109 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row109_col4\" class=\"data row109 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row109_col5\" class=\"data row109 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row109_col6\" class=\"data row109 col6\" >{'average': {'type': 'str', 'default': 'macro'}}</td>\n",
+              "      <td id=\"T_0502a_row109_col7\" class=\"data row109 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row109_col8\" class=\"data row109 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row110_col0\" class=\"data row110 col0\" >validmind.model_validation.sklearn.ClassifierThresholdOptimization</td>\n",
+              "      <td id=\"T_0502a_row110_col1\" class=\"data row110 col1\" >Classifier Threshold Optimization</td>\n",
+              "      <td id=\"T_0502a_row110_col2\" class=\"data row110 col2\" >Analyzes and visualizes different threshold optimization methods for binary classification models....</td>\n",
+              "      <td id=\"T_0502a_row110_col3\" class=\"data row110 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row110_col4\" class=\"data row110 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row110_col5\" class=\"data row110 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row110_col6\" class=\"data row110 col6\" >{'methods': {'type': None, 'default': None}, 'target_recall': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row110_col7\" class=\"data row110 col7\" >['model_validation', 'threshold_optimization', 'classification_metrics']</td>\n",
+              "      <td id=\"T_0502a_row110_col8\" class=\"data row110 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row111_col0\" class=\"data row111 col0\" >validmind.model_validation.sklearn.ClusterCosineSimilarity</td>\n",
+              "      <td id=\"T_0502a_row111_col1\" class=\"data row111 col1\" >Cluster Cosine Similarity</td>\n",
+              "      <td id=\"T_0502a_row111_col2\" class=\"data row111 col2\" >Measures the intra-cluster similarity of a clustering model using cosine similarity....</td>\n",
+              "      <td id=\"T_0502a_row111_col3\" class=\"data row111 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row111_col4\" class=\"data row111 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row111_col5\" class=\"data row111 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row111_col6\" class=\"data row111 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row111_col7\" class=\"data row111 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
+              "      <td id=\"T_0502a_row111_col8\" class=\"data row111 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row112_col0\" class=\"data row112 col0\" >validmind.model_validation.sklearn.ClusterPerformanceMetrics</td>\n",
+              "      <td id=\"T_0502a_row112_col1\" class=\"data row112 col1\" >Cluster Performance Metrics</td>\n",
+              "      <td id=\"T_0502a_row112_col2\" class=\"data row112 col2\" >Evaluates the performance of clustering machine learning models using multiple established metrics....</td>\n",
+              "      <td id=\"T_0502a_row112_col3\" class=\"data row112 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row112_col4\" class=\"data row112 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row112_col5\" class=\"data row112 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row112_col6\" class=\"data row112 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row112_col7\" class=\"data row112 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
+              "      <td id=\"T_0502a_row112_col8\" class=\"data row112 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row113_col0\" class=\"data row113 col0\" >validmind.model_validation.sklearn.CompletenessScore</td>\n",
+              "      <td id=\"T_0502a_row113_col1\" class=\"data row113 col1\" >Completeness Score</td>\n",
+              "      <td id=\"T_0502a_row113_col2\" class=\"data row113 col2\" >Evaluates a clustering model's capacity to categorize instances from a single class into the same cluster....</td>\n",
+              "      <td id=\"T_0502a_row113_col3\" class=\"data row113 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row113_col4\" class=\"data row113 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row113_col5\" class=\"data row113 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row113_col6\" class=\"data row113 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row113_col7\" class=\"data row113 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
+              "      <td id=\"T_0502a_row113_col8\" class=\"data row113 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row114_col0\" class=\"data row114 col0\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
+              "      <td id=\"T_0502a_row114_col1\" class=\"data row114 col1\" >Confusion Matrix</td>\n",
+              "      <td id=\"T_0502a_row114_col2\" class=\"data row114 col2\" >Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix...</td>\n",
+              "      <td id=\"T_0502a_row114_col3\" class=\"data row114 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row114_col4\" class=\"data row114 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row114_col5\" class=\"data row114 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row114_col6\" class=\"data row114 col6\" >{'threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_0502a_row114_col7\" class=\"data row114 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row114_col8\" class=\"data row114 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row115_col0\" class=\"data row115 col0\" >validmind.model_validation.sklearn.FeatureImportance</td>\n",
+              "      <td id=\"T_0502a_row115_col1\" class=\"data row115 col1\" >Feature Importance</td>\n",
+              "      <td id=\"T_0502a_row115_col2\" class=\"data row115 col2\" >Compute feature importance scores for a given model and generate a summary table...</td>\n",
+              "      <td id=\"T_0502a_row115_col3\" class=\"data row115 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row115_col4\" class=\"data row115 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row115_col5\" class=\"data row115 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row115_col6\" class=\"data row115 col6\" >{'num_features': {'type': 'int', 'default': 3}}</td>\n",
+              "      <td id=\"T_0502a_row115_col7\" class=\"data row115 col7\" >['model_explainability', 'sklearn']</td>\n",
+              "      <td id=\"T_0502a_row115_col8\" class=\"data row115 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row116_col0\" class=\"data row116 col0\" >validmind.model_validation.sklearn.FowlkesMallowsScore</td>\n",
+              "      <td id=\"T_0502a_row116_col1\" class=\"data row116 col1\" >Fowlkes Mallows Score</td>\n",
+              "      <td id=\"T_0502a_row116_col2\" class=\"data row116 col2\" >Evaluates the similarity between predicted and actual cluster assignments in a model using the Fowlkes-Mallows...</td>\n",
+              "      <td id=\"T_0502a_row116_col3\" class=\"data row116 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row116_col4\" class=\"data row116 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row116_col5\" class=\"data row116 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row116_col6\" class=\"data row116 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row116_col7\" class=\"data row116 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row116_col8\" class=\"data row116 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row117_col0\" class=\"data row117 col0\" >validmind.model_validation.sklearn.HomogeneityScore</td>\n",
+              "      <td id=\"T_0502a_row117_col1\" class=\"data row117 col1\" >Homogeneity Score</td>\n",
+              "      <td id=\"T_0502a_row117_col2\" class=\"data row117 col2\" >Assesses clustering homogeneity by comparing true and predicted labels, scoring from 0 (heterogeneous) to 1...</td>\n",
+              "      <td id=\"T_0502a_row117_col3\" class=\"data row117 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row117_col4\" class=\"data row117 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row117_col5\" class=\"data row117 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row117_col6\" class=\"data row117 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row117_col7\" class=\"data row117 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row117_col8\" class=\"data row117 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row118_col0\" class=\"data row118 col0\" >validmind.model_validation.sklearn.HyperParametersTuning</td>\n",
+              "      <td id=\"T_0502a_row118_col1\" class=\"data row118 col1\" >Hyper Parameters Tuning</td>\n",
+              "      <td id=\"T_0502a_row118_col2\" class=\"data row118 col2\" >Performs exhaustive grid search over specified parameter ranges to find optimal model configurations...</td>\n",
+              "      <td id=\"T_0502a_row118_col3\" class=\"data row118 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row118_col4\" class=\"data row118 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row118_col5\" class=\"data row118 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row118_col6\" class=\"data row118 col6\" >{'param_grid': {'type': 'dict', 'default': None}, 'scoring': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}, 'fit_params': {'type': 'dict', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row118_col7\" class=\"data row118 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row118_col8\" class=\"data row118 col8\" >['clustering', 'classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row119_col0\" class=\"data row119 col0\" >validmind.model_validation.sklearn.KMeansClustersOptimization</td>\n",
+              "      <td id=\"T_0502a_row119_col1\" class=\"data row119 col1\" >K Means Clusters Optimization</td>\n",
+              "      <td id=\"T_0502a_row119_col2\" class=\"data row119 col2\" >Optimizes the number of clusters in K-means models using Elbow and Silhouette methods....</td>\n",
+              "      <td id=\"T_0502a_row119_col3\" class=\"data row119 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row119_col4\" class=\"data row119 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row119_col5\" class=\"data row119 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row119_col6\" class=\"data row119 col6\" >{'n_clusters': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row119_col7\" class=\"data row119 col7\" >['sklearn', 'model_performance', 'kmeans']</td>\n",
+              "      <td id=\"T_0502a_row119_col8\" class=\"data row119 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row120_col0\" class=\"data row120 col0\" >validmind.model_validation.sklearn.MinimumAccuracy</td>\n",
+              "      <td id=\"T_0502a_row120_col1\" class=\"data row120 col1\" >Minimum Accuracy</td>\n",
+              "      <td id=\"T_0502a_row120_col2\" class=\"data row120 col2\" >Checks if the model's prediction accuracy meets or surpasses a specified threshold....</td>\n",
+              "      <td id=\"T_0502a_row120_col3\" class=\"data row120 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row120_col4\" class=\"data row120 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row120_col5\" class=\"data row120 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row120_col6\" class=\"data row120 col6\" >{'min_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
+              "      <td id=\"T_0502a_row120_col7\" class=\"data row120 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row120_col8\" class=\"data row120 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row121_col0\" class=\"data row121 col0\" >validmind.model_validation.sklearn.MinimumF1Score</td>\n",
+              "      <td id=\"T_0502a_row121_col1\" class=\"data row121 col1\" >Minimum F1 Score</td>\n",
+              "      <td id=\"T_0502a_row121_col2\" class=\"data row121 col2\" >Assesses if the model's F1 score on the validation set meets a predefined minimum threshold, ensuring balanced...</td>\n",
+              "      <td id=\"T_0502a_row121_col3\" class=\"data row121 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row121_col4\" class=\"data row121 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row121_col5\" class=\"data row121 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row121_col6\" class=\"data row121 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_0502a_row121_col7\" class=\"data row121 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row121_col8\" class=\"data row121 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row122_col0\" class=\"data row122 col0\" >validmind.model_validation.sklearn.MinimumROCAUCScore</td>\n",
+              "      <td id=\"T_0502a_row122_col1\" class=\"data row122 col1\" >Minimum ROCAUC Score</td>\n",
+              "      <td id=\"T_0502a_row122_col2\" class=\"data row122 col2\" >Validates model by checking if the ROC AUC score meets or surpasses a specified threshold....</td>\n",
+              "      <td id=\"T_0502a_row122_col3\" class=\"data row122 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row122_col4\" class=\"data row122 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row122_col5\" class=\"data row122 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row122_col6\" class=\"data row122 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_0502a_row122_col7\" class=\"data row122 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row122_col8\" class=\"data row122 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row123_col0\" class=\"data row123 col0\" >validmind.model_validation.sklearn.ModelParameters</td>\n",
+              "      <td id=\"T_0502a_row123_col1\" class=\"data row123 col1\" >Model Parameters</td>\n",
+              "      <td id=\"T_0502a_row123_col2\" class=\"data row123 col2\" >Extracts and displays model parameters in a structured format for transparency and reproducibility....</td>\n",
+              "      <td id=\"T_0502a_row123_col3\" class=\"data row123 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row123_col4\" class=\"data row123 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row123_col5\" class=\"data row123 col5\" >['model']</td>\n",
+              "      <td id=\"T_0502a_row123_col6\" class=\"data row123 col6\" >{'model_params': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row123_col7\" class=\"data row123 col7\" >['model_training', 'metadata']</td>\n",
+              "      <td id=\"T_0502a_row123_col8\" class=\"data row123 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row124_col0\" class=\"data row124 col0\" >validmind.model_validation.sklearn.ModelsPerformanceComparison</td>\n",
+              "      <td id=\"T_0502a_row124_col1\" class=\"data row124 col1\" >Models Performance Comparison</td>\n",
+              "      <td id=\"T_0502a_row124_col2\" class=\"data row124 col2\" >Evaluates and compares the performance of multiple Machine Learning models using various metrics like accuracy,...</td>\n",
+              "      <td id=\"T_0502a_row124_col3\" class=\"data row124 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row124_col4\" class=\"data row124 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row124_col5\" class=\"data row124 col5\" >['dataset', 'models']</td>\n",
+              "      <td id=\"T_0502a_row124_col6\" class=\"data row124 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row124_col7\" class=\"data row124 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'model_comparison']</td>\n",
+              "      <td id=\"T_0502a_row124_col8\" class=\"data row124 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row125_col0\" class=\"data row125 col0\" >validmind.model_validation.sklearn.OverfitDiagnosis</td>\n",
+              "      <td id=\"T_0502a_row125_col1\" class=\"data row125 col1\" >Overfit Diagnosis</td>\n",
+              "      <td id=\"T_0502a_row125_col2\" class=\"data row125 col2\" >Assesses potential overfitting in a model's predictions, identifying regions where performance between training and...</td>\n",
+              "      <td id=\"T_0502a_row125_col3\" class=\"data row125 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row125_col4\" class=\"data row125 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row125_col5\" class=\"data row125 col5\" >['model', 'datasets']</td>\n",
+              "      <td id=\"T_0502a_row125_col6\" class=\"data row125 col6\" >{'metric': {'type': 'str', 'default': None}, 'cut_off_threshold': {'type': 'float', 'default': 0.04}}</td>\n",
+              "      <td id=\"T_0502a_row125_col7\" class=\"data row125 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'linear_regression', 'model_diagnosis']</td>\n",
+              "      <td id=\"T_0502a_row125_col8\" class=\"data row125 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row126_col0\" class=\"data row126 col0\" >validmind.model_validation.sklearn.PermutationFeatureImportance</td>\n",
+              "      <td id=\"T_0502a_row126_col1\" class=\"data row126 col1\" >Permutation Feature Importance</td>\n",
+              "      <td id=\"T_0502a_row126_col2\" class=\"data row126 col2\" >Assesses the significance of each feature in a model by evaluating the impact on model performance when feature...</td>\n",
+              "      <td id=\"T_0502a_row126_col3\" class=\"data row126 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row126_col4\" class=\"data row126 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row126_col5\" class=\"data row126 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row126_col6\" class=\"data row126 col6\" >{'fontsize': {'type': None, 'default': None}, 'figure_height': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row126_col7\" class=\"data row126 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row126_col8\" class=\"data row126 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row127_col0\" class=\"data row127 col0\" >validmind.model_validation.sklearn.PopulationStabilityIndex</td>\n",
+              "      <td id=\"T_0502a_row127_col1\" class=\"data row127 col1\" >Population Stability Index</td>\n",
+              "      <td id=\"T_0502a_row127_col2\" class=\"data row127 col2\" >Assesses the Population Stability Index (PSI) to quantify the stability of an ML model's predictions across...</td>\n",
+              "      <td id=\"T_0502a_row127_col3\" class=\"data row127 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row127_col4\" class=\"data row127 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row127_col5\" class=\"data row127 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row127_col6\" class=\"data row127 col6\" >{'num_bins': {'type': 'int', 'default': 10}, 'mode': {'type': 'str', 'default': 'fixed'}}</td>\n",
+              "      <td id=\"T_0502a_row127_col7\" class=\"data row127 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row127_col8\" class=\"data row127 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row128_col0\" class=\"data row128 col0\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
+              "      <td id=\"T_0502a_row128_col1\" class=\"data row128 col1\" >Precision Recall Curve</td>\n",
+              "      <td id=\"T_0502a_row128_col2\" class=\"data row128 col2\" >Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve....</td>\n",
+              "      <td id=\"T_0502a_row128_col3\" class=\"data row128 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row128_col4\" class=\"data row128 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row128_col5\" class=\"data row128 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row128_col6\" class=\"data row128 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row128_col7\" class=\"data row128 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row128_col8\" class=\"data row128 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row129_col0\" class=\"data row129 col0\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
+              "      <td id=\"T_0502a_row129_col1\" class=\"data row129 col1\" >ROC Curve</td>\n",
+              "      <td id=\"T_0502a_row129_col2\" class=\"data row129 col2\" >Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic...</td>\n",
+              "      <td id=\"T_0502a_row129_col3\" class=\"data row129 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row129_col4\" class=\"data row129 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row129_col5\" class=\"data row129 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row129_col6\" class=\"data row129 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row129_col7\" class=\"data row129 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row129_col8\" class=\"data row129 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row130_col0\" class=\"data row130 col0\" >validmind.model_validation.sklearn.RegressionErrors</td>\n",
+              "      <td id=\"T_0502a_row130_col1\" class=\"data row130 col1\" >Regression Errors</td>\n",
+              "      <td id=\"T_0502a_row130_col2\" class=\"data row130 col2\" >Assesses the performance and error distribution of a regression model using various error metrics....</td>\n",
+              "      <td id=\"T_0502a_row130_col3\" class=\"data row130 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row130_col4\" class=\"data row130 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row130_col5\" class=\"data row130 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row130_col6\" class=\"data row130 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row130_col7\" class=\"data row130 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row130_col8\" class=\"data row130 col8\" >['regression', 'classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row131_col0\" class=\"data row131 col0\" >validmind.model_validation.sklearn.RegressionErrorsComparison</td>\n",
+              "      <td id=\"T_0502a_row131_col1\" class=\"data row131 col1\" >Regression Errors Comparison</td>\n",
+              "      <td id=\"T_0502a_row131_col2\" class=\"data row131 col2\" >Assesses multiple regression error metrics to compare model performance across different datasets, emphasizing...</td>\n",
+              "      <td id=\"T_0502a_row131_col3\" class=\"data row131 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row131_col4\" class=\"data row131 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row131_col5\" class=\"data row131 col5\" >['datasets', 'models']</td>\n",
+              "      <td id=\"T_0502a_row131_col6\" class=\"data row131 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row131_col7\" class=\"data row131 col7\" >['model_performance', 'sklearn']</td>\n",
+              "      <td id=\"T_0502a_row131_col8\" class=\"data row131 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row132_col0\" class=\"data row132 col0\" >validmind.model_validation.sklearn.RegressionPerformance</td>\n",
+              "      <td id=\"T_0502a_row132_col1\" class=\"data row132 col1\" >Regression Performance</td>\n",
+              "      <td id=\"T_0502a_row132_col2\" class=\"data row132 col2\" >Evaluates the performance of a regression model using five different metrics: MAE, MSE, RMSE, MAPE, and MBD....</td>\n",
+              "      <td id=\"T_0502a_row132_col3\" class=\"data row132 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row132_col4\" class=\"data row132 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row132_col5\" class=\"data row132 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row132_col6\" class=\"data row132 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row132_col7\" class=\"data row132 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row132_col8\" class=\"data row132 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row133_col0\" class=\"data row133 col0\" >validmind.model_validation.sklearn.RegressionR2Square</td>\n",
+              "      <td id=\"T_0502a_row133_col1\" class=\"data row133 col1\" >Regression R2 Square</td>\n",
+              "      <td id=\"T_0502a_row133_col2\" class=\"data row133 col2\" >Assesses the overall goodness-of-fit of a regression model by evaluating R-squared (R2) and Adjusted R-squared (Adj...</td>\n",
+              "      <td id=\"T_0502a_row133_col3\" class=\"data row133 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row133_col4\" class=\"data row133 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row133_col5\" class=\"data row133 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row133_col6\" class=\"data row133 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row133_col7\" class=\"data row133 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row133_col8\" class=\"data row133 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row134_col0\" class=\"data row134 col0\" >validmind.model_validation.sklearn.RegressionR2SquareComparison</td>\n",
+              "      <td id=\"T_0502a_row134_col1\" class=\"data row134 col1\" >Regression R2 Square Comparison</td>\n",
+              "      <td id=\"T_0502a_row134_col2\" class=\"data row134 col2\" >Compares R-Squared and Adjusted R-Squared values for different regression models across multiple datasets to assess...</td>\n",
+              "      <td id=\"T_0502a_row134_col3\" class=\"data row134 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row134_col4\" class=\"data row134 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row134_col5\" class=\"data row134 col5\" >['datasets', 'models']</td>\n",
+              "      <td id=\"T_0502a_row134_col6\" class=\"data row134 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row134_col7\" class=\"data row134 col7\" >['model_performance', 'sklearn']</td>\n",
+              "      <td id=\"T_0502a_row134_col8\" class=\"data row134 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row135_col0\" class=\"data row135 col0\" >validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
+              "      <td id=\"T_0502a_row135_col1\" class=\"data row135 col1\" >Robustness Diagnosis</td>\n",
+              "      <td id=\"T_0502a_row135_col2\" class=\"data row135 col2\" >Assesses the robustness of a machine learning model by evaluating performance decay under noisy conditions....</td>\n",
+              "      <td id=\"T_0502a_row135_col3\" class=\"data row135 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row135_col4\" class=\"data row135 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row135_col5\" class=\"data row135 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row135_col6\" class=\"data row135 col6\" >{'metric': {'type': 'str', 'default': None}, 'scaling_factor_std_dev_list': {'type': None, 'default': [0.1, 0.2, 0.3, 0.4, 0.5]}, 'performance_decay_threshold': {'type': 'float', 'default': 0.05}}</td>\n",
+              "      <td id=\"T_0502a_row135_col7\" class=\"data row135 col7\" >['sklearn', 'model_diagnosis', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row135_col8\" class=\"data row135 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row136_col0\" class=\"data row136 col0\" >validmind.model_validation.sklearn.SHAPGlobalImportance</td>\n",
+              "      <td id=\"T_0502a_row136_col1\" class=\"data row136 col1\" >SHAP Global Importance</td>\n",
+              "      <td id=\"T_0502a_row136_col2\" class=\"data row136 col2\" >Evaluates and visualizes global feature importance using SHAP values for model explanation and risk identification....</td>\n",
+              "      <td id=\"T_0502a_row136_col3\" class=\"data row136 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row136_col4\" class=\"data row136 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row136_col5\" class=\"data row136 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row136_col6\" class=\"data row136 col6\" >{'kernel_explainer_samples': {'type': 'int', 'default': 10}, 'tree_or_linear_explainer_samples': {'type': 'int', 'default': 200}, 'class_of_interest': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row136_col7\" class=\"data row136 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row136_col8\" class=\"data row136 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row137_col0\" class=\"data row137 col0\" >validmind.model_validation.sklearn.ScoreProbabilityAlignment</td>\n",
+              "      <td id=\"T_0502a_row137_col1\" class=\"data row137 col1\" >Score Probability Alignment</td>\n",
+              "      <td id=\"T_0502a_row137_col2\" class=\"data row137 col2\" >Analyzes the alignment between credit scores and predicted probabilities....</td>\n",
+              "      <td id=\"T_0502a_row137_col3\" class=\"data row137 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row137_col4\" class=\"data row137 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row137_col5\" class=\"data row137 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row137_col6\" class=\"data row137 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'n_bins': {'type': 'int', 'default': 10}}</td>\n",
+              "      <td id=\"T_0502a_row137_col7\" class=\"data row137 col7\" >['visualization', 'credit_risk', 'calibration']</td>\n",
+              "      <td id=\"T_0502a_row137_col8\" class=\"data row137 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row138_col0\" class=\"data row138 col0\" >validmind.model_validation.sklearn.SilhouettePlot</td>\n",
+              "      <td id=\"T_0502a_row138_col1\" class=\"data row138 col1\" >Silhouette Plot</td>\n",
+              "      <td id=\"T_0502a_row138_col2\" class=\"data row138 col2\" >Calculates and visualizes Silhouette Score, assessing the degree of data point suitability to its cluster in ML...</td>\n",
+              "      <td id=\"T_0502a_row138_col3\" class=\"data row138 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row138_col4\" class=\"data row138 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row138_col5\" class=\"data row138 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row138_col6\" class=\"data row138 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row138_col7\" class=\"data row138 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row138_col8\" class=\"data row138 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row139_col0\" class=\"data row139 col0\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
+              "      <td id=\"T_0502a_row139_col1\" class=\"data row139 col1\" >Training Test Degradation</td>\n",
+              "      <td id=\"T_0502a_row139_col2\" class=\"data row139 col2\" >Tests if model performance degradation between training and test datasets exceeds a predefined threshold....</td>\n",
+              "      <td id=\"T_0502a_row139_col3\" class=\"data row139 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row139_col4\" class=\"data row139 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row139_col5\" class=\"data row139 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row139_col6\" class=\"data row139 col6\" >{'max_threshold': {'type': 'float', 'default': 0.1}}</td>\n",
+              "      <td id=\"T_0502a_row139_col7\" class=\"data row139 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row139_col8\" class=\"data row139 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row140_col0\" class=\"data row140 col0\" >validmind.model_validation.sklearn.VMeasure</td>\n",
+              "      <td id=\"T_0502a_row140_col1\" class=\"data row140 col1\" >V Measure</td>\n",
+              "      <td id=\"T_0502a_row140_col2\" class=\"data row140 col2\" >Evaluates homogeneity and completeness of a clustering model using the V Measure Score....</td>\n",
+              "      <td id=\"T_0502a_row140_col3\" class=\"data row140 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row140_col4\" class=\"data row140 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row140_col5\" class=\"data row140 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row140_col6\" class=\"data row140 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row140_col7\" class=\"data row140 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row140_col8\" class=\"data row140 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row141_col0\" class=\"data row141 col0\" >validmind.model_validation.sklearn.WeakspotsDiagnosis</td>\n",
+              "      <td id=\"T_0502a_row141_col1\" class=\"data row141 col1\" >Weakspots Diagnosis</td>\n",
+              "      <td id=\"T_0502a_row141_col2\" class=\"data row141 col2\" >Identifies and visualizes weak spots in a machine learning model's performance across various sections of the...</td>\n",
+              "      <td id=\"T_0502a_row141_col3\" class=\"data row141 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row141_col4\" class=\"data row141 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row141_col5\" class=\"data row141 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row141_col6\" class=\"data row141 col6\" >{'features_columns': {'type': None, 'default': None}, 'metrics': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row141_col7\" class=\"data row141 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_diagnosis', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row141_col8\" class=\"data row141 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row142_col0\" class=\"data row142 col0\" >validmind.model_validation.statsmodels.AutoARIMA</td>\n",
+              "      <td id=\"T_0502a_row142_col1\" class=\"data row142 col1\" >Auto ARIMA</td>\n",
+              "      <td id=\"T_0502a_row142_col2\" class=\"data row142 col2\" >Evaluates ARIMA models for time-series forecasting, ranking them using Bayesian and Akaike Information Criteria....</td>\n",
+              "      <td id=\"T_0502a_row142_col3\" class=\"data row142 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row142_col4\" class=\"data row142 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row142_col5\" class=\"data row142 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row142_col6\" class=\"data row142 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row142_col7\" class=\"data row142 col7\" >['time_series_data', 'forecasting', 'model_selection', 'statsmodels']</td>\n",
+              "      <td id=\"T_0502a_row142_col8\" class=\"data row142 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row143_col0\" class=\"data row143 col0\" >validmind.model_validation.statsmodels.CumulativePredictionProbabilities</td>\n",
+              "      <td id=\"T_0502a_row143_col1\" class=\"data row143 col1\" >Cumulative Prediction Probabilities</td>\n",
+              "      <td id=\"T_0502a_row143_col2\" class=\"data row143 col2\" >Visualizes cumulative probabilities of positive and negative classes for both training and testing in classification models....</td>\n",
+              "      <td id=\"T_0502a_row143_col3\" class=\"data row143 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row143_col4\" class=\"data row143 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row143_col5\" class=\"data row143 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row143_col6\" class=\"data row143 col6\" >{'title': {'type': 'str', 'default': 'Cumulative Probabilities'}}</td>\n",
+              "      <td id=\"T_0502a_row143_col7\" class=\"data row143 col7\" >['visualization', 'credit_risk']</td>\n",
+              "      <td id=\"T_0502a_row143_col8\" class=\"data row143 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row144_col0\" class=\"data row144 col0\" >validmind.model_validation.statsmodels.DurbinWatsonTest</td>\n",
+              "      <td id=\"T_0502a_row144_col1\" class=\"data row144 col1\" >Durbin Watson Test</td>\n",
+              "      <td id=\"T_0502a_row144_col2\" class=\"data row144 col2\" >Assesses autocorrelation in time series data features using the Durbin-Watson statistic....</td>\n",
+              "      <td id=\"T_0502a_row144_col3\" class=\"data row144 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row144_col4\" class=\"data row144 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row144_col5\" class=\"data row144 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row144_col6\" class=\"data row144 col6\" >{'threshold': {'type': None, 'default': [1.5, 2.5]}}</td>\n",
+              "      <td id=\"T_0502a_row144_col7\" class=\"data row144 col7\" >['time_series_data', 'forecasting', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_0502a_row144_col8\" class=\"data row144 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row145_col0\" class=\"data row145 col0\" >validmind.model_validation.statsmodels.GINITable</td>\n",
+              "      <td id=\"T_0502a_row145_col1\" class=\"data row145 col1\" >GINI Table</td>\n",
+              "      <td id=\"T_0502a_row145_col2\" class=\"data row145 col2\" >Evaluates classification model performance using AUC, GINI, and KS metrics for training and test datasets....</td>\n",
+              "      <td id=\"T_0502a_row145_col3\" class=\"data row145 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row145_col4\" class=\"data row145 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row145_col5\" class=\"data row145 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row145_col6\" class=\"data row145 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row145_col7\" class=\"data row145 col7\" >['model_performance']</td>\n",
+              "      <td id=\"T_0502a_row145_col8\" class=\"data row145 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row146_col0\" class=\"data row146 col0\" >validmind.model_validation.statsmodels.KolmogorovSmirnov</td>\n",
+              "      <td id=\"T_0502a_row146_col1\" class=\"data row146 col1\" >Kolmogorov Smirnov</td>\n",
+              "      <td id=\"T_0502a_row146_col2\" class=\"data row146 col2\" >Assesses whether each feature in the dataset aligns with a normal distribution using the Kolmogorov-Smirnov test....</td>\n",
+              "      <td id=\"T_0502a_row146_col3\" class=\"data row146 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row146_col4\" class=\"data row146 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row146_col5\" class=\"data row146 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row146_col6\" class=\"data row146 col6\" >{'dist': {'type': 'str', 'default': 'norm'}}</td>\n",
+              "      <td id=\"T_0502a_row146_col7\" class=\"data row146 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_0502a_row146_col8\" class=\"data row146 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row147_col0\" class=\"data row147 col0\" >validmind.model_validation.statsmodels.Lilliefors</td>\n",
+              "      <td id=\"T_0502a_row147_col1\" class=\"data row147 col1\" >Lilliefors</td>\n",
+              "      <td id=\"T_0502a_row147_col2\" class=\"data row147 col2\" >Assesses the normality of feature distributions in an ML model's training dataset using the Lilliefors test....</td>\n",
+              "      <td id=\"T_0502a_row147_col3\" class=\"data row147 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row147_col4\" class=\"data row147 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row147_col5\" class=\"data row147 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row147_col6\" class=\"data row147 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row147_col7\" class=\"data row147 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_0502a_row147_col8\" class=\"data row147 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row148_col0\" class=\"data row148 col0\" >validmind.model_validation.statsmodels.PredictionProbabilitiesHistogram</td>\n",
+              "      <td id=\"T_0502a_row148_col1\" class=\"data row148 col1\" >Prediction Probabilities Histogram</td>\n",
+              "      <td id=\"T_0502a_row148_col2\" class=\"data row148 col2\" >Assesses the predictive probability distribution for binary classification to evaluate model performance and...</td>\n",
+              "      <td id=\"T_0502a_row148_col3\" class=\"data row148 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row148_col4\" class=\"data row148 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row148_col5\" class=\"data row148 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row148_col6\" class=\"data row148 col6\" >{'title': {'type': 'str', 'default': 'Histogram of Predictive Probabilities'}}</td>\n",
+              "      <td id=\"T_0502a_row148_col7\" class=\"data row148 col7\" >['visualization', 'credit_risk']</td>\n",
+              "      <td id=\"T_0502a_row148_col8\" class=\"data row148 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row149_col0\" class=\"data row149 col0\" >validmind.model_validation.statsmodels.RegressionCoeffs</td>\n",
+              "      <td id=\"T_0502a_row149_col1\" class=\"data row149 col1\" >Regression Coeffs</td>\n",
+              "      <td id=\"T_0502a_row149_col2\" class=\"data row149 col2\" >Assesses the significance and uncertainty of predictor variables in a regression model through visualization of...</td>\n",
+              "      <td id=\"T_0502a_row149_col3\" class=\"data row149 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row149_col4\" class=\"data row149 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row149_col5\" class=\"data row149 col5\" >['model']</td>\n",
+              "      <td id=\"T_0502a_row149_col6\" class=\"data row149 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row149_col7\" class=\"data row149 col7\" >['tabular_data', 'visualization', 'model_training']</td>\n",
+              "      <td id=\"T_0502a_row149_col8\" class=\"data row149 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row150_col0\" class=\"data row150 col0\" >validmind.model_validation.statsmodels.RegressionFeatureSignificance</td>\n",
+              "      <td id=\"T_0502a_row150_col1\" class=\"data row150 col1\" >Regression Feature Significance</td>\n",
+              "      <td id=\"T_0502a_row150_col2\" class=\"data row150 col2\" >Assesses and visualizes the statistical significance of features in a regression model....</td>\n",
+              "      <td id=\"T_0502a_row150_col3\" class=\"data row150 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row150_col4\" class=\"data row150 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row150_col5\" class=\"data row150 col5\" >['model']</td>\n",
+              "      <td id=\"T_0502a_row150_col6\" class=\"data row150 col6\" >{'fontsize': {'type': 'int', 'default': 10}, 'p_threshold': {'type': 'float', 'default': 0.05}}</td>\n",
+              "      <td id=\"T_0502a_row150_col7\" class=\"data row150 col7\" >['statistical_test', 'model_interpretation', 'visualization', 'feature_importance']</td>\n",
+              "      <td id=\"T_0502a_row150_col8\" class=\"data row150 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row151_col0\" class=\"data row151 col0\" >validmind.model_validation.statsmodels.RegressionModelForecastPlot</td>\n",
+              "      <td id=\"T_0502a_row151_col1\" class=\"data row151 col1\" >Regression Model Forecast Plot</td>\n",
+              "      <td id=\"T_0502a_row151_col2\" class=\"data row151 col2\" >Generates plots to visually compare the forecasted outcomes of a regression model against actual observed values over...</td>\n",
+              "      <td id=\"T_0502a_row151_col3\" class=\"data row151 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row151_col4\" class=\"data row151 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row151_col5\" class=\"data row151 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row151_col6\" class=\"data row151 col6\" >{'start_date': {'type': None, 'default': None}, 'end_date': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row151_col7\" class=\"data row151 col7\" >['time_series_data', 'forecasting', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row151_col8\" class=\"data row151 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row152_col0\" class=\"data row152 col0\" >validmind.model_validation.statsmodels.RegressionModelForecastPlotLevels</td>\n",
+              "      <td id=\"T_0502a_row152_col1\" class=\"data row152 col1\" >Regression Model Forecast Plot Levels</td>\n",
+              "      <td id=\"T_0502a_row152_col2\" class=\"data row152 col2\" >Assesses the alignment between forecasted and observed values in regression models through visual plots...</td>\n",
+              "      <td id=\"T_0502a_row152_col3\" class=\"data row152 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row152_col4\" class=\"data row152 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row152_col5\" class=\"data row152 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row152_col6\" class=\"data row152 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row152_col7\" class=\"data row152 col7\" >['time_series_data', 'forecasting', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row152_col8\" class=\"data row152 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row153_col0\" class=\"data row153 col0\" >validmind.model_validation.statsmodels.RegressionModelSensitivityPlot</td>\n",
+              "      <td id=\"T_0502a_row153_col1\" class=\"data row153 col1\" >Regression Model Sensitivity Plot</td>\n",
+              "      <td id=\"T_0502a_row153_col2\" class=\"data row153 col2\" >Assesses the sensitivity of a regression model to changes in independent variables by applying shocks and...</td>\n",
+              "      <td id=\"T_0502a_row153_col3\" class=\"data row153 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row153_col4\" class=\"data row153 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row153_col5\" class=\"data row153 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row153_col6\" class=\"data row153 col6\" >{'shocks': {'type': None, 'default': [0.1]}, 'transformation': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row153_col7\" class=\"data row153 col7\" >['senstivity_analysis', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row153_col8\" class=\"data row153 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row154_col0\" class=\"data row154 col0\" >validmind.model_validation.statsmodels.RegressionModelSummary</td>\n",
+              "      <td id=\"T_0502a_row154_col1\" class=\"data row154 col1\" >Regression Model Summary</td>\n",
+              "      <td id=\"T_0502a_row154_col2\" class=\"data row154 col2\" >Evaluates regression model performance using metrics including R-Squared, Adjusted R-Squared, MSE, and RMSE....</td>\n",
+              "      <td id=\"T_0502a_row154_col3\" class=\"data row154 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row154_col4\" class=\"data row154 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row154_col5\" class=\"data row154 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row154_col6\" class=\"data row154 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row154_col7\" class=\"data row154 col7\" >['model_performance', 'regression']</td>\n",
+              "      <td id=\"T_0502a_row154_col8\" class=\"data row154 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row155_col0\" class=\"data row155 col0\" >validmind.model_validation.statsmodels.RegressionPermutationFeatureImportance</td>\n",
+              "      <td id=\"T_0502a_row155_col1\" class=\"data row155 col1\" >Regression Permutation Feature Importance</td>\n",
+              "      <td id=\"T_0502a_row155_col2\" class=\"data row155 col2\" >Assesses the significance of each feature in a model by evaluating the impact on model performance when feature...</td>\n",
+              "      <td id=\"T_0502a_row155_col3\" class=\"data row155 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row155_col4\" class=\"data row155 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row155_col5\" class=\"data row155 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row155_col6\" class=\"data row155 col6\" >{'fontsize': {'type': 'int', 'default': 12}, 'figure_height': {'type': 'int', 'default': 500}}</td>\n",
+              "      <td id=\"T_0502a_row155_col7\" class=\"data row155 col7\" >['statsmodels', 'feature_importance', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row155_col8\" class=\"data row155 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row156_col0\" class=\"data row156 col0\" >validmind.model_validation.statsmodels.ScorecardHistogram</td>\n",
+              "      <td id=\"T_0502a_row156_col1\" class=\"data row156 col1\" >Scorecard Histogram</td>\n",
+              "      <td id=\"T_0502a_row156_col2\" class=\"data row156 col2\" >The Scorecard Histogram test evaluates the distribution of credit scores between default and non-default instances,...</td>\n",
+              "      <td id=\"T_0502a_row156_col3\" class=\"data row156 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row156_col4\" class=\"data row156 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row156_col5\" class=\"data row156 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_0502a_row156_col6\" class=\"data row156 col6\" >{'title': {'type': 'str', 'default': 'Histogram of Scores'}, 'score_column': {'type': 'str', 'default': 'score'}}</td>\n",
+              "      <td id=\"T_0502a_row156_col7\" class=\"data row156 col7\" >['visualization', 'credit_risk', 'logistic_regression']</td>\n",
+              "      <td id=\"T_0502a_row156_col8\" class=\"data row156 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row157_col0\" class=\"data row157 col0\" >validmind.ongoing_monitoring.CalibrationCurveDrift</td>\n",
+              "      <td id=\"T_0502a_row157_col1\" class=\"data row157 col1\" >Calibration Curve Drift</td>\n",
+              "      <td id=\"T_0502a_row157_col2\" class=\"data row157 col2\" >Evaluates changes in probability calibration between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_0502a_row157_col3\" class=\"data row157 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row157_col4\" class=\"data row157 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row157_col5\" class=\"data row157 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row157_col6\" class=\"data row157 col6\" >{'n_bins': {'type': 'int', 'default': 10}, 'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
+              "      <td id=\"T_0502a_row157_col7\" class=\"data row157 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row157_col8\" class=\"data row157 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row158_col0\" class=\"data row158 col0\" >validmind.ongoing_monitoring.ClassDiscriminationDrift</td>\n",
+              "      <td id=\"T_0502a_row158_col1\" class=\"data row158 col1\" >Class Discrimination Drift</td>\n",
+              "      <td id=\"T_0502a_row158_col2\" class=\"data row158 col2\" >Compares classification discrimination metrics between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_0502a_row158_col3\" class=\"data row158 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row158_col4\" class=\"data row158 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row158_col5\" class=\"data row158 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row158_col6\" class=\"data row158 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
+              "      <td id=\"T_0502a_row158_col7\" class=\"data row158 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row158_col8\" class=\"data row158 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row159_col0\" class=\"data row159 col0\" >validmind.ongoing_monitoring.ClassImbalanceDrift</td>\n",
+              "      <td id=\"T_0502a_row159_col1\" class=\"data row159 col1\" >Class Imbalance Drift</td>\n",
+              "      <td id=\"T_0502a_row159_col2\" class=\"data row159 col2\" >Evaluates drift in class distribution between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_0502a_row159_col3\" class=\"data row159 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row159_col4\" class=\"data row159 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row159_col5\" class=\"data row159 col5\" >['datasets']</td>\n",
+              "      <td id=\"T_0502a_row159_col6\" class=\"data row159 col6\" >{'drift_pct_threshold': {'type': 'float', 'default': 5.0}, 'title': {'type': 'str', 'default': 'Class Distribution Drift'}}</td>\n",
+              "      <td id=\"T_0502a_row159_col7\" class=\"data row159 col7\" >['tabular_data', 'binary_classification', 'multiclass_classification']</td>\n",
+              "      <td id=\"T_0502a_row159_col8\" class=\"data row159 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row160_col0\" class=\"data row160 col0\" >validmind.ongoing_monitoring.ClassificationAccuracyDrift</td>\n",
+              "      <td id=\"T_0502a_row160_col1\" class=\"data row160 col1\" >Classification Accuracy Drift</td>\n",
+              "      <td id=\"T_0502a_row160_col2\" class=\"data row160 col2\" >Compares classification accuracy metrics between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_0502a_row160_col3\" class=\"data row160 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row160_col4\" class=\"data row160 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row160_col5\" class=\"data row160 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row160_col6\" class=\"data row160 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
+              "      <td id=\"T_0502a_row160_col7\" class=\"data row160 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row160_col8\" class=\"data row160 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row161_col0\" class=\"data row161 col0\" >validmind.ongoing_monitoring.ConfusionMatrixDrift</td>\n",
+              "      <td id=\"T_0502a_row161_col1\" class=\"data row161 col1\" >Confusion Matrix Drift</td>\n",
+              "      <td id=\"T_0502a_row161_col2\" class=\"data row161 col2\" >Compares confusion matrix metrics between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_0502a_row161_col3\" class=\"data row161 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row161_col4\" class=\"data row161 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row161_col5\" class=\"data row161 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row161_col6\" class=\"data row161 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
+              "      <td id=\"T_0502a_row161_col7\" class=\"data row161 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_0502a_row161_col8\" class=\"data row161 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row162_col0\" class=\"data row162 col0\" >validmind.ongoing_monitoring.CumulativePredictionProbabilitiesDrift</td>\n",
+              "      <td id=\"T_0502a_row162_col1\" class=\"data row162 col1\" >Cumulative Prediction Probabilities Drift</td>\n",
+              "      <td id=\"T_0502a_row162_col2\" class=\"data row162 col2\" >Compares cumulative prediction probability distributions between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_0502a_row162_col3\" class=\"data row162 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row162_col4\" class=\"data row162 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row162_col5\" class=\"data row162 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row162_col6\" class=\"data row162 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row162_col7\" class=\"data row162 col7\" >['visualization', 'credit_risk']</td>\n",
+              "      <td id=\"T_0502a_row162_col8\" class=\"data row162 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row163_col0\" class=\"data row163 col0\" >validmind.ongoing_monitoring.FeatureDrift</td>\n",
+              "      <td id=\"T_0502a_row163_col1\" class=\"data row163 col1\" >Feature Drift</td>\n",
+              "      <td id=\"T_0502a_row163_col2\" class=\"data row163 col2\" >Evaluates changes in feature distribution over time to identify potential model drift....</td>\n",
+              "      <td id=\"T_0502a_row163_col3\" class=\"data row163 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row163_col4\" class=\"data row163 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row163_col5\" class=\"data row163 col5\" >['datasets']</td>\n",
+              "      <td id=\"T_0502a_row163_col6\" class=\"data row163 col6\" >{'bins': {'type': '_empty', 'default': [0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9]}, 'feature_columns': {'type': '_empty', 'default': None}, 'psi_threshold': {'type': '_empty', 'default': 0.2}}</td>\n",
+              "      <td id=\"T_0502a_row163_col7\" class=\"data row163 col7\" >['visualization']</td>\n",
+              "      <td id=\"T_0502a_row163_col8\" class=\"data row163 col8\" >['monitoring']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row164_col0\" class=\"data row164 col0\" >validmind.ongoing_monitoring.PredictionAcrossEachFeature</td>\n",
+              "      <td id=\"T_0502a_row164_col1\" class=\"data row164 col1\" >Prediction Across Each Feature</td>\n",
+              "      <td id=\"T_0502a_row164_col2\" class=\"data row164 col2\" >Assesses differences in model predictions across individual features between reference and monitoring datasets...</td>\n",
+              "      <td id=\"T_0502a_row164_col3\" class=\"data row164 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row164_col4\" class=\"data row164 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row164_col5\" class=\"data row164 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row164_col6\" class=\"data row164 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row164_col7\" class=\"data row164 col7\" >['visualization']</td>\n",
+              "      <td id=\"T_0502a_row164_col8\" class=\"data row164 col8\" >['monitoring']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row165_col0\" class=\"data row165 col0\" >validmind.ongoing_monitoring.PredictionCorrelation</td>\n",
+              "      <td id=\"T_0502a_row165_col1\" class=\"data row165 col1\" >Prediction Correlation</td>\n",
+              "      <td id=\"T_0502a_row165_col2\" class=\"data row165 col2\" >Assesses correlation changes between model predictions from reference and monitoring datasets to detect potential...</td>\n",
+              "      <td id=\"T_0502a_row165_col3\" class=\"data row165 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row165_col4\" class=\"data row165 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row165_col5\" class=\"data row165 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row165_col6\" class=\"data row165 col6\" >{'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
+              "      <td id=\"T_0502a_row165_col7\" class=\"data row165 col7\" >['visualization']</td>\n",
+              "      <td id=\"T_0502a_row165_col8\" class=\"data row165 col8\" >['monitoring']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row166_col0\" class=\"data row166 col0\" >validmind.ongoing_monitoring.PredictionProbabilitiesHistogramDrift</td>\n",
+              "      <td id=\"T_0502a_row166_col1\" class=\"data row166 col1\" >Prediction Probabilities Histogram Drift</td>\n",
+              "      <td id=\"T_0502a_row166_col2\" class=\"data row166 col2\" >Compares prediction probability distributions between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_0502a_row166_col3\" class=\"data row166 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row166_col4\" class=\"data row166 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row166_col5\" class=\"data row166 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row166_col6\" class=\"data row166 col6\" >{'title': {'type': '_empty', 'default': 'Prediction Probabilities Histogram Drift'}, 'drift_pct_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
+              "      <td id=\"T_0502a_row166_col7\" class=\"data row166 col7\" >['visualization', 'credit_risk']</td>\n",
+              "      <td id=\"T_0502a_row166_col8\" class=\"data row166 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row167_col0\" class=\"data row167 col0\" >validmind.ongoing_monitoring.PredictionQuantilesAcrossFeatures</td>\n",
+              "      <td id=\"T_0502a_row167_col1\" class=\"data row167 col1\" >Prediction Quantiles Across Features</td>\n",
+              "      <td id=\"T_0502a_row167_col2\" class=\"data row167 col2\" >Assesses differences in model prediction distributions across individual features between reference...</td>\n",
+              "      <td id=\"T_0502a_row167_col3\" class=\"data row167 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row167_col4\" class=\"data row167 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row167_col5\" class=\"data row167 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row167_col6\" class=\"data row167 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row167_col7\" class=\"data row167 col7\" >['visualization']</td>\n",
+              "      <td id=\"T_0502a_row167_col8\" class=\"data row167 col8\" >['monitoring']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row168_col0\" class=\"data row168 col0\" >validmind.ongoing_monitoring.ROCCurveDrift</td>\n",
+              "      <td id=\"T_0502a_row168_col1\" class=\"data row168 col1\" >ROC Curve Drift</td>\n",
+              "      <td id=\"T_0502a_row168_col2\" class=\"data row168 col2\" >Compares ROC curves between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_0502a_row168_col3\" class=\"data row168 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row168_col4\" class=\"data row168 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row168_col5\" class=\"data row168 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row168_col6\" class=\"data row168 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row168_col7\" class=\"data row168 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_0502a_row168_col8\" class=\"data row168 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row169_col0\" class=\"data row169 col0\" >validmind.ongoing_monitoring.ScoreBandsDrift</td>\n",
+              "      <td id=\"T_0502a_row169_col1\" class=\"data row169 col1\" >Score Bands Drift</td>\n",
+              "      <td id=\"T_0502a_row169_col2\" class=\"data row169 col2\" >Analyzes drift in population distribution and default rates across score bands....</td>\n",
+              "      <td id=\"T_0502a_row169_col3\" class=\"data row169 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row169_col4\" class=\"data row169 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row169_col5\" class=\"data row169 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row169_col6\" class=\"data row169 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'score_bands': {'type': 'list', 'default': None}, 'drift_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
+              "      <td id=\"T_0502a_row169_col7\" class=\"data row169 col7\" >['visualization', 'credit_risk', 'scorecard']</td>\n",
+              "      <td id=\"T_0502a_row169_col8\" class=\"data row169 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row170_col0\" class=\"data row170 col0\" >validmind.ongoing_monitoring.ScorecardHistogramDrift</td>\n",
+              "      <td id=\"T_0502a_row170_col1\" class=\"data row170 col1\" >Scorecard Histogram Drift</td>\n",
+              "      <td id=\"T_0502a_row170_col2\" class=\"data row170 col2\" >Compares score distributions between reference and monitoring datasets for each class....</td>\n",
+              "      <td id=\"T_0502a_row170_col3\" class=\"data row170 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row170_col4\" class=\"data row170 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row170_col5\" class=\"data row170 col5\" >['datasets']</td>\n",
+              "      <td id=\"T_0502a_row170_col6\" class=\"data row170 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'title': {'type': 'str', 'default': 'Scorecard Histogram Drift'}, 'drift_pct_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
+              "      <td id=\"T_0502a_row170_col7\" class=\"data row170 col7\" >['visualization', 'credit_risk', 'logistic_regression']</td>\n",
+              "      <td id=\"T_0502a_row170_col8\" class=\"data row170 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row171_col0\" class=\"data row171 col0\" >validmind.ongoing_monitoring.TargetPredictionDistributionPlot</td>\n",
+              "      <td id=\"T_0502a_row171_col1\" class=\"data row171 col1\" >Target Prediction Distribution Plot</td>\n",
+              "      <td id=\"T_0502a_row171_col2\" class=\"data row171 col2\" >Assesses differences in prediction distributions between a reference dataset and a monitoring dataset to identify...</td>\n",
+              "      <td id=\"T_0502a_row171_col3\" class=\"data row171 col3\" >True</td>\n",
+              "      <td id=\"T_0502a_row171_col4\" class=\"data row171 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row171_col5\" class=\"data row171 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_0502a_row171_col6\" class=\"data row171 col6\" >{'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
+              "      <td id=\"T_0502a_row171_col7\" class=\"data row171 col7\" >['visualization']</td>\n",
+              "      <td id=\"T_0502a_row171_col8\" class=\"data row171 col8\" >['monitoring']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row172_col0\" class=\"data row172 col0\" >validmind.prompt_validation.Bias</td>\n",
+              "      <td id=\"T_0502a_row172_col1\" class=\"data row172 col1\" >Bias</td>\n",
+              "      <td id=\"T_0502a_row172_col2\" class=\"data row172 col2\" >Assesses potential bias in a Large Language Model by analyzing the distribution and order of exemplars in the...</td>\n",
+              "      <td id=\"T_0502a_row172_col3\" class=\"data row172 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row172_col4\" class=\"data row172 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row172_col5\" class=\"data row172 col5\" >['model']</td>\n",
+              "      <td id=\"T_0502a_row172_col6\" class=\"data row172 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row172_col7\" class=\"data row172 col7\" >['llm', 'few_shot']</td>\n",
+              "      <td id=\"T_0502a_row172_col8\" class=\"data row172 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row173_col0\" class=\"data row173 col0\" >validmind.prompt_validation.Clarity</td>\n",
+              "      <td id=\"T_0502a_row173_col1\" class=\"data row173 col1\" >Clarity</td>\n",
+              "      <td id=\"T_0502a_row173_col2\" class=\"data row173 col2\" >Evaluates and scores the clarity of prompts in a Large Language Model based on specified guidelines....</td>\n",
+              "      <td id=\"T_0502a_row173_col3\" class=\"data row173 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row173_col4\" class=\"data row173 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row173_col5\" class=\"data row173 col5\" >['model']</td>\n",
+              "      <td id=\"T_0502a_row173_col6\" class=\"data row173 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row173_col7\" class=\"data row173 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
+              "      <td id=\"T_0502a_row173_col8\" class=\"data row173 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row174_col0\" class=\"data row174 col0\" >validmind.prompt_validation.Conciseness</td>\n",
+              "      <td id=\"T_0502a_row174_col1\" class=\"data row174 col1\" >Conciseness</td>\n",
+              "      <td id=\"T_0502a_row174_col2\" class=\"data row174 col2\" >Analyzes and grades the conciseness of prompts provided to a Large Language Model....</td>\n",
+              "      <td id=\"T_0502a_row174_col3\" class=\"data row174 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row174_col4\" class=\"data row174 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row174_col5\" class=\"data row174 col5\" >['model']</td>\n",
+              "      <td id=\"T_0502a_row174_col6\" class=\"data row174 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row174_col7\" class=\"data row174 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
+              "      <td id=\"T_0502a_row174_col8\" class=\"data row174 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row175_col0\" class=\"data row175 col0\" >validmind.prompt_validation.Delimitation</td>\n",
+              "      <td id=\"T_0502a_row175_col1\" class=\"data row175 col1\" >Delimitation</td>\n",
+              "      <td id=\"T_0502a_row175_col2\" class=\"data row175 col2\" >Evaluates the proper use of delimiters in prompts provided to Large Language Models....</td>\n",
+              "      <td id=\"T_0502a_row175_col3\" class=\"data row175 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row175_col4\" class=\"data row175 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row175_col5\" class=\"data row175 col5\" >['model']</td>\n",
+              "      <td id=\"T_0502a_row175_col6\" class=\"data row175 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row175_col7\" class=\"data row175 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
+              "      <td id=\"T_0502a_row175_col8\" class=\"data row175 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row176_col0\" class=\"data row176 col0\" >validmind.prompt_validation.NegativeInstruction</td>\n",
+              "      <td id=\"T_0502a_row176_col1\" class=\"data row176 col1\" >Negative Instruction</td>\n",
+              "      <td id=\"T_0502a_row176_col2\" class=\"data row176 col2\" >Evaluates and grades the use of affirmative, proactive language over negative instructions in LLM prompts....</td>\n",
+              "      <td id=\"T_0502a_row176_col3\" class=\"data row176 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row176_col4\" class=\"data row176 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row176_col5\" class=\"data row176 col5\" >['model']</td>\n",
+              "      <td id=\"T_0502a_row176_col6\" class=\"data row176 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row176_col7\" class=\"data row176 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
+              "      <td id=\"T_0502a_row176_col8\" class=\"data row176 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row177_col0\" class=\"data row177 col0\" >validmind.prompt_validation.Robustness</td>\n",
+              "      <td id=\"T_0502a_row177_col1\" class=\"data row177 col1\" >Robustness</td>\n",
+              "      <td id=\"T_0502a_row177_col2\" class=\"data row177 col2\" >Assesses the robustness of prompts provided to a Large Language Model under varying conditions and contexts. This test...</td>\n",
+              "      <td id=\"T_0502a_row177_col3\" class=\"data row177 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row177_col4\" class=\"data row177 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row177_col5\" class=\"data row177 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row177_col6\" class=\"data row177 col6\" >{'num_tests': {'type': '_empty', 'default': 10}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row177_col7\" class=\"data row177 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
+              "      <td id=\"T_0502a_row177_col8\" class=\"data row177 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row178_col0\" class=\"data row178 col0\" >validmind.prompt_validation.Specificity</td>\n",
+              "      <td id=\"T_0502a_row178_col1\" class=\"data row178 col1\" >Specificity</td>\n",
+              "      <td id=\"T_0502a_row178_col2\" class=\"data row178 col2\" >Evaluates and scores the specificity of prompts provided to a Large Language Model (LLM), based on clarity, detail,...</td>\n",
+              "      <td id=\"T_0502a_row178_col3\" class=\"data row178 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row178_col4\" class=\"data row178 col4\" >True</td>\n",
+              "      <td id=\"T_0502a_row178_col5\" class=\"data row178 col5\" >['model']</td>\n",
+              "      <td id=\"T_0502a_row178_col6\" class=\"data row178 col6\" >{'min_threshold': {'type': '_empty', 'default': 7}, 'judge_llm': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_0502a_row178_col7\" class=\"data row178 col7\" >['llm', 'zero_shot', 'few_shot']</td>\n",
+              "      <td id=\"T_0502a_row178_col8\" class=\"data row178 col8\" >['text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row179_col0\" class=\"data row179 col0\" >validmind.unit_metrics.classification.Accuracy</td>\n",
+              "      <td id=\"T_0502a_row179_col1\" class=\"data row179 col1\" >Accuracy</td>\n",
+              "      <td id=\"T_0502a_row179_col2\" class=\"data row179 col2\" >Calculates the accuracy of a model</td>\n",
+              "      <td id=\"T_0502a_row179_col3\" class=\"data row179 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row179_col4\" class=\"data row179 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row179_col5\" class=\"data row179 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row179_col6\" class=\"data row179 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row179_col7\" class=\"data row179 col7\" >['classification']</td>\n",
+              "      <td id=\"T_0502a_row179_col8\" class=\"data row179 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row180_col0\" class=\"data row180 col0\" >validmind.unit_metrics.classification.F1</td>\n",
+              "      <td id=\"T_0502a_row180_col1\" class=\"data row180 col1\" >F1</td>\n",
+              "      <td id=\"T_0502a_row180_col2\" class=\"data row180 col2\" >Calculates the F1 score for a classification model.</td>\n",
+              "      <td id=\"T_0502a_row180_col3\" class=\"data row180 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row180_col4\" class=\"data row180 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row180_col5\" class=\"data row180 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row180_col6\" class=\"data row180 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row180_col7\" class=\"data row180 col7\" >['classification']</td>\n",
+              "      <td id=\"T_0502a_row180_col8\" class=\"data row180 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row181_col0\" class=\"data row181 col0\" >validmind.unit_metrics.classification.Precision</td>\n",
+              "      <td id=\"T_0502a_row181_col1\" class=\"data row181 col1\" >Precision</td>\n",
+              "      <td id=\"T_0502a_row181_col2\" class=\"data row181 col2\" >Calculates the precision for a classification model.</td>\n",
+              "      <td id=\"T_0502a_row181_col3\" class=\"data row181 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row181_col4\" class=\"data row181 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row181_col5\" class=\"data row181 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row181_col6\" class=\"data row181 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row181_col7\" class=\"data row181 col7\" >['classification']</td>\n",
+              "      <td id=\"T_0502a_row181_col8\" class=\"data row181 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row182_col0\" class=\"data row182 col0\" >validmind.unit_metrics.classification.ROC_AUC</td>\n",
+              "      <td id=\"T_0502a_row182_col1\" class=\"data row182 col1\" >ROC AUC</td>\n",
+              "      <td id=\"T_0502a_row182_col2\" class=\"data row182 col2\" >Calculates the ROC AUC for a classification model.</td>\n",
+              "      <td id=\"T_0502a_row182_col3\" class=\"data row182 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row182_col4\" class=\"data row182 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row182_col5\" class=\"data row182 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row182_col6\" class=\"data row182 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row182_col7\" class=\"data row182 col7\" >['classification']</td>\n",
+              "      <td id=\"T_0502a_row182_col8\" class=\"data row182 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row183_col0\" class=\"data row183 col0\" >validmind.unit_metrics.classification.Recall</td>\n",
+              "      <td id=\"T_0502a_row183_col1\" class=\"data row183 col1\" >Recall</td>\n",
+              "      <td id=\"T_0502a_row183_col2\" class=\"data row183 col2\" >Calculates the recall for a classification model.</td>\n",
+              "      <td id=\"T_0502a_row183_col3\" class=\"data row183 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row183_col4\" class=\"data row183 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row183_col5\" class=\"data row183 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row183_col6\" class=\"data row183 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row183_col7\" class=\"data row183 col7\" >['classification']</td>\n",
+              "      <td id=\"T_0502a_row183_col8\" class=\"data row183 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row184_col0\" class=\"data row184 col0\" >validmind.unit_metrics.regression.AdjustedRSquaredScore</td>\n",
+              "      <td id=\"T_0502a_row184_col1\" class=\"data row184 col1\" >Adjusted R Squared Score</td>\n",
+              "      <td id=\"T_0502a_row184_col2\" class=\"data row184 col2\" >Calculates the adjusted R-squared score for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row184_col3\" class=\"data row184 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row184_col4\" class=\"data row184 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row184_col5\" class=\"data row184 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row184_col6\" class=\"data row184 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row184_col7\" class=\"data row184 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row184_col8\" class=\"data row184 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row185_col0\" class=\"data row185 col0\" >validmind.unit_metrics.regression.GiniCoefficient</td>\n",
+              "      <td id=\"T_0502a_row185_col1\" class=\"data row185 col1\" >Gini Coefficient</td>\n",
+              "      <td id=\"T_0502a_row185_col2\" class=\"data row185 col2\" >Calculates the Gini coefficient for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row185_col3\" class=\"data row185 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row185_col4\" class=\"data row185 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row185_col5\" class=\"data row185 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row185_col6\" class=\"data row185 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row185_col7\" class=\"data row185 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row185_col8\" class=\"data row185 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row186_col0\" class=\"data row186 col0\" >validmind.unit_metrics.regression.HuberLoss</td>\n",
+              "      <td id=\"T_0502a_row186_col1\" class=\"data row186 col1\" >Huber Loss</td>\n",
+              "      <td id=\"T_0502a_row186_col2\" class=\"data row186 col2\" >Calculates the Huber loss for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row186_col3\" class=\"data row186 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row186_col4\" class=\"data row186 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row186_col5\" class=\"data row186 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row186_col6\" class=\"data row186 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row186_col7\" class=\"data row186 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row186_col8\" class=\"data row186 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row187_col0\" class=\"data row187 col0\" >validmind.unit_metrics.regression.KolmogorovSmirnovStatistic</td>\n",
+              "      <td id=\"T_0502a_row187_col1\" class=\"data row187 col1\" >Kolmogorov Smirnov Statistic</td>\n",
+              "      <td id=\"T_0502a_row187_col2\" class=\"data row187 col2\" >Calculates the Kolmogorov-Smirnov statistic for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row187_col3\" class=\"data row187 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row187_col4\" class=\"data row187 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row187_col5\" class=\"data row187 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_0502a_row187_col6\" class=\"data row187 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row187_col7\" class=\"data row187 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row187_col8\" class=\"data row187 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row188_col0\" class=\"data row188 col0\" >validmind.unit_metrics.regression.MeanAbsoluteError</td>\n",
+              "      <td id=\"T_0502a_row188_col1\" class=\"data row188 col1\" >Mean Absolute Error</td>\n",
+              "      <td id=\"T_0502a_row188_col2\" class=\"data row188 col2\" >Calculates the mean absolute error for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row188_col3\" class=\"data row188 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row188_col4\" class=\"data row188 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row188_col5\" class=\"data row188 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row188_col6\" class=\"data row188 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row188_col7\" class=\"data row188 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row188_col8\" class=\"data row188 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row189_col0\" class=\"data row189 col0\" >validmind.unit_metrics.regression.MeanAbsolutePercentageError</td>\n",
+              "      <td id=\"T_0502a_row189_col1\" class=\"data row189 col1\" >Mean Absolute Percentage Error</td>\n",
+              "      <td id=\"T_0502a_row189_col2\" class=\"data row189 col2\" >Calculates the mean absolute percentage error for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row189_col3\" class=\"data row189 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row189_col4\" class=\"data row189 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row189_col5\" class=\"data row189 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row189_col6\" class=\"data row189 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row189_col7\" class=\"data row189 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row189_col8\" class=\"data row189 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row190_col0\" class=\"data row190 col0\" >validmind.unit_metrics.regression.MeanBiasDeviation</td>\n",
+              "      <td id=\"T_0502a_row190_col1\" class=\"data row190 col1\" >Mean Bias Deviation</td>\n",
+              "      <td id=\"T_0502a_row190_col2\" class=\"data row190 col2\" >Calculates the mean bias deviation for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row190_col3\" class=\"data row190 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row190_col4\" class=\"data row190 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row190_col5\" class=\"data row190 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row190_col6\" class=\"data row190 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row190_col7\" class=\"data row190 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row190_col8\" class=\"data row190 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row191_col0\" class=\"data row191 col0\" >validmind.unit_metrics.regression.MeanSquaredError</td>\n",
+              "      <td id=\"T_0502a_row191_col1\" class=\"data row191 col1\" >Mean Squared Error</td>\n",
+              "      <td id=\"T_0502a_row191_col2\" class=\"data row191 col2\" >Calculates the mean squared error for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row191_col3\" class=\"data row191 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row191_col4\" class=\"data row191 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row191_col5\" class=\"data row191 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row191_col6\" class=\"data row191 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row191_col7\" class=\"data row191 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row191_col8\" class=\"data row191 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row192_col0\" class=\"data row192 col0\" >validmind.unit_metrics.regression.QuantileLoss</td>\n",
+              "      <td id=\"T_0502a_row192_col1\" class=\"data row192 col1\" >Quantile Loss</td>\n",
+              "      <td id=\"T_0502a_row192_col2\" class=\"data row192 col2\" >Calculates the quantile loss for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row192_col3\" class=\"data row192 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row192_col4\" class=\"data row192 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row192_col5\" class=\"data row192 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row192_col6\" class=\"data row192 col6\" >{'quantile': {'type': '_empty', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_0502a_row192_col7\" class=\"data row192 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row192_col8\" class=\"data row192 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row193_col0\" class=\"data row193 col0\" >validmind.unit_metrics.regression.RSquaredScore</td>\n",
+              "      <td id=\"T_0502a_row193_col1\" class=\"data row193 col1\" >R Squared Score</td>\n",
+              "      <td id=\"T_0502a_row193_col2\" class=\"data row193 col2\" >Calculates the R-squared score for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row193_col3\" class=\"data row193 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row193_col4\" class=\"data row193 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row193_col5\" class=\"data row193 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row193_col6\" class=\"data row193 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row193_col7\" class=\"data row193 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row193_col8\" class=\"data row193 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_0502a_row194_col0\" class=\"data row194 col0\" >validmind.unit_metrics.regression.RootMeanSquaredError</td>\n",
+              "      <td id=\"T_0502a_row194_col1\" class=\"data row194 col1\" >Root Mean Squared Error</td>\n",
+              "      <td id=\"T_0502a_row194_col2\" class=\"data row194 col2\" >Calculates the root mean squared error for a regression model.</td>\n",
+              "      <td id=\"T_0502a_row194_col3\" class=\"data row194 col3\" >False</td>\n",
+              "      <td id=\"T_0502a_row194_col4\" class=\"data row194 col4\" >False</td>\n",
+              "      <td id=\"T_0502a_row194_col5\" class=\"data row194 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_0502a_row194_col6\" class=\"data row194 col6\" >{}</td>\n",
+              "      <td id=\"T_0502a_row194_col7\" class=\"data row194 col7\" >['regression']</td>\n",
+              "      <td id=\"T_0502a_row194_col8\" class=\"data row194 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n"
+            ],
+            "text/plain": [
+              "<pandas.io.formats.style.Styler at 0x38000a670>"
+            ]
+          },
+          "execution_count": null,
+          "metadata": {},
+          "output_type": "execute_result"
+        }
       ],
-      "text/plain": [
-       "<pandas.io.formats.style.Styler at 0x38000a670>"
+      "source": [
+        "list_tests()"
       ]
-     },
-     "execution_count": 2,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "list_tests()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Understand tags and task types\n",
-    "\n",
-    "Use [list_tasks()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks) to view all unique task types used to classify tests in the ValidMind Library.\n",
-    "\n",
-    "Understanding `task` types helps you filter tests that match your model’s objective. For example:\n",
-    "\n",
-    "- **classification:** Works with Classification Models and Datasets.\n",
-    "- **regression:** Works with Regression Models and Datasets.\n",
-    "- **text classification:** Works with Text Classification Models and Datasets.\n",
-    "- **text summarization:** Works with Text Summarization Models and Datasets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 3,
-   "metadata": {},
-   "outputs": [
+    },
     {
-     "data": {
-      "text/plain": [
-       "['text_qa',\n",
-       " 'classification',\n",
-       " 'data_validation',\n",
-       " 'text_classification',\n",
-       " 'feature_extraction',\n",
-       " 'regression',\n",
-       " 'visualization',\n",
-       " 'clustering',\n",
-       " 'time_series_forecasting',\n",
-       " 'text_summarization',\n",
-       " 'nlp',\n",
-       " 'residual_analysis',\n",
-       " 'monitoring',\n",
-       " 'text_generation']"
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Understand tags and task types\n",
+        "\n",
+        "Use [list_tasks()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks) to view all unique task types used to classify tests in the ValidMind Library.\n",
+        "\n",
+        "Understanding `task` types helps you filter tests that match your record's objective. For example:\n",
+        "\n",
+        "- **classification:** Works with Classification Models and Datasets.\n",
+        "- **regression:** Works with Regression Models and Datasets.\n",
+        "- **text classification:** Works with Text Classification Models and Datasets.\n",
+        "- **text summarization:** Works with Text Summarization Models and Datasets."
       ]
-     },
-     "execution_count": 3,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "list_tasks()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Use [list_tags()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tags) to view all unique tags used to describe tests in the ValidMind Library.\n",
-    "\n",
-    "`Tags` describe what a test applies to and help you filter tests for your use case. Examples include:\n",
-    "\n",
-    "- **llm:** Tests that work with Large Language Models.\n",
-    "- **nlp:** Tests relevant for natural language processing.\n",
-    "- **binary_classification:** Tests for binary classification tasks.\n",
-    "- **forecasting:** Tests for forecasting and time-series analysis.\n",
-    "- **tabular_data:** Tests for tabular data like CSVs and Excel spreadsheets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 4,
-   "metadata": {},
-   "outputs": [
+    },
+    {
+      "cell_type": "code",
+      "execution_count": 3,
+      "metadata": {},
+      "outputs": [
+        {
+          "data": {
+            "text/plain": [
+              "['text_qa',\n",
+              " 'classification',\n",
+              " 'data_validation',\n",
+              " 'text_classification',\n",
+              " 'feature_extraction',\n",
+              " 'regression',\n",
+              " 'visualization',\n",
+              " 'clustering',\n",
+              " 'time_series_forecasting',\n",
+              " 'text_summarization',\n",
+              " 'nlp',\n",
+              " 'residual_analysis',\n",
+              " 'monitoring',\n",
+              " 'text_generation']"
+            ]
+          },
+          "execution_count": null,
+          "metadata": {},
+          "output_type": "execute_result"
+        }
+      ],
+      "source": [
+        "list_tasks()"
+      ]
+    },
     {
-     "data": {
-      "text/plain": [
-       "['senstivity_analysis',\n",
-       " 'calibration',\n",
-       " 'clustering',\n",
-       " 'anomaly_detection',\n",
-       " 'nlp',\n",
-       " 'classification_metrics',\n",
-       " 'dimensionality_reduction',\n",
-       " 'tabular_data',\n",
-       " 'time_series_data',\n",
-       " 'model_predictions',\n",
-       " 'feature_selection',\n",
-       " 'correlation',\n",
-       " 'frequency_analysis',\n",
-       " 'embeddings',\n",
-       " 'regression',\n",
-       " 'llm',\n",
-       " 'statsmodels',\n",
-       " 'ragas',\n",
-       " 'model_performance',\n",
-       " 'model_validation',\n",
-       " 'rag_performance',\n",
-       " 'model_training',\n",
-       " 'qualitative',\n",
-       " 'classification',\n",
-       " 'kmeans',\n",
-       " 'multiclass_classification',\n",
-       " 'linear_regression',\n",
-       " 'data_quality',\n",
-       " 'text_data',\n",
-       " 'binary_classification',\n",
-       " 'threshold_optimization',\n",
-       " 'stationarity',\n",
-       " 'bias_and_fairness',\n",
-       " 'scorecard',\n",
-       " 'model_explainability',\n",
-       " 'model_comparison',\n",
-       " 'numerical_data',\n",
-       " 'sklearn',\n",
-       " 'model_selection',\n",
-       " 'retrieval_performance',\n",
-       " 'zero_shot',\n",
-       " 'statistical_test',\n",
-       " 'descriptive_statistics',\n",
-       " 'seasonality',\n",
-       " 'analysis',\n",
-       " 'data_validation',\n",
-       " 'data_distribution',\n",
-       " 'feature_importance',\n",
-       " 'metadata',\n",
-       " 'few_shot',\n",
-       " 'visualization',\n",
-       " 'credit_risk',\n",
-       " 'forecasting',\n",
-       " 'AUC',\n",
-       " 'logistic_regression',\n",
-       " 'model_diagnosis',\n",
-       " 'model_interpretation',\n",
-       " 'unit_root_test',\n",
-       " 'categorical_data',\n",
-       " 'data_analysis']"
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Use [list_tags()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tags) to view all unique tags used to describe tests in the ValidMind Library.\n",
+        "\n",
+        "`Tags` describe what a test applies to and help you filter tests for your use case. Examples include:\n",
+        "\n",
+        "- **llm:** Tests that work with Large Language Models.\n",
+        "- **nlp:** Tests relevant for natural language processing.\n",
+        "- **binary_classification:** Tests for binary classification tasks.\n",
+        "- **forecasting:** Tests for forecasting and time-series analysis.\n",
+        "- **tabular_data:** Tests for tabular data like CSVs and Excel spreadsheets."
       ]
-     },
-     "execution_count": 4,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "list_tags()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Finally, to match each task type with its related tags, use the [list_tasks_and_tags()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks_and_tags) function:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [
+    },
     {
-     "data": {
-      "text/html": [
-       "<style type=\"text/css\">\n",
-       "#T_ac294 th {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "#T_ac294_row0_col0, #T_ac294_row0_col1, #T_ac294_row1_col0, #T_ac294_row1_col1, #T_ac294_row2_col0, #T_ac294_row2_col1, #T_ac294_row3_col0, #T_ac294_row3_col1, #T_ac294_row4_col0, #T_ac294_row4_col1, #T_ac294_row5_col0, #T_ac294_row5_col1, #T_ac294_row6_col0, #T_ac294_row6_col1, #T_ac294_row7_col0, #T_ac294_row7_col1, #T_ac294_row8_col0, #T_ac294_row8_col1, #T_ac294_row9_col0, #T_ac294_row9_col1, #T_ac294_row10_col0, #T_ac294_row10_col1, #T_ac294_row11_col0, #T_ac294_row11_col1, #T_ac294_row12_col0, #T_ac294_row12_col1, #T_ac294_row13_col0, #T_ac294_row13_col1 {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "</style>\n",
-       "<table id=\"T_ac294\">\n",
-       "  <thead>\n",
-       "    <tr>\n",
-       "      <th id=\"T_ac294_level0_col0\" class=\"col_heading level0 col0\" >Task</th>\n",
-       "      <th id=\"T_ac294_level0_col1\" class=\"col_heading level0 col1\" >Tags</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row0_col0\" class=\"data row0 col0\" >regression</td>\n",
-       "      <td id=\"T_ac294_row0_col1\" class=\"data row0 col1\" >senstivity_analysis, tabular_data, time_series_data, model_predictions, feature_selection, correlation, regression, statsmodels, model_performance, model_training, multiclass_classification, linear_regression, data_quality, text_data, model_explainability, binary_classification, stationarity, bias_and_fairness, numerical_data, sklearn, model_selection, statistical_test, descriptive_statistics, seasonality, analysis, data_validation, data_distribution, metadata, feature_importance, visualization, forecasting, model_diagnosis, model_interpretation, unit_root_test, categorical_data, data_analysis</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row1_col0\" class=\"data row1 col0\" >classification</td>\n",
-       "      <td id=\"T_ac294_row1_col1\" class=\"data row1 col1\" >calibration, anomaly_detection, classification_metrics, tabular_data, time_series_data, feature_selection, correlation, statsmodels, model_performance, model_validation, model_training, classification, multiclass_classification, linear_regression, data_quality, text_data, binary_classification, threshold_optimization, bias_and_fairness, scorecard, model_comparison, numerical_data, sklearn, statistical_test, descriptive_statistics, feature_importance, data_distribution, metadata, visualization, credit_risk, AUC, logistic_regression, model_diagnosis, categorical_data, data_analysis</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row2_col0\" class=\"data row2 col0\" >text_classification</td>\n",
-       "      <td id=\"T_ac294_row2_col1\" class=\"data row2 col1\" >model_performance, feature_importance, multiclass_classification, few_shot, frequency_analysis, zero_shot, text_data, visualization, llm, binary_classification, ragas, model_diagnosis, model_comparison, sklearn, nlp, retrieval_performance, tabular_data, time_series_data</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row3_col0\" class=\"data row3 col0\" >text_summarization</td>\n",
-       "      <td id=\"T_ac294_row3_col1\" class=\"data row3 col1\" >qualitative, few_shot, frequency_analysis, embeddings, zero_shot, text_data, visualization, llm, rag_performance, ragas, retrieval_performance, nlp, dimensionality_reduction, tabular_data, time_series_data</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row4_col0\" class=\"data row4 col0\" >data_validation</td>\n",
-       "      <td id=\"T_ac294_row4_col1\" class=\"data row4 col1\" >stationarity, statsmodels, unit_root_test, time_series_data</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row5_col0\" class=\"data row5 col0\" >time_series_forecasting</td>\n",
-       "      <td id=\"T_ac294_row5_col1\" class=\"data row5 col1\" >model_training, data_validation, metadata, visualization, model_explainability, sklearn, model_performance, model_predictions, time_series_data</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row6_col0\" class=\"data row6 col0\" >nlp</td>\n",
-       "      <td id=\"T_ac294_row6_col1\" class=\"data row6 col1\" >data_validation, frequency_analysis, text_data, visualization, nlp</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row7_col0\" class=\"data row7 col0\" >clustering</td>\n",
-       "      <td id=\"T_ac294_row7_col1\" class=\"data row7 col1\" >clustering, model_performance, kmeans, sklearn</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row8_col0\" class=\"data row8 col0\" >residual_analysis</td>\n",
-       "      <td id=\"T_ac294_row8_col1\" class=\"data row8 col1\" >regression</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row9_col0\" class=\"data row9 col0\" >visualization</td>\n",
-       "      <td id=\"T_ac294_row9_col1\" class=\"data row9 col1\" >regression</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row10_col0\" class=\"data row10 col0\" >feature_extraction</td>\n",
-       "      <td id=\"T_ac294_row10_col1\" class=\"data row10 col1\" >embeddings, text_data, visualization, llm</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row11_col0\" class=\"data row11 col0\" >text_qa</td>\n",
-       "      <td id=\"T_ac294_row11_col1\" class=\"data row11 col1\" >qualitative, embeddings, visualization, llm, rag_performance, ragas, dimensionality_reduction, retrieval_performance</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row12_col0\" class=\"data row12 col0\" >text_generation</td>\n",
-       "      <td id=\"T_ac294_row12_col1\" class=\"data row12 col1\" >qualitative, embeddings, visualization, llm, rag_performance, ragas, dimensionality_reduction, retrieval_performance</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_ac294_row13_col0\" class=\"data row13 col0\" >monitoring</td>\n",
-       "      <td id=\"T_ac294_row13_col1\" class=\"data row13 col1\" >visualization</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n"
+      "cell_type": "code",
+      "execution_count": 4,
+      "metadata": {},
+      "outputs": [
+        {
+          "data": {
+            "text/plain": [
+              "['senstivity_analysis',\n",
+              " 'calibration',\n",
+              " 'clustering',\n",
+              " 'anomaly_detection',\n",
+              " 'nlp',\n",
+              " 'classification_metrics',\n",
+              " 'dimensionality_reduction',\n",
+              " 'tabular_data',\n",
+              " 'time_series_data',\n",
+              " 'model_predictions',\n",
+              " 'feature_selection',\n",
+              " 'correlation',\n",
+              " 'frequency_analysis',\n",
+              " 'embeddings',\n",
+              " 'regression',\n",
+              " 'llm',\n",
+              " 'statsmodels',\n",
+              " 'ragas',\n",
+              " 'model_performance',\n",
+              " 'model_validation',\n",
+              " 'rag_performance',\n",
+              " 'model_training',\n",
+              " 'qualitative',\n",
+              " 'classification',\n",
+              " 'kmeans',\n",
+              " 'multiclass_classification',\n",
+              " 'linear_regression',\n",
+              " 'data_quality',\n",
+              " 'text_data',\n",
+              " 'binary_classification',\n",
+              " 'threshold_optimization',\n",
+              " 'stationarity',\n",
+              " 'bias_and_fairness',\n",
+              " 'scorecard',\n",
+              " 'model_explainability',\n",
+              " 'model_comparison',\n",
+              " 'numerical_data',\n",
+              " 'sklearn',\n",
+              " 'model_selection',\n",
+              " 'retrieval_performance',\n",
+              " 'zero_shot',\n",
+              " 'statistical_test',\n",
+              " 'descriptive_statistics',\n",
+              " 'seasonality',\n",
+              " 'analysis',\n",
+              " 'data_validation',\n",
+              " 'data_distribution',\n",
+              " 'feature_importance',\n",
+              " 'metadata',\n",
+              " 'few_shot',\n",
+              " 'visualization',\n",
+              " 'credit_risk',\n",
+              " 'forecasting',\n",
+              " 'AUC',\n",
+              " 'logistic_regression',\n",
+              " 'model_diagnosis',\n",
+              " 'model_interpretation',\n",
+              " 'unit_root_test',\n",
+              " 'categorical_data',\n",
+              " 'data_analysis']"
+            ]
+          },
+          "execution_count": null,
+          "metadata": {},
+          "output_type": "execute_result"
+        }
       ],
-      "text/plain": [
-       "<pandas.io.formats.style.Styler at 0x38000adc0>"
+      "source": [
+        "list_tags()"
       ]
-     },
-     "execution_count": 5,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "list_tasks_and_tags()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Filter tests by tags and task types\n",
-    "\n",
-    "While listing all tests is useful, you’ll often want to narrow your search. The [list_tests()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) function supports `filter`, `task`, and `tags` parameters to assist in refining your results.\n",
-    "\n",
-    "Use the `filter` parameter to find tests that match a specific keyword, such as `sklearn`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 6,
-   "metadata": {},
-   "outputs": [
+    },
     {
-     "data": {
-      "text/html": [
-       "<style type=\"text/css\">\n",
-       "#T_326c3 th {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "#T_326c3_row0_col0, #T_326c3_row0_col1, #T_326c3_row0_col2, #T_326c3_row0_col3, #T_326c3_row0_col4, #T_326c3_row0_col5, #T_326c3_row0_col6, #T_326c3_row0_col7, #T_326c3_row0_col8, #T_326c3_row1_col0, #T_326c3_row1_col1, #T_326c3_row1_col2, #T_326c3_row1_col3, #T_326c3_row1_col4, #T_326c3_row1_col5, #T_326c3_row1_col6, #T_326c3_row1_col7, #T_326c3_row1_col8, #T_326c3_row2_col0, #T_326c3_row2_col1, #T_326c3_row2_col2, #T_326c3_row2_col3, #T_326c3_row2_col4, #T_326c3_row2_col5, #T_326c3_row2_col6, #T_326c3_row2_col7, #T_326c3_row2_col8, #T_326c3_row3_col0, #T_326c3_row3_col1, #T_326c3_row3_col2, #T_326c3_row3_col3, #T_326c3_row3_col4, #T_326c3_row3_col5, #T_326c3_row3_col6, #T_326c3_row3_col7, #T_326c3_row3_col8, #T_326c3_row4_col0, #T_326c3_row4_col1, #T_326c3_row4_col2, #T_326c3_row4_col3, #T_326c3_row4_col4, #T_326c3_row4_col5, #T_326c3_row4_col6, #T_326c3_row4_col7, #T_326c3_row4_col8, #T_326c3_row5_col0, #T_326c3_row5_col1, #T_326c3_row5_col2, #T_326c3_row5_col3, #T_326c3_row5_col4, #T_326c3_row5_col5, #T_326c3_row5_col6, #T_326c3_row5_col7, #T_326c3_row5_col8, #T_326c3_row6_col0, #T_326c3_row6_col1, #T_326c3_row6_col2, #T_326c3_row6_col3, #T_326c3_row6_col4, #T_326c3_row6_col5, #T_326c3_row6_col6, #T_326c3_row6_col7, #T_326c3_row6_col8, #T_326c3_row7_col0, #T_326c3_row7_col1, #T_326c3_row7_col2, #T_326c3_row7_col3, #T_326c3_row7_col4, #T_326c3_row7_col5, #T_326c3_row7_col6, #T_326c3_row7_col7, #T_326c3_row7_col8, #T_326c3_row8_col0, #T_326c3_row8_col1, #T_326c3_row8_col2, #T_326c3_row8_col3, #T_326c3_row8_col4, #T_326c3_row8_col5, #T_326c3_row8_col6, #T_326c3_row8_col7, #T_326c3_row8_col8, #T_326c3_row9_col0, #T_326c3_row9_col1, #T_326c3_row9_col2, #T_326c3_row9_col3, #T_326c3_row9_col4, #T_326c3_row9_col5, #T_326c3_row9_col6, #T_326c3_row9_col7, #T_326c3_row9_col8, #T_326c3_row10_col0, #T_326c3_row10_col1, #T_326c3_row10_col2, #T_326c3_row10_col3, #T_326c3_row10_col4, #T_326c3_row10_col5, #T_326c3_row10_col6, #T_326c3_row10_col7, #T_326c3_row10_col8, 
#T_326c3_row11_col0, #T_326c3_row11_col1, #T_326c3_row11_col2, #T_326c3_row11_col3, #T_326c3_row11_col4, #T_326c3_row11_col5, #T_326c3_row11_col6, #T_326c3_row11_col7, #T_326c3_row11_col8, #T_326c3_row12_col0, #T_326c3_row12_col1, #T_326c3_row12_col2, #T_326c3_row12_col3, #T_326c3_row12_col4, #T_326c3_row12_col5, #T_326c3_row12_col6, #T_326c3_row12_col7, #T_326c3_row12_col8, #T_326c3_row13_col0, #T_326c3_row13_col1, #T_326c3_row13_col2, #T_326c3_row13_col3, #T_326c3_row13_col4, #T_326c3_row13_col5, #T_326c3_row13_col6, #T_326c3_row13_col7, #T_326c3_row13_col8, #T_326c3_row14_col0, #T_326c3_row14_col1, #T_326c3_row14_col2, #T_326c3_row14_col3, #T_326c3_row14_col4, #T_326c3_row14_col5, #T_326c3_row14_col6, #T_326c3_row14_col7, #T_326c3_row14_col8, #T_326c3_row15_col0, #T_326c3_row15_col1, #T_326c3_row15_col2, #T_326c3_row15_col3, #T_326c3_row15_col4, #T_326c3_row15_col5, #T_326c3_row15_col6, #T_326c3_row15_col7, #T_326c3_row15_col8, #T_326c3_row16_col0, #T_326c3_row16_col1, #T_326c3_row16_col2, #T_326c3_row16_col3, #T_326c3_row16_col4, #T_326c3_row16_col5, #T_326c3_row16_col6, #T_326c3_row16_col7, #T_326c3_row16_col8, #T_326c3_row17_col0, #T_326c3_row17_col1, #T_326c3_row17_col2, #T_326c3_row17_col3, #T_326c3_row17_col4, #T_326c3_row17_col5, #T_326c3_row17_col6, #T_326c3_row17_col7, #T_326c3_row17_col8, #T_326c3_row18_col0, #T_326c3_row18_col1, #T_326c3_row18_col2, #T_326c3_row18_col3, #T_326c3_row18_col4, #T_326c3_row18_col5, #T_326c3_row18_col6, #T_326c3_row18_col7, #T_326c3_row18_col8, #T_326c3_row19_col0, #T_326c3_row19_col1, #T_326c3_row19_col2, #T_326c3_row19_col3, #T_326c3_row19_col4, #T_326c3_row19_col5, #T_326c3_row19_col6, #T_326c3_row19_col7, #T_326c3_row19_col8, #T_326c3_row20_col0, #T_326c3_row20_col1, #T_326c3_row20_col2, #T_326c3_row20_col3, #T_326c3_row20_col4, #T_326c3_row20_col5, #T_326c3_row20_col6, #T_326c3_row20_col7, #T_326c3_row20_col8, #T_326c3_row21_col0, #T_326c3_row21_col1, #T_326c3_row21_col2, #T_326c3_row21_col3, #T_326c3_row21_col4, 
#T_326c3_row21_col5, #T_326c3_row21_col6, #T_326c3_row21_col7, #T_326c3_row21_col8, #T_326c3_row22_col0, #T_326c3_row22_col1, #T_326c3_row22_col2, #T_326c3_row22_col3, #T_326c3_row22_col4, #T_326c3_row22_col5, #T_326c3_row22_col6, #T_326c3_row22_col7, #T_326c3_row22_col8, #T_326c3_row23_col0, #T_326c3_row23_col1, #T_326c3_row23_col2, #T_326c3_row23_col3, #T_326c3_row23_col4, #T_326c3_row23_col5, #T_326c3_row23_col6, #T_326c3_row23_col7, #T_326c3_row23_col8, #T_326c3_row24_col0, #T_326c3_row24_col1, #T_326c3_row24_col2, #T_326c3_row24_col3, #T_326c3_row24_col4, #T_326c3_row24_col5, #T_326c3_row24_col6, #T_326c3_row24_col7, #T_326c3_row24_col8, #T_326c3_row25_col0, #T_326c3_row25_col1, #T_326c3_row25_col2, #T_326c3_row25_col3, #T_326c3_row25_col4, #T_326c3_row25_col5, #T_326c3_row25_col6, #T_326c3_row25_col7, #T_326c3_row25_col8, #T_326c3_row26_col0, #T_326c3_row26_col1, #T_326c3_row26_col2, #T_326c3_row26_col3, #T_326c3_row26_col4, #T_326c3_row26_col5, #T_326c3_row26_col6, #T_326c3_row26_col7, #T_326c3_row26_col8, #T_326c3_row27_col0, #T_326c3_row27_col1, #T_326c3_row27_col2, #T_326c3_row27_col3, #T_326c3_row27_col4, #T_326c3_row27_col5, #T_326c3_row27_col6, #T_326c3_row27_col7, #T_326c3_row27_col8, #T_326c3_row28_col0, #T_326c3_row28_col1, #T_326c3_row28_col2, #T_326c3_row28_col3, #T_326c3_row28_col4, #T_326c3_row28_col5, #T_326c3_row28_col6, #T_326c3_row28_col7, #T_326c3_row28_col8, #T_326c3_row29_col0, #T_326c3_row29_col1, #T_326c3_row29_col2, #T_326c3_row29_col3, #T_326c3_row29_col4, #T_326c3_row29_col5, #T_326c3_row29_col6, #T_326c3_row29_col7, #T_326c3_row29_col8, #T_326c3_row30_col0, #T_326c3_row30_col1, #T_326c3_row30_col2, #T_326c3_row30_col3, #T_326c3_row30_col4, #T_326c3_row30_col5, #T_326c3_row30_col6, #T_326c3_row30_col7, #T_326c3_row30_col8, #T_326c3_row31_col0, #T_326c3_row31_col1, #T_326c3_row31_col2, #T_326c3_row31_col3, #T_326c3_row31_col4, #T_326c3_row31_col5, #T_326c3_row31_col6, #T_326c3_row31_col7, #T_326c3_row31_col8, #T_326c3_row32_col0, 
#T_326c3_row32_col1, #T_326c3_row32_col2, #T_326c3_row32_col3, #T_326c3_row32_col4, #T_326c3_row32_col5, #T_326c3_row32_col6, #T_326c3_row32_col7, #T_326c3_row32_col8, #T_326c3_row33_col0, #T_326c3_row33_col1, #T_326c3_row33_col2, #T_326c3_row33_col3, #T_326c3_row33_col4, #T_326c3_row33_col5, #T_326c3_row33_col6, #T_326c3_row33_col7, #T_326c3_row33_col8, #T_326c3_row34_col0, #T_326c3_row34_col1, #T_326c3_row34_col2, #T_326c3_row34_col3, #T_326c3_row34_col4, #T_326c3_row34_col5, #T_326c3_row34_col6, #T_326c3_row34_col7, #T_326c3_row34_col8, #T_326c3_row35_col0, #T_326c3_row35_col1, #T_326c3_row35_col2, #T_326c3_row35_col3, #T_326c3_row35_col4, #T_326c3_row35_col5, #T_326c3_row35_col6, #T_326c3_row35_col7, #T_326c3_row35_col8, #T_326c3_row36_col0, #T_326c3_row36_col1, #T_326c3_row36_col2, #T_326c3_row36_col3, #T_326c3_row36_col4, #T_326c3_row36_col5, #T_326c3_row36_col6, #T_326c3_row36_col7, #T_326c3_row36_col8, #T_326c3_row37_col0, #T_326c3_row37_col1, #T_326c3_row37_col2, #T_326c3_row37_col3, #T_326c3_row37_col4, #T_326c3_row37_col5, #T_326c3_row37_col6, #T_326c3_row37_col7, #T_326c3_row37_col8, #T_326c3_row38_col0, #T_326c3_row38_col1, #T_326c3_row38_col2, #T_326c3_row38_col3, #T_326c3_row38_col4, #T_326c3_row38_col5, #T_326c3_row38_col6, #T_326c3_row38_col7, #T_326c3_row38_col8, #T_326c3_row39_col0, #T_326c3_row39_col1, #T_326c3_row39_col2, #T_326c3_row39_col3, #T_326c3_row39_col4, #T_326c3_row39_col5, #T_326c3_row39_col6, #T_326c3_row39_col7, #T_326c3_row39_col8, #T_326c3_row40_col0, #T_326c3_row40_col1, #T_326c3_row40_col2, #T_326c3_row40_col3, #T_326c3_row40_col4, #T_326c3_row40_col5, #T_326c3_row40_col6, #T_326c3_row40_col7, #T_326c3_row40_col8, #T_326c3_row41_col0, #T_326c3_row41_col1, #T_326c3_row41_col2, #T_326c3_row41_col3, #T_326c3_row41_col4, #T_326c3_row41_col5, #T_326c3_row41_col6, #T_326c3_row41_col7, #T_326c3_row41_col8, #T_326c3_row42_col0, #T_326c3_row42_col1, #T_326c3_row42_col2, #T_326c3_row42_col3, #T_326c3_row42_col4, #T_326c3_row42_col5, 
#T_326c3_row42_col6, #T_326c3_row42_col7, #T_326c3_row42_col8 {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "</style>\n",
-       "<table id=\"T_326c3\">\n",
-       "  <thead>\n",
-       "    <tr>\n",
-       "      <th id=\"T_326c3_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
-       "      <th id=\"T_326c3_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
-       "      <th id=\"T_326c3_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
-       "      <th id=\"T_326c3_level0_col3\" class=\"col_heading level0 col3\" >Has Figure</th>\n",
-       "      <th id=\"T_326c3_level0_col4\" class=\"col_heading level0 col4\" >Has Table</th>\n",
-       "      <th id=\"T_326c3_level0_col5\" class=\"col_heading level0 col5\" >Required Inputs</th>\n",
-       "      <th id=\"T_326c3_level0_col6\" class=\"col_heading level0 col6\" >Params</th>\n",
-       "      <th id=\"T_326c3_level0_col7\" class=\"col_heading level0 col7\" >Tags</th>\n",
-       "      <th id=\"T_326c3_level0_col8\" class=\"col_heading level0 col8\" >Tasks</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row0_col0\" class=\"data row0 col0\" >validmind.model_validation.ClusterSizeDistribution</td>\n",
-       "      <td id=\"T_326c3_row0_col1\" class=\"data row0 col1\" >Cluster Size Distribution</td>\n",
-       "      <td id=\"T_326c3_row0_col2\" class=\"data row0 col2\" >Assesses the performance of clustering models by comparing the distribution of cluster sizes in model predictions...</td>\n",
-       "      <td id=\"T_326c3_row0_col3\" class=\"data row0 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row0_col4\" class=\"data row0 col4\" >False</td>\n",
-       "      <td id=\"T_326c3_row0_col5\" class=\"data row0 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row0_col6\" class=\"data row0 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row0_col7\" class=\"data row0 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row0_col8\" class=\"data row0 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row1_col0\" class=\"data row1 col0\" >validmind.model_validation.TimeSeriesR2SquareBySegments</td>\n",
-       "      <td id=\"T_326c3_row1_col1\" class=\"data row1 col1\" >Time Series R2 Square By Segments</td>\n",
-       "      <td id=\"T_326c3_row1_col2\" class=\"data row1 col2\" >Evaluates the R-Squared values of regression models over specified time segments in time series data to assess...</td>\n",
-       "      <td id=\"T_326c3_row1_col3\" class=\"data row1 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row1_col4\" class=\"data row1 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row1_col5\" class=\"data row1 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row1_col6\" class=\"data row1 col6\" >{'segments': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_326c3_row1_col7\" class=\"data row1 col7\" >['model_performance', 'sklearn']</td>\n",
-       "      <td id=\"T_326c3_row1_col8\" class=\"data row1 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row2_col0\" class=\"data row2 col0\" >validmind.model_validation.sklearn.AdjustedMutualInformation</td>\n",
-       "      <td id=\"T_326c3_row2_col1\" class=\"data row2 col1\" >Adjusted Mutual Information</td>\n",
-       "      <td id=\"T_326c3_row2_col2\" class=\"data row2 col2\" >Evaluates clustering model performance by measuring mutual information between true and predicted labels, adjusting...</td>\n",
-       "      <td id=\"T_326c3_row2_col3\" class=\"data row2 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row2_col4\" class=\"data row2 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row2_col5\" class=\"data row2 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row2_col6\" class=\"data row2 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row2_col7\" class=\"data row2 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
-       "      <td id=\"T_326c3_row2_col8\" class=\"data row2 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row3_col0\" class=\"data row3 col0\" >validmind.model_validation.sklearn.AdjustedRandIndex</td>\n",
-       "      <td id=\"T_326c3_row3_col1\" class=\"data row3 col1\" >Adjusted Rand Index</td>\n",
-       "      <td id=\"T_326c3_row3_col2\" class=\"data row3 col2\" >Measures the similarity between two data clusters using the Adjusted Rand Index (ARI) metric in clustering machine...</td>\n",
-       "      <td id=\"T_326c3_row3_col3\" class=\"data row3 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row3_col4\" class=\"data row3 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row3_col5\" class=\"data row3 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row3_col6\" class=\"data row3 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row3_col7\" class=\"data row3 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
-       "      <td id=\"T_326c3_row3_col8\" class=\"data row3 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row4_col0\" class=\"data row4 col0\" >validmind.model_validation.sklearn.CalibrationCurve</td>\n",
-       "      <td id=\"T_326c3_row4_col1\" class=\"data row4 col1\" >Calibration Curve</td>\n",
-       "      <td id=\"T_326c3_row4_col2\" class=\"data row4 col2\" >Evaluates the calibration of probability estimates by comparing predicted probabilities against observed...</td>\n",
-       "      <td id=\"T_326c3_row4_col3\" class=\"data row4 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row4_col4\" class=\"data row4 col4\" >False</td>\n",
-       "      <td id=\"T_326c3_row4_col5\" class=\"data row4 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row4_col6\" class=\"data row4 col6\" >{'n_bins': {'type': 'int', 'default': 10}}</td>\n",
-       "      <td id=\"T_326c3_row4_col7\" class=\"data row4 col7\" >['sklearn', 'model_performance', 'classification']</td>\n",
-       "      <td id=\"T_326c3_row4_col8\" class=\"data row4 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row5_col0\" class=\"data row5 col0\" >validmind.model_validation.sklearn.ClassifierPerformance</td>\n",
-       "      <td id=\"T_326c3_row5_col1\" class=\"data row5 col1\" >Classifier Performance</td>\n",
-       "      <td id=\"T_326c3_row5_col2\" class=\"data row5 col2\" >Evaluates performance of binary or multiclass classification models using precision, recall, F1-Score, accuracy,...</td>\n",
-       "      <td id=\"T_326c3_row5_col3\" class=\"data row5 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row5_col4\" class=\"data row5 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row5_col5\" class=\"data row5 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row5_col6\" class=\"data row5 col6\" >{'average': {'type': 'str', 'default': 'macro'}}</td>\n",
-       "      <td id=\"T_326c3_row5_col7\" class=\"data row5 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row5_col8\" class=\"data row5 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row6_col0\" class=\"data row6 col0\" >validmind.model_validation.sklearn.ClassifierThresholdOptimization</td>\n",
-       "      <td id=\"T_326c3_row6_col1\" class=\"data row6 col1\" >Classifier Threshold Optimization</td>\n",
-       "      <td id=\"T_326c3_row6_col2\" class=\"data row6 col2\" >Analyzes and visualizes different threshold optimization methods for binary classification models....</td>\n",
-       "      <td id=\"T_326c3_row6_col3\" class=\"data row6 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row6_col4\" class=\"data row6 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row6_col5\" class=\"data row6 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row6_col6\" class=\"data row6 col6\" >{'methods': {'type': None, 'default': None}, 'target_recall': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_326c3_row6_col7\" class=\"data row6 col7\" >['model_validation', 'threshold_optimization', 'classification_metrics']</td>\n",
-       "      <td id=\"T_326c3_row6_col8\" class=\"data row6 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row7_col0\" class=\"data row7 col0\" >validmind.model_validation.sklearn.ClusterCosineSimilarity</td>\n",
-       "      <td id=\"T_326c3_row7_col1\" class=\"data row7 col1\" >Cluster Cosine Similarity</td>\n",
-       "      <td id=\"T_326c3_row7_col2\" class=\"data row7 col2\" >Measures the intra-cluster similarity of a clustering model using cosine similarity....</td>\n",
-       "      <td id=\"T_326c3_row7_col3\" class=\"data row7 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row7_col4\" class=\"data row7 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row7_col5\" class=\"data row7 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row7_col6\" class=\"data row7 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row7_col7\" class=\"data row7 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
-       "      <td id=\"T_326c3_row7_col8\" class=\"data row7 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row8_col0\" class=\"data row8 col0\" >validmind.model_validation.sklearn.ClusterPerformanceMetrics</td>\n",
-       "      <td id=\"T_326c3_row8_col1\" class=\"data row8 col1\" >Cluster Performance Metrics</td>\n",
-       "      <td id=\"T_326c3_row8_col2\" class=\"data row8 col2\" >Evaluates the performance of clustering machine learning models using multiple established metrics....</td>\n",
-       "      <td id=\"T_326c3_row8_col3\" class=\"data row8 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row8_col4\" class=\"data row8 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row8_col5\" class=\"data row8 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row8_col6\" class=\"data row8 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row8_col7\" class=\"data row8 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
-       "      <td id=\"T_326c3_row8_col8\" class=\"data row8 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row9_col0\" class=\"data row9 col0\" >validmind.model_validation.sklearn.CompletenessScore</td>\n",
-       "      <td id=\"T_326c3_row9_col1\" class=\"data row9 col1\" >Completeness Score</td>\n",
-       "      <td id=\"T_326c3_row9_col2\" class=\"data row9 col2\" >Evaluates a clustering model's capacity to categorize instances from a single class into the same cluster....</td>\n",
-       "      <td id=\"T_326c3_row9_col3\" class=\"data row9 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row9_col4\" class=\"data row9 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row9_col5\" class=\"data row9 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row9_col6\" class=\"data row9 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row9_col7\" class=\"data row9 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
-       "      <td id=\"T_326c3_row9_col8\" class=\"data row9 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row10_col0\" class=\"data row10 col0\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
-       "      <td id=\"T_326c3_row10_col1\" class=\"data row10 col1\" >Confusion Matrix</td>\n",
-       "      <td id=\"T_326c3_row10_col2\" class=\"data row10 col2\" >Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix...</td>\n",
-       "      <td id=\"T_326c3_row10_col3\" class=\"data row10 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row10_col4\" class=\"data row10 col4\" >False</td>\n",
-       "      <td id=\"T_326c3_row10_col5\" class=\"data row10 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row10_col6\" class=\"data row10 col6\" >{'threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_326c3_row10_col7\" class=\"data row10 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_326c3_row10_col8\" class=\"data row10 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row11_col0\" class=\"data row11 col0\" >validmind.model_validation.sklearn.FeatureImportance</td>\n",
-       "      <td id=\"T_326c3_row11_col1\" class=\"data row11 col1\" >Feature Importance</td>\n",
-       "      <td id=\"T_326c3_row11_col2\" class=\"data row11 col2\" >Compute feature importance scores for a given model and generate a summary table...</td>\n",
-       "      <td id=\"T_326c3_row11_col3\" class=\"data row11 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row11_col4\" class=\"data row11 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row11_col5\" class=\"data row11 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row11_col6\" class=\"data row11 col6\" >{'num_features': {'type': 'int', 'default': 3}}</td>\n",
-       "      <td id=\"T_326c3_row11_col7\" class=\"data row11 col7\" >['model_explainability', 'sklearn']</td>\n",
-       "      <td id=\"T_326c3_row11_col8\" class=\"data row11 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row12_col0\" class=\"data row12 col0\" >validmind.model_validation.sklearn.FowlkesMallowsScore</td>\n",
-       "      <td id=\"T_326c3_row12_col1\" class=\"data row12 col1\" >Fowlkes Mallows Score</td>\n",
-       "      <td id=\"T_326c3_row12_col2\" class=\"data row12 col2\" >Evaluates the similarity between predicted and actual cluster assignments in a model using the Fowlkes-Mallows...</td>\n",
-       "      <td id=\"T_326c3_row12_col3\" class=\"data row12 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row12_col4\" class=\"data row12 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row12_col5\" class=\"data row12 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row12_col6\" class=\"data row12 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row12_col7\" class=\"data row12 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row12_col8\" class=\"data row12 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row13_col0\" class=\"data row13 col0\" >validmind.model_validation.sklearn.HomogeneityScore</td>\n",
-       "      <td id=\"T_326c3_row13_col1\" class=\"data row13 col1\" >Homogeneity Score</td>\n",
-       "      <td id=\"T_326c3_row13_col2\" class=\"data row13 col2\" >Assesses clustering homogeneity by comparing true and predicted labels, scoring from 0 (heterogeneous) to 1...</td>\n",
-       "      <td id=\"T_326c3_row13_col3\" class=\"data row13 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row13_col4\" class=\"data row13 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row13_col5\" class=\"data row13 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row13_col6\" class=\"data row13 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row13_col7\" class=\"data row13 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row13_col8\" class=\"data row13 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row14_col0\" class=\"data row14 col0\" >validmind.model_validation.sklearn.HyperParametersTuning</td>\n",
-       "      <td id=\"T_326c3_row14_col1\" class=\"data row14 col1\" >Hyper Parameters Tuning</td>\n",
-       "      <td id=\"T_326c3_row14_col2\" class=\"data row14 col2\" >Performs exhaustive grid search over specified parameter ranges to find optimal model configurations...</td>\n",
-       "      <td id=\"T_326c3_row14_col3\" class=\"data row14 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row14_col4\" class=\"data row14 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row14_col5\" class=\"data row14 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row14_col6\" class=\"data row14 col6\" >{'param_grid': {'type': 'dict', 'default': None}, 'scoring': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}, 'fit_params': {'type': 'dict', 'default': None}}</td>\n",
-       "      <td id=\"T_326c3_row14_col7\" class=\"data row14 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row14_col8\" class=\"data row14 col8\" >['clustering', 'classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row15_col0\" class=\"data row15 col0\" >validmind.model_validation.sklearn.KMeansClustersOptimization</td>\n",
-       "      <td id=\"T_326c3_row15_col1\" class=\"data row15 col1\" >K Means Clusters Optimization</td>\n",
-       "      <td id=\"T_326c3_row15_col2\" class=\"data row15 col2\" >Optimizes the number of clusters in K-means models using Elbow and Silhouette methods....</td>\n",
-       "      <td id=\"T_326c3_row15_col3\" class=\"data row15 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row15_col4\" class=\"data row15 col4\" >False</td>\n",
-       "      <td id=\"T_326c3_row15_col5\" class=\"data row15 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row15_col6\" class=\"data row15 col6\" >{'n_clusters': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_326c3_row15_col7\" class=\"data row15 col7\" >['sklearn', 'model_performance', 'kmeans']</td>\n",
-       "      <td id=\"T_326c3_row15_col8\" class=\"data row15 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row16_col0\" class=\"data row16 col0\" >validmind.model_validation.sklearn.MinimumAccuracy</td>\n",
-       "      <td id=\"T_326c3_row16_col1\" class=\"data row16 col1\" >Minimum Accuracy</td>\n",
-       "      <td id=\"T_326c3_row16_col2\" class=\"data row16 col2\" >Checks if the model's prediction accuracy meets or surpasses a specified threshold....</td>\n",
-       "      <td id=\"T_326c3_row16_col3\" class=\"data row16 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row16_col4\" class=\"data row16 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row16_col5\" class=\"data row16 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row16_col6\" class=\"data row16 col6\" >{'min_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
-       "      <td id=\"T_326c3_row16_col7\" class=\"data row16 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row16_col8\" class=\"data row16 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row17_col0\" class=\"data row17 col0\" >validmind.model_validation.sklearn.MinimumF1Score</td>\n",
-       "      <td id=\"T_326c3_row17_col1\" class=\"data row17 col1\" >Minimum F1 Score</td>\n",
-       "      <td id=\"T_326c3_row17_col2\" class=\"data row17 col2\" >Assesses if the model's F1 score on the validation set meets a predefined minimum threshold, ensuring balanced...</td>\n",
-       "      <td id=\"T_326c3_row17_col3\" class=\"data row17 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row17_col4\" class=\"data row17 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row17_col5\" class=\"data row17 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row17_col6\" class=\"data row17 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_326c3_row17_col7\" class=\"data row17 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row17_col8\" class=\"data row17 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row18_col0\" class=\"data row18 col0\" >validmind.model_validation.sklearn.MinimumROCAUCScore</td>\n",
-       "      <td id=\"T_326c3_row18_col1\" class=\"data row18 col1\" >Minimum ROCAUC Score</td>\n",
-       "      <td id=\"T_326c3_row18_col2\" class=\"data row18 col2\" >Validates model by checking if the ROC AUC score meets or surpasses a specified threshold....</td>\n",
-       "      <td id=\"T_326c3_row18_col3\" class=\"data row18 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row18_col4\" class=\"data row18 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row18_col5\" class=\"data row18 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row18_col6\" class=\"data row18 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_326c3_row18_col7\" class=\"data row18 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row18_col8\" class=\"data row18 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row19_col0\" class=\"data row19 col0\" >validmind.model_validation.sklearn.ModelParameters</td>\n",
-       "      <td id=\"T_326c3_row19_col1\" class=\"data row19 col1\" >Model Parameters</td>\n",
-       "      <td id=\"T_326c3_row19_col2\" class=\"data row19 col2\" >Extracts and displays model parameters in a structured format for transparency and reproducibility....</td>\n",
-       "      <td id=\"T_326c3_row19_col3\" class=\"data row19 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row19_col4\" class=\"data row19 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row19_col5\" class=\"data row19 col5\" >['model']</td>\n",
-       "      <td id=\"T_326c3_row19_col6\" class=\"data row19 col6\" >{'model_params': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_326c3_row19_col7\" class=\"data row19 col7\" >['model_training', 'metadata']</td>\n",
-       "      <td id=\"T_326c3_row19_col8\" class=\"data row19 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row20_col0\" class=\"data row20 col0\" >validmind.model_validation.sklearn.ModelsPerformanceComparison</td>\n",
-       "      <td id=\"T_326c3_row20_col1\" class=\"data row20 col1\" >Models Performance Comparison</td>\n",
-       "      <td id=\"T_326c3_row20_col2\" class=\"data row20 col2\" >Evaluates and compares the performance of multiple Machine Learning models using various metrics like accuracy,...</td>\n",
-       "      <td id=\"T_326c3_row20_col3\" class=\"data row20 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row20_col4\" class=\"data row20 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row20_col5\" class=\"data row20 col5\" >['dataset', 'models']</td>\n",
-       "      <td id=\"T_326c3_row20_col6\" class=\"data row20 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row20_col7\" class=\"data row20 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'model_comparison']</td>\n",
-       "      <td id=\"T_326c3_row20_col8\" class=\"data row20 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row21_col0\" class=\"data row21 col0\" >validmind.model_validation.sklearn.OverfitDiagnosis</td>\n",
-       "      <td id=\"T_326c3_row21_col1\" class=\"data row21 col1\" >Overfit Diagnosis</td>\n",
-       "      <td id=\"T_326c3_row21_col2\" class=\"data row21 col2\" >Assesses potential overfitting in a model's predictions, identifying regions where performance between training and...</td>\n",
-       "      <td id=\"T_326c3_row21_col3\" class=\"data row21 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row21_col4\" class=\"data row21 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row21_col5\" class=\"data row21 col5\" >['model', 'datasets']</td>\n",
-       "      <td id=\"T_326c3_row21_col6\" class=\"data row21 col6\" >{'metric': {'type': 'str', 'default': None}, 'cut_off_threshold': {'type': 'float', 'default': 0.04}}</td>\n",
-       "      <td id=\"T_326c3_row21_col7\" class=\"data row21 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'linear_regression', 'model_diagnosis']</td>\n",
-       "      <td id=\"T_326c3_row21_col8\" class=\"data row21 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row22_col0\" class=\"data row22 col0\" >validmind.model_validation.sklearn.PermutationFeatureImportance</td>\n",
-       "      <td id=\"T_326c3_row22_col1\" class=\"data row22 col1\" >Permutation Feature Importance</td>\n",
-       "      <td id=\"T_326c3_row22_col2\" class=\"data row22 col2\" >Assesses the significance of each feature in a model by evaluating the impact on model performance when feature...</td>\n",
-       "      <td id=\"T_326c3_row22_col3\" class=\"data row22 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row22_col4\" class=\"data row22 col4\" >False</td>\n",
-       "      <td id=\"T_326c3_row22_col5\" class=\"data row22 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row22_col6\" class=\"data row22 col6\" >{'fontsize': {'type': None, 'default': None}, 'figure_height': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_326c3_row22_col7\" class=\"data row22 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
-       "      <td id=\"T_326c3_row22_col8\" class=\"data row22 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row23_col0\" class=\"data row23 col0\" >validmind.model_validation.sklearn.PopulationStabilityIndex</td>\n",
-       "      <td id=\"T_326c3_row23_col1\" class=\"data row23 col1\" >Population Stability Index</td>\n",
-       "      <td id=\"T_326c3_row23_col2\" class=\"data row23 col2\" >Assesses the Population Stability Index (PSI) to quantify the stability of an ML model's predictions across...</td>\n",
-       "      <td id=\"T_326c3_row23_col3\" class=\"data row23 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row23_col4\" class=\"data row23 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row23_col5\" class=\"data row23 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_326c3_row23_col6\" class=\"data row23 col6\" >{'num_bins': {'type': 'int', 'default': 10}, 'mode': {'type': 'str', 'default': 'fixed'}}</td>\n",
-       "      <td id=\"T_326c3_row23_col7\" class=\"data row23 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row23_col8\" class=\"data row23 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row24_col0\" class=\"data row24 col0\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
-       "      <td id=\"T_326c3_row24_col1\" class=\"data row24 col1\" >Precision Recall Curve</td>\n",
-       "      <td id=\"T_326c3_row24_col2\" class=\"data row24 col2\" >Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve....</td>\n",
-       "      <td id=\"T_326c3_row24_col3\" class=\"data row24 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row24_col4\" class=\"data row24 col4\" >False</td>\n",
-       "      <td id=\"T_326c3_row24_col5\" class=\"data row24 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row24_col6\" class=\"data row24 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row24_col7\" class=\"data row24 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_326c3_row24_col8\" class=\"data row24 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row25_col0\" class=\"data row25 col0\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
-       "      <td id=\"T_326c3_row25_col1\" class=\"data row25 col1\" >ROC Curve</td>\n",
-       "      <td id=\"T_326c3_row25_col2\" class=\"data row25 col2\" >Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic...</td>\n",
-       "      <td id=\"T_326c3_row25_col3\" class=\"data row25 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row25_col4\" class=\"data row25 col4\" >False</td>\n",
-       "      <td id=\"T_326c3_row25_col5\" class=\"data row25 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row25_col6\" class=\"data row25 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row25_col7\" class=\"data row25 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_326c3_row25_col8\" class=\"data row25 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row26_col0\" class=\"data row26 col0\" >validmind.model_validation.sklearn.RegressionErrors</td>\n",
-       "      <td id=\"T_326c3_row26_col1\" class=\"data row26 col1\" >Regression Errors</td>\n",
-       "      <td id=\"T_326c3_row26_col2\" class=\"data row26 col2\" >Assesses the performance and error distribution of a regression model using various error metrics....</td>\n",
-       "      <td id=\"T_326c3_row26_col3\" class=\"data row26 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row26_col4\" class=\"data row26 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row26_col5\" class=\"data row26 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row26_col6\" class=\"data row26 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row26_col7\" class=\"data row26 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row26_col8\" class=\"data row26 col8\" >['regression', 'classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row27_col0\" class=\"data row27 col0\" >validmind.model_validation.sklearn.RegressionErrorsComparison</td>\n",
-       "      <td id=\"T_326c3_row27_col1\" class=\"data row27 col1\" >Regression Errors Comparison</td>\n",
-       "      <td id=\"T_326c3_row27_col2\" class=\"data row27 col2\" >Assesses multiple regression error metrics to compare model performance across different datasets, emphasizing...</td>\n",
-       "      <td id=\"T_326c3_row27_col3\" class=\"data row27 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row27_col4\" class=\"data row27 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row27_col5\" class=\"data row27 col5\" >['datasets', 'models']</td>\n",
-       "      <td id=\"T_326c3_row27_col6\" class=\"data row27 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row27_col7\" class=\"data row27 col7\" >['model_performance', 'sklearn']</td>\n",
-       "      <td id=\"T_326c3_row27_col8\" class=\"data row27 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row28_col0\" class=\"data row28 col0\" >validmind.model_validation.sklearn.RegressionPerformance</td>\n",
-       "      <td id=\"T_326c3_row28_col1\" class=\"data row28 col1\" >Regression Performance</td>\n",
-       "      <td id=\"T_326c3_row28_col2\" class=\"data row28 col2\" >Evaluates the performance of a regression model using five different metrics: MAE, MSE, RMSE, MAPE, and MBD....</td>\n",
-       "      <td id=\"T_326c3_row28_col3\" class=\"data row28 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row28_col4\" class=\"data row28 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row28_col5\" class=\"data row28 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row28_col6\" class=\"data row28 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row28_col7\" class=\"data row28 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row28_col8\" class=\"data row28 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row29_col0\" class=\"data row29 col0\" >validmind.model_validation.sklearn.RegressionR2Square</td>\n",
-       "      <td id=\"T_326c3_row29_col1\" class=\"data row29 col1\" >Regression R2 Square</td>\n",
-       "      <td id=\"T_326c3_row29_col2\" class=\"data row29 col2\" >Assesses the overall goodness-of-fit of a regression model by evaluating R-squared (R2) and Adjusted R-squared (Adj...</td>\n",
-       "      <td id=\"T_326c3_row29_col3\" class=\"data row29 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row29_col4\" class=\"data row29 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row29_col5\" class=\"data row29 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row29_col6\" class=\"data row29 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row29_col7\" class=\"data row29 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row29_col8\" class=\"data row29 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row30_col0\" class=\"data row30 col0\" >validmind.model_validation.sklearn.RegressionR2SquareComparison</td>\n",
-       "      <td id=\"T_326c3_row30_col1\" class=\"data row30 col1\" >Regression R2 Square Comparison</td>\n",
-       "      <td id=\"T_326c3_row30_col2\" class=\"data row30 col2\" >Compares R-Squared and Adjusted R-Squared values for different regression models across multiple datasets to assess...</td>\n",
-       "      <td id=\"T_326c3_row30_col3\" class=\"data row30 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row30_col4\" class=\"data row30 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row30_col5\" class=\"data row30 col5\" >['datasets', 'models']</td>\n",
-       "      <td id=\"T_326c3_row30_col6\" class=\"data row30 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row30_col7\" class=\"data row30 col7\" >['model_performance', 'sklearn']</td>\n",
-       "      <td id=\"T_326c3_row30_col8\" class=\"data row30 col8\" >['regression', 'time_series_forecasting']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row31_col0\" class=\"data row31 col0\" >validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
-       "      <td id=\"T_326c3_row31_col1\" class=\"data row31 col1\" >Robustness Diagnosis</td>\n",
-       "      <td id=\"T_326c3_row31_col2\" class=\"data row31 col2\" >Assesses the robustness of a machine learning model by evaluating performance decay under noisy conditions....</td>\n",
-       "      <td id=\"T_326c3_row31_col3\" class=\"data row31 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row31_col4\" class=\"data row31 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row31_col5\" class=\"data row31 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_326c3_row31_col6\" class=\"data row31 col6\" >{'metric': {'type': 'str', 'default': None}, 'scaling_factor_std_dev_list': {'type': None, 'default': [0.1, 0.2, 0.3, 0.4, 0.5]}, 'performance_decay_threshold': {'type': 'float', 'default': 0.05}}</td>\n",
-       "      <td id=\"T_326c3_row31_col7\" class=\"data row31 col7\" >['sklearn', 'model_diagnosis', 'visualization']</td>\n",
-       "      <td id=\"T_326c3_row31_col8\" class=\"data row31 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row32_col0\" class=\"data row32 col0\" >validmind.model_validation.sklearn.SHAPGlobalImportance</td>\n",
-       "      <td id=\"T_326c3_row32_col1\" class=\"data row32 col1\" >SHAP Global Importance</td>\n",
-       "      <td id=\"T_326c3_row32_col2\" class=\"data row32 col2\" >Evaluates and visualizes global feature importance using SHAP values for model explanation and risk identification....</td>\n",
-       "      <td id=\"T_326c3_row32_col3\" class=\"data row32 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row32_col4\" class=\"data row32 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row32_col5\" class=\"data row32 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row32_col6\" class=\"data row32 col6\" >{'kernel_explainer_samples': {'type': 'int', 'default': 10}, 'tree_or_linear_explainer_samples': {'type': 'int', 'default': 200}, 'class_of_interest': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_326c3_row32_col7\" class=\"data row32 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
-       "      <td id=\"T_326c3_row32_col8\" class=\"data row32 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row33_col0\" class=\"data row33 col0\" >validmind.model_validation.sklearn.ScoreProbabilityAlignment</td>\n",
-       "      <td id=\"T_326c3_row33_col1\" class=\"data row33 col1\" >Score Probability Alignment</td>\n",
-       "      <td id=\"T_326c3_row33_col2\" class=\"data row33 col2\" >Analyzes the alignment between credit scores and predicted probabilities....</td>\n",
-       "      <td id=\"T_326c3_row33_col3\" class=\"data row33 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row33_col4\" class=\"data row33 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row33_col5\" class=\"data row33 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row33_col6\" class=\"data row33 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'n_bins': {'type': 'int', 'default': 10}}</td>\n",
-       "      <td id=\"T_326c3_row33_col7\" class=\"data row33 col7\" >['visualization', 'credit_risk', 'calibration']</td>\n",
-       "      <td id=\"T_326c3_row33_col8\" class=\"data row33 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row34_col0\" class=\"data row34 col0\" >validmind.model_validation.sklearn.SilhouettePlot</td>\n",
-       "      <td id=\"T_326c3_row34_col1\" class=\"data row34 col1\" >Silhouette Plot</td>\n",
-       "      <td id=\"T_326c3_row34_col2\" class=\"data row34 col2\" >Calculates and visualizes Silhouette Score, assessing the degree of data point suitability to its cluster in ML...</td>\n",
-       "      <td id=\"T_326c3_row34_col3\" class=\"data row34 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row34_col4\" class=\"data row34 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row34_col5\" class=\"data row34 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_326c3_row34_col6\" class=\"data row34 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row34_col7\" class=\"data row34 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row34_col8\" class=\"data row34 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row35_col0\" class=\"data row35 col0\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
-       "      <td id=\"T_326c3_row35_col1\" class=\"data row35 col1\" >Training Test Degradation</td>\n",
-       "      <td id=\"T_326c3_row35_col2\" class=\"data row35 col2\" >Tests if model performance degradation between training and test datasets exceeds a predefined threshold....</td>\n",
-       "      <td id=\"T_326c3_row35_col3\" class=\"data row35 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row35_col4\" class=\"data row35 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row35_col5\" class=\"data row35 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_326c3_row35_col6\" class=\"data row35 col6\" >{'max_threshold': {'type': 'float', 'default': 0.1}}</td>\n",
-       "      <td id=\"T_326c3_row35_col7\" class=\"data row35 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_326c3_row35_col8\" class=\"data row35 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row36_col0\" class=\"data row36 col0\" >validmind.model_validation.sklearn.VMeasure</td>\n",
-       "      <td id=\"T_326c3_row36_col1\" class=\"data row36 col1\" >V Measure</td>\n",
-       "      <td id=\"T_326c3_row36_col2\" class=\"data row36 col2\" >Evaluates homogeneity and completeness of a clustering model using the V Measure Score....</td>\n",
-       "      <td id=\"T_326c3_row36_col3\" class=\"data row36 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row36_col4\" class=\"data row36 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row36_col5\" class=\"data row36 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_326c3_row36_col6\" class=\"data row36 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row36_col7\" class=\"data row36 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row36_col8\" class=\"data row36 col8\" >['clustering']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row37_col0\" class=\"data row37 col0\" >validmind.model_validation.sklearn.WeakspotsDiagnosis</td>\n",
-       "      <td id=\"T_326c3_row37_col1\" class=\"data row37 col1\" >Weakspots Diagnosis</td>\n",
-       "      <td id=\"T_326c3_row37_col2\" class=\"data row37 col2\" >Identifies and visualizes weak spots in a machine learning model's performance across various sections of the...</td>\n",
-       "      <td id=\"T_326c3_row37_col3\" class=\"data row37 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row37_col4\" class=\"data row37 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row37_col5\" class=\"data row37 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_326c3_row37_col6\" class=\"data row37 col6\" >{'features_columns': {'type': None, 'default': None}, 'metrics': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_326c3_row37_col7\" class=\"data row37 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_diagnosis', 'visualization']</td>\n",
-       "      <td id=\"T_326c3_row37_col8\" class=\"data row37 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row38_col0\" class=\"data row38 col0\" >validmind.ongoing_monitoring.CalibrationCurveDrift</td>\n",
-       "      <td id=\"T_326c3_row38_col1\" class=\"data row38 col1\" >Calibration Curve Drift</td>\n",
-       "      <td id=\"T_326c3_row38_col2\" class=\"data row38 col2\" >Evaluates changes in probability calibration between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_326c3_row38_col3\" class=\"data row38 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row38_col4\" class=\"data row38 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row38_col5\" class=\"data row38 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_326c3_row38_col6\" class=\"data row38 col6\" >{'n_bins': {'type': 'int', 'default': 10}, 'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
-       "      <td id=\"T_326c3_row38_col7\" class=\"data row38 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_326c3_row38_col8\" class=\"data row38 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row39_col0\" class=\"data row39 col0\" >validmind.ongoing_monitoring.ClassDiscriminationDrift</td>\n",
-       "      <td id=\"T_326c3_row39_col1\" class=\"data row39 col1\" >Class Discrimination Drift</td>\n",
-       "      <td id=\"T_326c3_row39_col2\" class=\"data row39 col2\" >Compares classification discrimination metrics between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_326c3_row39_col3\" class=\"data row39 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row39_col4\" class=\"data row39 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row39_col5\" class=\"data row39 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_326c3_row39_col6\" class=\"data row39 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
-       "      <td id=\"T_326c3_row39_col7\" class=\"data row39 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row39_col8\" class=\"data row39 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row40_col0\" class=\"data row40 col0\" >validmind.ongoing_monitoring.ClassificationAccuracyDrift</td>\n",
-       "      <td id=\"T_326c3_row40_col1\" class=\"data row40 col1\" >Classification Accuracy Drift</td>\n",
-       "      <td id=\"T_326c3_row40_col2\" class=\"data row40 col2\" >Compares classification accuracy metrics between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_326c3_row40_col3\" class=\"data row40 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row40_col4\" class=\"data row40 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row40_col5\" class=\"data row40 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_326c3_row40_col6\" class=\"data row40 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
-       "      <td id=\"T_326c3_row40_col7\" class=\"data row40 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row40_col8\" class=\"data row40 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row41_col0\" class=\"data row41 col0\" >validmind.ongoing_monitoring.ConfusionMatrixDrift</td>\n",
-       "      <td id=\"T_326c3_row41_col1\" class=\"data row41 col1\" >Confusion Matrix Drift</td>\n",
-       "      <td id=\"T_326c3_row41_col2\" class=\"data row41 col2\" >Compares confusion matrix metrics between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_326c3_row41_col3\" class=\"data row41 col3\" >False</td>\n",
-       "      <td id=\"T_326c3_row41_col4\" class=\"data row41 col4\" >True</td>\n",
-       "      <td id=\"T_326c3_row41_col5\" class=\"data row41 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_326c3_row41_col6\" class=\"data row41 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
-       "      <td id=\"T_326c3_row41_col7\" class=\"data row41 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_326c3_row41_col8\" class=\"data row41 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_326c3_row42_col0\" class=\"data row42 col0\" >validmind.ongoing_monitoring.ROCCurveDrift</td>\n",
-       "      <td id=\"T_326c3_row42_col1\" class=\"data row42 col1\" >ROC Curve Drift</td>\n",
-       "      <td id=\"T_326c3_row42_col2\" class=\"data row42 col2\" >Compares ROC curves between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_326c3_row42_col3\" class=\"data row42 col3\" >True</td>\n",
-       "      <td id=\"T_326c3_row42_col4\" class=\"data row42 col4\" >False</td>\n",
-       "      <td id=\"T_326c3_row42_col5\" class=\"data row42 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_326c3_row42_col6\" class=\"data row42 col6\" >{}</td>\n",
-       "      <td id=\"T_326c3_row42_col7\" class=\"data row42 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_326c3_row42_col8\" class=\"data row42 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n"
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Finally, to match each task type with its related tags, use the [list_tasks_and_tags()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks_and_tags) function:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [
+        {
+          "data": {
+            "text/html": [
+              "<style type=\"text/css\">\n",
+              "#T_ac294 th {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "#T_ac294_row0_col0, #T_ac294_row0_col1, #T_ac294_row1_col0, #T_ac294_row1_col1, #T_ac294_row2_col0, #T_ac294_row2_col1, #T_ac294_row3_col0, #T_ac294_row3_col1, #T_ac294_row4_col0, #T_ac294_row4_col1, #T_ac294_row5_col0, #T_ac294_row5_col1, #T_ac294_row6_col0, #T_ac294_row6_col1, #T_ac294_row7_col0, #T_ac294_row7_col1, #T_ac294_row8_col0, #T_ac294_row8_col1, #T_ac294_row9_col0, #T_ac294_row9_col1, #T_ac294_row10_col0, #T_ac294_row10_col1, #T_ac294_row11_col0, #T_ac294_row11_col1, #T_ac294_row12_col0, #T_ac294_row12_col1, #T_ac294_row13_col0, #T_ac294_row13_col1 {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "</style>\n",
+              "<table id=\"T_ac294\">\n",
+              "  <thead>\n",
+              "    <tr>\n",
+              "      <th id=\"T_ac294_level0_col0\" class=\"col_heading level0 col0\" >Task</th>\n",
+              "      <th id=\"T_ac294_level0_col1\" class=\"col_heading level0 col1\" >Tags</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row0_col0\" class=\"data row0 col0\" >regression</td>\n",
+              "      <td id=\"T_ac294_row0_col1\" class=\"data row0 col1\" >senstivity_analysis, tabular_data, time_series_data, model_predictions, feature_selection, correlation, regression, statsmodels, model_performance, model_training, multiclass_classification, linear_regression, data_quality, text_data, model_explainability, binary_classification, stationarity, bias_and_fairness, numerical_data, sklearn, model_selection, statistical_test, descriptive_statistics, seasonality, analysis, data_validation, data_distribution, metadata, feature_importance, visualization, forecasting, model_diagnosis, model_interpretation, unit_root_test, categorical_data, data_analysis</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row1_col0\" class=\"data row1 col0\" >classification</td>\n",
+              "      <td id=\"T_ac294_row1_col1\" class=\"data row1 col1\" >calibration, anomaly_detection, classification_metrics, tabular_data, time_series_data, feature_selection, correlation, statsmodels, model_performance, model_validation, model_training, classification, multiclass_classification, linear_regression, data_quality, text_data, binary_classification, threshold_optimization, bias_and_fairness, scorecard, model_comparison, numerical_data, sklearn, statistical_test, descriptive_statistics, feature_importance, data_distribution, metadata, visualization, credit_risk, AUC, logistic_regression, model_diagnosis, categorical_data, data_analysis</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row2_col0\" class=\"data row2 col0\" >text_classification</td>\n",
+              "      <td id=\"T_ac294_row2_col1\" class=\"data row2 col1\" >model_performance, feature_importance, multiclass_classification, few_shot, frequency_analysis, zero_shot, text_data, visualization, llm, binary_classification, ragas, model_diagnosis, model_comparison, sklearn, nlp, retrieval_performance, tabular_data, time_series_data</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row3_col0\" class=\"data row3 col0\" >text_summarization</td>\n",
+              "      <td id=\"T_ac294_row3_col1\" class=\"data row3 col1\" >qualitative, few_shot, frequency_analysis, embeddings, zero_shot, text_data, visualization, llm, rag_performance, ragas, retrieval_performance, nlp, dimensionality_reduction, tabular_data, time_series_data</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row4_col0\" class=\"data row4 col0\" >data_validation</td>\n",
+              "      <td id=\"T_ac294_row4_col1\" class=\"data row4 col1\" >stationarity, statsmodels, unit_root_test, time_series_data</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row5_col0\" class=\"data row5 col0\" >time_series_forecasting</td>\n",
+              "      <td id=\"T_ac294_row5_col1\" class=\"data row5 col1\" >model_training, data_validation, metadata, visualization, model_explainability, sklearn, model_performance, model_predictions, time_series_data</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row6_col0\" class=\"data row6 col0\" >nlp</td>\n",
+              "      <td id=\"T_ac294_row6_col1\" class=\"data row6 col1\" >data_validation, frequency_analysis, text_data, visualization, nlp</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row7_col0\" class=\"data row7 col0\" >clustering</td>\n",
+              "      <td id=\"T_ac294_row7_col1\" class=\"data row7 col1\" >clustering, model_performance, kmeans, sklearn</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row8_col0\" class=\"data row8 col0\" >residual_analysis</td>\n",
+              "      <td id=\"T_ac294_row8_col1\" class=\"data row8 col1\" >regression</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row9_col0\" class=\"data row9 col0\" >visualization</td>\n",
+              "      <td id=\"T_ac294_row9_col1\" class=\"data row9 col1\" >regression</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row10_col0\" class=\"data row10 col0\" >feature_extraction</td>\n",
+              "      <td id=\"T_ac294_row10_col1\" class=\"data row10 col1\" >embeddings, text_data, visualization, llm</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row11_col0\" class=\"data row11 col0\" >text_qa</td>\n",
+              "      <td id=\"T_ac294_row11_col1\" class=\"data row11 col1\" >qualitative, embeddings, visualization, llm, rag_performance, ragas, dimensionality_reduction, retrieval_performance</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row12_col0\" class=\"data row12 col0\" >text_generation</td>\n",
+              "      <td id=\"T_ac294_row12_col1\" class=\"data row12 col1\" >qualitative, embeddings, visualization, llm, rag_performance, ragas, dimensionality_reduction, retrieval_performance</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_ac294_row13_col0\" class=\"data row13 col0\" >monitoring</td>\n",
+              "      <td id=\"T_ac294_row13_col1\" class=\"data row13 col1\" >visualization</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n"
+            ],
+            "text/plain": [
+              "<pandas.io.formats.style.Styler at 0x38000adc0>"
+            ]
+          },
+          "execution_count": null,
+          "metadata": {},
+          "output_type": "execute_result"
+        }
       ],
-      "text/plain": [
-       "<pandas.io.formats.style.Styler at 0x1052e6790>"
+      "source": [
+        "list_tasks_and_tags()"
       ]
-     },
-     "execution_count": 6,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "list_tests(filter=\"sklearn\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Use the `task` parameter to find tests that match a specific task type,  such as `classification`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 7,
-   "metadata": {},
-   "outputs": [
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Filter tests by tags and task types\n",
+        "\n",
+        "While listing all tests is useful, you’ll often want to narrow your search. The [list_tests()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) function supports `filter`, `task`, and `tags` parameters to assist in refining your results.\n",
+        "\n",
+        "Use the `filter` parameter to find tests that match a specific keyword, such as `sklearn`:"
+      ]
+    },
     {
-     "data": {
-      "text/html": [
-       "<style type=\"text/css\">\n",
-       "#T_56dd5 th {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "#T_56dd5_row0_col0, #T_56dd5_row0_col1, #T_56dd5_row0_col2, #T_56dd5_row0_col3, #T_56dd5_row0_col4, #T_56dd5_row0_col5, #T_56dd5_row0_col6, #T_56dd5_row0_col7, #T_56dd5_row0_col8, #T_56dd5_row1_col0, #T_56dd5_row1_col1, #T_56dd5_row1_col2, #T_56dd5_row1_col3, #T_56dd5_row1_col4, #T_56dd5_row1_col5, #T_56dd5_row1_col6, #T_56dd5_row1_col7, #T_56dd5_row1_col8, #T_56dd5_row2_col0, #T_56dd5_row2_col1, #T_56dd5_row2_col2, #T_56dd5_row2_col3, #T_56dd5_row2_col4, #T_56dd5_row2_col5, #T_56dd5_row2_col6, #T_56dd5_row2_col7, #T_56dd5_row2_col8, #T_56dd5_row3_col0, #T_56dd5_row3_col1, #T_56dd5_row3_col2, #T_56dd5_row3_col3, #T_56dd5_row3_col4, #T_56dd5_row3_col5, #T_56dd5_row3_col6, #T_56dd5_row3_col7, #T_56dd5_row3_col8, #T_56dd5_row4_col0, #T_56dd5_row4_col1, #T_56dd5_row4_col2, #T_56dd5_row4_col3, #T_56dd5_row4_col4, #T_56dd5_row4_col5, #T_56dd5_row4_col6, #T_56dd5_row4_col7, #T_56dd5_row4_col8, #T_56dd5_row5_col0, #T_56dd5_row5_col1, #T_56dd5_row5_col2, #T_56dd5_row5_col3, #T_56dd5_row5_col4, #T_56dd5_row5_col5, #T_56dd5_row5_col6, #T_56dd5_row5_col7, #T_56dd5_row5_col8, #T_56dd5_row6_col0, #T_56dd5_row6_col1, #T_56dd5_row6_col2, #T_56dd5_row6_col3, #T_56dd5_row6_col4, #T_56dd5_row6_col5, #T_56dd5_row6_col6, #T_56dd5_row6_col7, #T_56dd5_row6_col8, #T_56dd5_row7_col0, #T_56dd5_row7_col1, #T_56dd5_row7_col2, #T_56dd5_row7_col3, #T_56dd5_row7_col4, #T_56dd5_row7_col5, #T_56dd5_row7_col6, #T_56dd5_row7_col7, #T_56dd5_row7_col8, #T_56dd5_row8_col0, #T_56dd5_row8_col1, #T_56dd5_row8_col2, #T_56dd5_row8_col3, #T_56dd5_row8_col4, #T_56dd5_row8_col5, #T_56dd5_row8_col6, #T_56dd5_row8_col7, #T_56dd5_row8_col8, #T_56dd5_row9_col0, #T_56dd5_row9_col1, #T_56dd5_row9_col2, #T_56dd5_row9_col3, #T_56dd5_row9_col4, #T_56dd5_row9_col5, #T_56dd5_row9_col6, #T_56dd5_row9_col7, #T_56dd5_row9_col8, #T_56dd5_row10_col0, #T_56dd5_row10_col1, #T_56dd5_row10_col2, #T_56dd5_row10_col3, #T_56dd5_row10_col4, #T_56dd5_row10_col5, #T_56dd5_row10_col6, #T_56dd5_row10_col7, #T_56dd5_row10_col8, 
#T_56dd5_row11_col0, #T_56dd5_row11_col1, #T_56dd5_row11_col2, #T_56dd5_row11_col3, #T_56dd5_row11_col4, #T_56dd5_row11_col5, #T_56dd5_row11_col6, #T_56dd5_row11_col7, #T_56dd5_row11_col8, #T_56dd5_row12_col0, #T_56dd5_row12_col1, #T_56dd5_row12_col2, #T_56dd5_row12_col3, #T_56dd5_row12_col4, #T_56dd5_row12_col5, #T_56dd5_row12_col6, #T_56dd5_row12_col7, #T_56dd5_row12_col8, #T_56dd5_row13_col0, #T_56dd5_row13_col1, #T_56dd5_row13_col2, #T_56dd5_row13_col3, #T_56dd5_row13_col4, #T_56dd5_row13_col5, #T_56dd5_row13_col6, #T_56dd5_row13_col7, #T_56dd5_row13_col8, #T_56dd5_row14_col0, #T_56dd5_row14_col1, #T_56dd5_row14_col2, #T_56dd5_row14_col3, #T_56dd5_row14_col4, #T_56dd5_row14_col5, #T_56dd5_row14_col6, #T_56dd5_row14_col7, #T_56dd5_row14_col8, #T_56dd5_row15_col0, #T_56dd5_row15_col1, #T_56dd5_row15_col2, #T_56dd5_row15_col3, #T_56dd5_row15_col4, #T_56dd5_row15_col5, #T_56dd5_row15_col6, #T_56dd5_row15_col7, #T_56dd5_row15_col8, #T_56dd5_row16_col0, #T_56dd5_row16_col1, #T_56dd5_row16_col2, #T_56dd5_row16_col3, #T_56dd5_row16_col4, #T_56dd5_row16_col5, #T_56dd5_row16_col6, #T_56dd5_row16_col7, #T_56dd5_row16_col8, #T_56dd5_row17_col0, #T_56dd5_row17_col1, #T_56dd5_row17_col2, #T_56dd5_row17_col3, #T_56dd5_row17_col4, #T_56dd5_row17_col5, #T_56dd5_row17_col6, #T_56dd5_row17_col7, #T_56dd5_row17_col8, #T_56dd5_row18_col0, #T_56dd5_row18_col1, #T_56dd5_row18_col2, #T_56dd5_row18_col3, #T_56dd5_row18_col4, #T_56dd5_row18_col5, #T_56dd5_row18_col6, #T_56dd5_row18_col7, #T_56dd5_row18_col8, #T_56dd5_row19_col0, #T_56dd5_row19_col1, #T_56dd5_row19_col2, #T_56dd5_row19_col3, #T_56dd5_row19_col4, #T_56dd5_row19_col5, #T_56dd5_row19_col6, #T_56dd5_row19_col7, #T_56dd5_row19_col8, #T_56dd5_row20_col0, #T_56dd5_row20_col1, #T_56dd5_row20_col2, #T_56dd5_row20_col3, #T_56dd5_row20_col4, #T_56dd5_row20_col5, #T_56dd5_row20_col6, #T_56dd5_row20_col7, #T_56dd5_row20_col8, #T_56dd5_row21_col0, #T_56dd5_row21_col1, #T_56dd5_row21_col2, #T_56dd5_row21_col3, #T_56dd5_row21_col4, 
#T_56dd5_row21_col5, #T_56dd5_row21_col6, #T_56dd5_row21_col7, #T_56dd5_row21_col8, #T_56dd5_row22_col0, #T_56dd5_row22_col1, #T_56dd5_row22_col2, #T_56dd5_row22_col3, #T_56dd5_row22_col4, #T_56dd5_row22_col5, #T_56dd5_row22_col6, #T_56dd5_row22_col7, #T_56dd5_row22_col8, #T_56dd5_row23_col0, #T_56dd5_row23_col1, #T_56dd5_row23_col2, #T_56dd5_row23_col3, #T_56dd5_row23_col4, #T_56dd5_row23_col5, #T_56dd5_row23_col6, #T_56dd5_row23_col7, #T_56dd5_row23_col8, #T_56dd5_row24_col0, #T_56dd5_row24_col1, #T_56dd5_row24_col2, #T_56dd5_row24_col3, #T_56dd5_row24_col4, #T_56dd5_row24_col5, #T_56dd5_row24_col6, #T_56dd5_row24_col7, #T_56dd5_row24_col8, #T_56dd5_row25_col0, #T_56dd5_row25_col1, #T_56dd5_row25_col2, #T_56dd5_row25_col3, #T_56dd5_row25_col4, #T_56dd5_row25_col5, #T_56dd5_row25_col6, #T_56dd5_row25_col7, #T_56dd5_row25_col8, #T_56dd5_row26_col0, #T_56dd5_row26_col1, #T_56dd5_row26_col2, #T_56dd5_row26_col3, #T_56dd5_row26_col4, #T_56dd5_row26_col5, #T_56dd5_row26_col6, #T_56dd5_row26_col7, #T_56dd5_row26_col8, #T_56dd5_row27_col0, #T_56dd5_row27_col1, #T_56dd5_row27_col2, #T_56dd5_row27_col3, #T_56dd5_row27_col4, #T_56dd5_row27_col5, #T_56dd5_row27_col6, #T_56dd5_row27_col7, #T_56dd5_row27_col8, #T_56dd5_row28_col0, #T_56dd5_row28_col1, #T_56dd5_row28_col2, #T_56dd5_row28_col3, #T_56dd5_row28_col4, #T_56dd5_row28_col5, #T_56dd5_row28_col6, #T_56dd5_row28_col7, #T_56dd5_row28_col8, #T_56dd5_row29_col0, #T_56dd5_row29_col1, #T_56dd5_row29_col2, #T_56dd5_row29_col3, #T_56dd5_row29_col4, #T_56dd5_row29_col5, #T_56dd5_row29_col6, #T_56dd5_row29_col7, #T_56dd5_row29_col8, #T_56dd5_row30_col0, #T_56dd5_row30_col1, #T_56dd5_row30_col2, #T_56dd5_row30_col3, #T_56dd5_row30_col4, #T_56dd5_row30_col5, #T_56dd5_row30_col6, #T_56dd5_row30_col7, #T_56dd5_row30_col8, #T_56dd5_row31_col0, #T_56dd5_row31_col1, #T_56dd5_row31_col2, #T_56dd5_row31_col3, #T_56dd5_row31_col4, #T_56dd5_row31_col5, #T_56dd5_row31_col6, #T_56dd5_row31_col7, #T_56dd5_row31_col8, #T_56dd5_row32_col0, 
#T_56dd5_row32_col1, #T_56dd5_row32_col2, #T_56dd5_row32_col3, #T_56dd5_row32_col4, #T_56dd5_row32_col5, #T_56dd5_row32_col6, #T_56dd5_row32_col7, #T_56dd5_row32_col8, #T_56dd5_row33_col0, #T_56dd5_row33_col1, #T_56dd5_row33_col2, #T_56dd5_row33_col3, #T_56dd5_row33_col4, #T_56dd5_row33_col5, #T_56dd5_row33_col6, #T_56dd5_row33_col7, #T_56dd5_row33_col8, #T_56dd5_row34_col0, #T_56dd5_row34_col1, #T_56dd5_row34_col2, #T_56dd5_row34_col3, #T_56dd5_row34_col4, #T_56dd5_row34_col5, #T_56dd5_row34_col6, #T_56dd5_row34_col7, #T_56dd5_row34_col8, #T_56dd5_row35_col0, #T_56dd5_row35_col1, #T_56dd5_row35_col2, #T_56dd5_row35_col3, #T_56dd5_row35_col4, #T_56dd5_row35_col5, #T_56dd5_row35_col6, #T_56dd5_row35_col7, #T_56dd5_row35_col8, #T_56dd5_row36_col0, #T_56dd5_row36_col1, #T_56dd5_row36_col2, #T_56dd5_row36_col3, #T_56dd5_row36_col4, #T_56dd5_row36_col5, #T_56dd5_row36_col6, #T_56dd5_row36_col7, #T_56dd5_row36_col8, #T_56dd5_row37_col0, #T_56dd5_row37_col1, #T_56dd5_row37_col2, #T_56dd5_row37_col3, #T_56dd5_row37_col4, #T_56dd5_row37_col5, #T_56dd5_row37_col6, #T_56dd5_row37_col7, #T_56dd5_row37_col8, #T_56dd5_row38_col0, #T_56dd5_row38_col1, #T_56dd5_row38_col2, #T_56dd5_row38_col3, #T_56dd5_row38_col4, #T_56dd5_row38_col5, #T_56dd5_row38_col6, #T_56dd5_row38_col7, #T_56dd5_row38_col8, #T_56dd5_row39_col0, #T_56dd5_row39_col1, #T_56dd5_row39_col2, #T_56dd5_row39_col3, #T_56dd5_row39_col4, #T_56dd5_row39_col5, #T_56dd5_row39_col6, #T_56dd5_row39_col7, #T_56dd5_row39_col8, #T_56dd5_row40_col0, #T_56dd5_row40_col1, #T_56dd5_row40_col2, #T_56dd5_row40_col3, #T_56dd5_row40_col4, #T_56dd5_row40_col5, #T_56dd5_row40_col6, #T_56dd5_row40_col7, #T_56dd5_row40_col8, #T_56dd5_row41_col0, #T_56dd5_row41_col1, #T_56dd5_row41_col2, #T_56dd5_row41_col3, #T_56dd5_row41_col4, #T_56dd5_row41_col5, #T_56dd5_row41_col6, #T_56dd5_row41_col7, #T_56dd5_row41_col8, #T_56dd5_row42_col0, #T_56dd5_row42_col1, #T_56dd5_row42_col2, #T_56dd5_row42_col3, #T_56dd5_row42_col4, #T_56dd5_row42_col5, 
#T_56dd5_row42_col6, #T_56dd5_row42_col7, #T_56dd5_row42_col8, #T_56dd5_row43_col0, #T_56dd5_row43_col1, #T_56dd5_row43_col2, #T_56dd5_row43_col3, #T_56dd5_row43_col4, #T_56dd5_row43_col5, #T_56dd5_row43_col6, #T_56dd5_row43_col7, #T_56dd5_row43_col8, #T_56dd5_row44_col0, #T_56dd5_row44_col1, #T_56dd5_row44_col2, #T_56dd5_row44_col3, #T_56dd5_row44_col4, #T_56dd5_row44_col5, #T_56dd5_row44_col6, #T_56dd5_row44_col7, #T_56dd5_row44_col8, #T_56dd5_row45_col0, #T_56dd5_row45_col1, #T_56dd5_row45_col2, #T_56dd5_row45_col3, #T_56dd5_row45_col4, #T_56dd5_row45_col5, #T_56dd5_row45_col6, #T_56dd5_row45_col7, #T_56dd5_row45_col8, #T_56dd5_row46_col0, #T_56dd5_row46_col1, #T_56dd5_row46_col2, #T_56dd5_row46_col3, #T_56dd5_row46_col4, #T_56dd5_row46_col5, #T_56dd5_row46_col6, #T_56dd5_row46_col7, #T_56dd5_row46_col8, #T_56dd5_row47_col0, #T_56dd5_row47_col1, #T_56dd5_row47_col2, #T_56dd5_row47_col3, #T_56dd5_row47_col4, #T_56dd5_row47_col5, #T_56dd5_row47_col6, #T_56dd5_row47_col7, #T_56dd5_row47_col8, #T_56dd5_row48_col0, #T_56dd5_row48_col1, #T_56dd5_row48_col2, #T_56dd5_row48_col3, #T_56dd5_row48_col4, #T_56dd5_row48_col5, #T_56dd5_row48_col6, #T_56dd5_row48_col7, #T_56dd5_row48_col8, #T_56dd5_row49_col0, #T_56dd5_row49_col1, #T_56dd5_row49_col2, #T_56dd5_row49_col3, #T_56dd5_row49_col4, #T_56dd5_row49_col5, #T_56dd5_row49_col6, #T_56dd5_row49_col7, #T_56dd5_row49_col8, #T_56dd5_row50_col0, #T_56dd5_row50_col1, #T_56dd5_row50_col2, #T_56dd5_row50_col3, #T_56dd5_row50_col4, #T_56dd5_row50_col5, #T_56dd5_row50_col6, #T_56dd5_row50_col7, #T_56dd5_row50_col8, #T_56dd5_row51_col0, #T_56dd5_row51_col1, #T_56dd5_row51_col2, #T_56dd5_row51_col3, #T_56dd5_row51_col4, #T_56dd5_row51_col5, #T_56dd5_row51_col6, #T_56dd5_row51_col7, #T_56dd5_row51_col8, #T_56dd5_row52_col0, #T_56dd5_row52_col1, #T_56dd5_row52_col2, #T_56dd5_row52_col3, #T_56dd5_row52_col4, #T_56dd5_row52_col5, #T_56dd5_row52_col6, #T_56dd5_row52_col7, #T_56dd5_row52_col8, #T_56dd5_row53_col0, #T_56dd5_row53_col1, 
#T_56dd5_row53_col2, #T_56dd5_row53_col3, #T_56dd5_row53_col4, #T_56dd5_row53_col5, #T_56dd5_row53_col6, #T_56dd5_row53_col7, #T_56dd5_row53_col8, #T_56dd5_row54_col0, #T_56dd5_row54_col1, #T_56dd5_row54_col2, #T_56dd5_row54_col3, #T_56dd5_row54_col4, #T_56dd5_row54_col5, #T_56dd5_row54_col6, #T_56dd5_row54_col7, #T_56dd5_row54_col8, #T_56dd5_row55_col0, #T_56dd5_row55_col1, #T_56dd5_row55_col2, #T_56dd5_row55_col3, #T_56dd5_row55_col4, #T_56dd5_row55_col5, #T_56dd5_row55_col6, #T_56dd5_row55_col7, #T_56dd5_row55_col8, #T_56dd5_row56_col0, #T_56dd5_row56_col1, #T_56dd5_row56_col2, #T_56dd5_row56_col3, #T_56dd5_row56_col4, #T_56dd5_row56_col5, #T_56dd5_row56_col6, #T_56dd5_row56_col7, #T_56dd5_row56_col8, #T_56dd5_row57_col0, #T_56dd5_row57_col1, #T_56dd5_row57_col2, #T_56dd5_row57_col3, #T_56dd5_row57_col4, #T_56dd5_row57_col5, #T_56dd5_row57_col6, #T_56dd5_row57_col7, #T_56dd5_row57_col8, #T_56dd5_row58_col0, #T_56dd5_row58_col1, #T_56dd5_row58_col2, #T_56dd5_row58_col3, #T_56dd5_row58_col4, #T_56dd5_row58_col5, #T_56dd5_row58_col6, #T_56dd5_row58_col7, #T_56dd5_row58_col8, #T_56dd5_row59_col0, #T_56dd5_row59_col1, #T_56dd5_row59_col2, #T_56dd5_row59_col3, #T_56dd5_row59_col4, #T_56dd5_row59_col5, #T_56dd5_row59_col6, #T_56dd5_row59_col7, #T_56dd5_row59_col8, #T_56dd5_row60_col0, #T_56dd5_row60_col1, #T_56dd5_row60_col2, #T_56dd5_row60_col3, #T_56dd5_row60_col4, #T_56dd5_row60_col5, #T_56dd5_row60_col6, #T_56dd5_row60_col7, #T_56dd5_row60_col8, #T_56dd5_row61_col0, #T_56dd5_row61_col1, #T_56dd5_row61_col2, #T_56dd5_row61_col3, #T_56dd5_row61_col4, #T_56dd5_row61_col5, #T_56dd5_row61_col6, #T_56dd5_row61_col7, #T_56dd5_row61_col8, #T_56dd5_row62_col0, #T_56dd5_row62_col1, #T_56dd5_row62_col2, #T_56dd5_row62_col3, #T_56dd5_row62_col4, #T_56dd5_row62_col5, #T_56dd5_row62_col6, #T_56dd5_row62_col7, #T_56dd5_row62_col8, #T_56dd5_row63_col0, #T_56dd5_row63_col1, #T_56dd5_row63_col2, #T_56dd5_row63_col3, #T_56dd5_row63_col4, #T_56dd5_row63_col5, #T_56dd5_row63_col6, 
#T_56dd5_row63_col7, #T_56dd5_row63_col8, #T_56dd5_row64_col0, #T_56dd5_row64_col1, #T_56dd5_row64_col2, #T_56dd5_row64_col3, #T_56dd5_row64_col4, #T_56dd5_row64_col5, #T_56dd5_row64_col6, #T_56dd5_row64_col7, #T_56dd5_row64_col8, #T_56dd5_row65_col0, #T_56dd5_row65_col1, #T_56dd5_row65_col2, #T_56dd5_row65_col3, #T_56dd5_row65_col4, #T_56dd5_row65_col5, #T_56dd5_row65_col6, #T_56dd5_row65_col7, #T_56dd5_row65_col8, #T_56dd5_row66_col0, #T_56dd5_row66_col1, #T_56dd5_row66_col2, #T_56dd5_row66_col3, #T_56dd5_row66_col4, #T_56dd5_row66_col5, #T_56dd5_row66_col6, #T_56dd5_row66_col7, #T_56dd5_row66_col8, #T_56dd5_row67_col0, #T_56dd5_row67_col1, #T_56dd5_row67_col2, #T_56dd5_row67_col3, #T_56dd5_row67_col4, #T_56dd5_row67_col5, #T_56dd5_row67_col6, #T_56dd5_row67_col7, #T_56dd5_row67_col8, #T_56dd5_row68_col0, #T_56dd5_row68_col1, #T_56dd5_row68_col2, #T_56dd5_row68_col3, #T_56dd5_row68_col4, #T_56dd5_row68_col5, #T_56dd5_row68_col6, #T_56dd5_row68_col7, #T_56dd5_row68_col8, #T_56dd5_row69_col0, #T_56dd5_row69_col1, #T_56dd5_row69_col2, #T_56dd5_row69_col3, #T_56dd5_row69_col4, #T_56dd5_row69_col5, #T_56dd5_row69_col6, #T_56dd5_row69_col7, #T_56dd5_row69_col8, #T_56dd5_row70_col0, #T_56dd5_row70_col1, #T_56dd5_row70_col2, #T_56dd5_row70_col3, #T_56dd5_row70_col4, #T_56dd5_row70_col5, #T_56dd5_row70_col6, #T_56dd5_row70_col7, #T_56dd5_row70_col8, #T_56dd5_row71_col0, #T_56dd5_row71_col1, #T_56dd5_row71_col2, #T_56dd5_row71_col3, #T_56dd5_row71_col4, #T_56dd5_row71_col5, #T_56dd5_row71_col6, #T_56dd5_row71_col7, #T_56dd5_row71_col8, #T_56dd5_row72_col0, #T_56dd5_row72_col1, #T_56dd5_row72_col2, #T_56dd5_row72_col3, #T_56dd5_row72_col4, #T_56dd5_row72_col5, #T_56dd5_row72_col6, #T_56dd5_row72_col7, #T_56dd5_row72_col8, #T_56dd5_row73_col0, #T_56dd5_row73_col1, #T_56dd5_row73_col2, #T_56dd5_row73_col3, #T_56dd5_row73_col4, #T_56dd5_row73_col5, #T_56dd5_row73_col6, #T_56dd5_row73_col7, #T_56dd5_row73_col8, #T_56dd5_row74_col0, #T_56dd5_row74_col1, #T_56dd5_row74_col2, 
#T_56dd5_row74_col3, #T_56dd5_row74_col4, #T_56dd5_row74_col5, #T_56dd5_row74_col6, #T_56dd5_row74_col7, #T_56dd5_row74_col8, #T_56dd5_row75_col0, #T_56dd5_row75_col1, #T_56dd5_row75_col2, #T_56dd5_row75_col3, #T_56dd5_row75_col4, #T_56dd5_row75_col5, #T_56dd5_row75_col6, #T_56dd5_row75_col7, #T_56dd5_row75_col8 {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "</style>\n",
-       "<table id=\"T_56dd5\">\n",
-       "  <thead>\n",
-       "    <tr>\n",
-       "      <th id=\"T_56dd5_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
-       "      <th id=\"T_56dd5_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
-       "      <th id=\"T_56dd5_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
-       "      <th id=\"T_56dd5_level0_col3\" class=\"col_heading level0 col3\" >Has Figure</th>\n",
-       "      <th id=\"T_56dd5_level0_col4\" class=\"col_heading level0 col4\" >Has Table</th>\n",
-       "      <th id=\"T_56dd5_level0_col5\" class=\"col_heading level0 col5\" >Required Inputs</th>\n",
-       "      <th id=\"T_56dd5_level0_col6\" class=\"col_heading level0 col6\" >Params</th>\n",
-       "      <th id=\"T_56dd5_level0_col7\" class=\"col_heading level0 col7\" >Tags</th>\n",
-       "      <th id=\"T_56dd5_level0_col8\" class=\"col_heading level0 col8\" >Tasks</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row0_col0\" class=\"data row0 col0\" >validmind.data_validation.BivariateScatterPlots</td>\n",
-       "      <td id=\"T_56dd5_row0_col1\" class=\"data row0 col1\" >Bivariate Scatter Plots</td>\n",
-       "      <td id=\"T_56dd5_row0_col2\" class=\"data row0 col2\" >Generates bivariate scatterplots to visually inspect relationships between pairs of numerical predictor variables...</td>\n",
-       "      <td id=\"T_56dd5_row0_col3\" class=\"data row0 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row0_col4\" class=\"data row0 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row0_col5\" class=\"data row0 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row0_col6\" class=\"data row0 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row0_col7\" class=\"data row0 col7\" >['tabular_data', 'numerical_data', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row0_col8\" class=\"data row0 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row1_col0\" class=\"data row1 col0\" >validmind.data_validation.ChiSquaredFeaturesTable</td>\n",
-       "      <td id=\"T_56dd5_row1_col1\" class=\"data row1 col1\" >Chi Squared Features Table</td>\n",
-       "      <td id=\"T_56dd5_row1_col2\" class=\"data row1 col2\" >Assesses the statistical association between categorical features and a target variable using the Chi-Squared test....</td>\n",
-       "      <td id=\"T_56dd5_row1_col3\" class=\"data row1 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row1_col4\" class=\"data row1 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row1_col5\" class=\"data row1 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row1_col6\" class=\"data row1 col6\" >{'p_threshold': {'type': '_empty', 'default': 0.05}}</td>\n",
-       "      <td id=\"T_56dd5_row1_col7\" class=\"data row1 col7\" >['tabular_data', 'categorical_data', 'statistical_test']</td>\n",
-       "      <td id=\"T_56dd5_row1_col8\" class=\"data row1 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row2_col0\" class=\"data row2 col0\" >validmind.data_validation.ClassImbalance</td>\n",
-       "      <td id=\"T_56dd5_row2_col1\" class=\"data row2 col1\" >Class Imbalance</td>\n",
-       "      <td id=\"T_56dd5_row2_col2\" class=\"data row2 col2\" >Evaluates and quantifies class distribution imbalance in a dataset used by a machine learning model....</td>\n",
-       "      <td id=\"T_56dd5_row2_col3\" class=\"data row2 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row2_col4\" class=\"data row2 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row2_col5\" class=\"data row2 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row2_col6\" class=\"data row2 col6\" >{'min_percent_threshold': {'type': 'int', 'default': 10}}</td>\n",
-       "      <td id=\"T_56dd5_row2_col7\" class=\"data row2 col7\" >['tabular_data', 'binary_classification', 'multiclass_classification', 'data_quality']</td>\n",
-       "      <td id=\"T_56dd5_row2_col8\" class=\"data row2 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row3_col0\" class=\"data row3 col0\" >validmind.data_validation.DatasetDescription</td>\n",
-       "      <td id=\"T_56dd5_row3_col1\" class=\"data row3 col1\" >Dataset Description</td>\n",
-       "      <td id=\"T_56dd5_row3_col2\" class=\"data row3 col2\" >Provides comprehensive analysis and statistical summaries of each column in a machine learning model's dataset....</td>\n",
-       "      <td id=\"T_56dd5_row3_col3\" class=\"data row3 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row3_col4\" class=\"data row3 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row3_col5\" class=\"data row3 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row3_col6\" class=\"data row3 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row3_col7\" class=\"data row3 col7\" >['tabular_data', 'time_series_data', 'text_data']</td>\n",
-       "      <td id=\"T_56dd5_row3_col8\" class=\"data row3 col8\" >['classification', 'regression', 'text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row4_col0\" class=\"data row4 col0\" >validmind.data_validation.DatasetSplit</td>\n",
-       "      <td id=\"T_56dd5_row4_col1\" class=\"data row4 col1\" >Dataset Split</td>\n",
-       "      <td id=\"T_56dd5_row4_col2\" class=\"data row4 col2\" >Evaluates and visualizes the distribution proportions among training, testing, and validation datasets of an ML...</td>\n",
-       "      <td id=\"T_56dd5_row4_col3\" class=\"data row4 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row4_col4\" class=\"data row4 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row4_col5\" class=\"data row4 col5\" >['datasets']</td>\n",
-       "      <td id=\"T_56dd5_row4_col6\" class=\"data row4 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row4_col7\" class=\"data row4 col7\" >['tabular_data', 'time_series_data', 'text_data']</td>\n",
-       "      <td id=\"T_56dd5_row4_col8\" class=\"data row4 col8\" >['classification', 'regression', 'text_classification', 'text_summarization']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row5_col0\" class=\"data row5 col0\" >validmind.data_validation.DescriptiveStatistics</td>\n",
-       "      <td id=\"T_56dd5_row5_col1\" class=\"data row5 col1\" >Descriptive Statistics</td>\n",
-       "      <td id=\"T_56dd5_row5_col2\" class=\"data row5 col2\" >Performs a detailed descriptive statistical analysis of both numerical and categorical data within a model's...</td>\n",
-       "      <td id=\"T_56dd5_row5_col3\" class=\"data row5 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row5_col4\" class=\"data row5 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row5_col5\" class=\"data row5 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row5_col6\" class=\"data row5 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row5_col7\" class=\"data row5 col7\" >['tabular_data', 'time_series_data', 'data_quality']</td>\n",
-       "      <td id=\"T_56dd5_row5_col8\" class=\"data row5 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row6_col0\" class=\"data row6 col0\" >validmind.data_validation.Duplicates</td>\n",
-       "      <td id=\"T_56dd5_row6_col1\" class=\"data row6 col1\" >Duplicates</td>\n",
-       "      <td id=\"T_56dd5_row6_col2\" class=\"data row6 col2\" >Tests dataset for duplicate entries, ensuring model reliability via data quality verification....</td>\n",
-       "      <td id=\"T_56dd5_row6_col3\" class=\"data row6 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row6_col4\" class=\"data row6 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row6_col5\" class=\"data row6 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row6_col6\" class=\"data row6 col6\" >{'min_threshold': {'type': '_empty', 'default': 1}}</td>\n",
-       "      <td id=\"T_56dd5_row6_col7\" class=\"data row6 col7\" >['tabular_data', 'data_quality', 'text_data']</td>\n",
-       "      <td id=\"T_56dd5_row6_col8\" class=\"data row6 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row7_col0\" class=\"data row7 col0\" >validmind.data_validation.FeatureTargetCorrelationPlot</td>\n",
-       "      <td id=\"T_56dd5_row7_col1\" class=\"data row7 col1\" >Feature Target Correlation Plot</td>\n",
-       "      <td id=\"T_56dd5_row7_col2\" class=\"data row7 col2\" >Visualizes the correlation between input features and the model's target output in a color-coded horizontal bar...</td>\n",
-       "      <td id=\"T_56dd5_row7_col3\" class=\"data row7 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row7_col4\" class=\"data row7 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row7_col5\" class=\"data row7 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row7_col6\" class=\"data row7 col6\" >{'fig_height': {'type': '_empty', 'default': 600}}</td>\n",
-       "      <td id=\"T_56dd5_row7_col7\" class=\"data row7 col7\" >['tabular_data', 'visualization', 'correlation']</td>\n",
-       "      <td id=\"T_56dd5_row7_col8\" class=\"data row7 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row8_col0\" class=\"data row8 col0\" >validmind.data_validation.HighCardinality</td>\n",
-       "      <td id=\"T_56dd5_row8_col1\" class=\"data row8 col1\" >High Cardinality</td>\n",
-       "      <td id=\"T_56dd5_row8_col2\" class=\"data row8 col2\" >Assesses the number of unique values in categorical columns to detect high cardinality and potential overfitting....</td>\n",
-       "      <td id=\"T_56dd5_row8_col3\" class=\"data row8 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row8_col4\" class=\"data row8 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row8_col5\" class=\"data row8 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row8_col6\" class=\"data row8 col6\" >{'num_threshold': {'type': 'int', 'default': 100}, 'percent_threshold': {'type': 'float', 'default': 0.1}, 'threshold_type': {'type': 'str', 'default': 'percent'}}</td>\n",
-       "      <td id=\"T_56dd5_row8_col7\" class=\"data row8 col7\" >['tabular_data', 'data_quality', 'categorical_data']</td>\n",
-       "      <td id=\"T_56dd5_row8_col8\" class=\"data row8 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row9_col0\" class=\"data row9 col0\" >validmind.data_validation.HighPearsonCorrelation</td>\n",
-       "      <td id=\"T_56dd5_row9_col1\" class=\"data row9 col1\" >High Pearson Correlation</td>\n",
-       "      <td id=\"T_56dd5_row9_col2\" class=\"data row9 col2\" >Identifies highly correlated feature pairs in a dataset suggesting feature redundancy or multicollinearity....</td>\n",
-       "      <td id=\"T_56dd5_row9_col3\" class=\"data row9 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row9_col4\" class=\"data row9 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row9_col5\" class=\"data row9 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row9_col6\" class=\"data row9 col6\" >{'max_threshold': {'type': 'float', 'default': 0.3}, 'top_n_correlations': {'type': 'int', 'default': 10}, 'feature_columns': {'type': 'list', 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row9_col7\" class=\"data row9 col7\" >['tabular_data', 'data_quality', 'correlation']</td>\n",
-       "      <td id=\"T_56dd5_row9_col8\" class=\"data row9 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row10_col0\" class=\"data row10 col0\" >validmind.data_validation.IQROutliersBarPlot</td>\n",
-       "      <td id=\"T_56dd5_row10_col1\" class=\"data row10 col1\" >IQR Outliers Bar Plot</td>\n",
-       "      <td id=\"T_56dd5_row10_col2\" class=\"data row10 col2\" >Visualizes outlier distribution across percentiles in numerical data using the Interquartile Range (IQR) method....</td>\n",
-       "      <td id=\"T_56dd5_row10_col3\" class=\"data row10 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row10_col4\" class=\"data row10 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row10_col5\" class=\"data row10 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row10_col6\" class=\"data row10 col6\" >{'threshold': {'type': 'float', 'default': 1.5}, 'fig_width': {'type': 'int', 'default': 800}}</td>\n",
-       "      <td id=\"T_56dd5_row10_col7\" class=\"data row10 col7\" >['tabular_data', 'visualization', 'numerical_data']</td>\n",
-       "      <td id=\"T_56dd5_row10_col8\" class=\"data row10 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row11_col0\" class=\"data row11 col0\" >validmind.data_validation.IQROutliersTable</td>\n",
-       "      <td id=\"T_56dd5_row11_col1\" class=\"data row11 col1\" >IQR Outliers Table</td>\n",
-       "      <td id=\"T_56dd5_row11_col2\" class=\"data row11 col2\" >Determines and summarizes outliers in numerical features using the Interquartile Range method....</td>\n",
-       "      <td id=\"T_56dd5_row11_col3\" class=\"data row11 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row11_col4\" class=\"data row11 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row11_col5\" class=\"data row11 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row11_col6\" class=\"data row11 col6\" >{'threshold': {'type': 'float', 'default': 1.5}}</td>\n",
-       "      <td id=\"T_56dd5_row11_col7\" class=\"data row11 col7\" >['tabular_data', 'numerical_data']</td>\n",
-       "      <td id=\"T_56dd5_row11_col8\" class=\"data row11 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row12_col0\" class=\"data row12 col0\" >validmind.data_validation.IsolationForestOutliers</td>\n",
-       "      <td id=\"T_56dd5_row12_col1\" class=\"data row12 col1\" >Isolation Forest Outliers</td>\n",
-       "      <td id=\"T_56dd5_row12_col2\" class=\"data row12 col2\" >Detects outliers in a dataset using the Isolation Forest algorithm and visualizes results through scatter plots....</td>\n",
-       "      <td id=\"T_56dd5_row12_col3\" class=\"data row12 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row12_col4\" class=\"data row12 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row12_col5\" class=\"data row12 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row12_col6\" class=\"data row12 col6\" >{'random_state': {'type': 'int', 'default': 0}, 'contamination': {'type': 'float', 'default': 0.1}, 'feature_columns': {'type': 'list', 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row12_col7\" class=\"data row12 col7\" >['tabular_data', 'anomaly_detection']</td>\n",
-       "      <td id=\"T_56dd5_row12_col8\" class=\"data row12 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row13_col0\" class=\"data row13 col0\" >validmind.data_validation.JarqueBera</td>\n",
-       "      <td id=\"T_56dd5_row13_col1\" class=\"data row13 col1\" >Jarque Bera</td>\n",
-       "      <td id=\"T_56dd5_row13_col2\" class=\"data row13 col2\" >Assesses normality of dataset features in an ML model using the Jarque-Bera test....</td>\n",
-       "      <td id=\"T_56dd5_row13_col3\" class=\"data row13 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row13_col4\" class=\"data row13 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row13_col5\" class=\"data row13 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row13_col6\" class=\"data row13 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row13_col7\" class=\"data row13 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_56dd5_row13_col8\" class=\"data row13 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row14_col0\" class=\"data row14 col0\" >validmind.data_validation.MissingValues</td>\n",
-       "      <td id=\"T_56dd5_row14_col1\" class=\"data row14 col1\" >Missing Values</td>\n",
-       "      <td id=\"T_56dd5_row14_col2\" class=\"data row14 col2\" >Evaluates dataset quality by ensuring missing value ratio across all features does not exceed a set threshold....</td>\n",
-       "      <td id=\"T_56dd5_row14_col3\" class=\"data row14 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row14_col4\" class=\"data row14 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row14_col5\" class=\"data row14 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row14_col6\" class=\"data row14 col6\" >{'min_threshold': {'type': 'int', 'default': 1}}</td>\n",
-       "      <td id=\"T_56dd5_row14_col7\" class=\"data row14 col7\" >['tabular_data', 'data_quality']</td>\n",
-       "      <td id=\"T_56dd5_row14_col8\" class=\"data row14 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row15_col0\" class=\"data row15 col0\" >validmind.data_validation.MissingValuesBarPlot</td>\n",
-       "      <td id=\"T_56dd5_row15_col1\" class=\"data row15 col1\" >Missing Values Bar Plot</td>\n",
-       "      <td id=\"T_56dd5_row15_col2\" class=\"data row15 col2\" >Assesses the percentage and distribution of missing values in the dataset via a bar plot, with emphasis on...</td>\n",
-       "      <td id=\"T_56dd5_row15_col3\" class=\"data row15 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row15_col4\" class=\"data row15 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row15_col5\" class=\"data row15 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row15_col6\" class=\"data row15 col6\" >{'threshold': {'type': 'int', 'default': 80}, 'fig_height': {'type': 'int', 'default': 600}}</td>\n",
-       "      <td id=\"T_56dd5_row15_col7\" class=\"data row15 col7\" >['tabular_data', 'data_quality', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row15_col8\" class=\"data row15 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row16_col0\" class=\"data row16 col0\" >validmind.data_validation.MutualInformation</td>\n",
-       "      <td id=\"T_56dd5_row16_col1\" class=\"data row16 col1\" >Mutual Information</td>\n",
-       "      <td id=\"T_56dd5_row16_col2\" class=\"data row16 col2\" >Calculates mutual information scores between features and target variable to evaluate feature relevance....</td>\n",
-       "      <td id=\"T_56dd5_row16_col3\" class=\"data row16 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row16_col4\" class=\"data row16 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row16_col5\" class=\"data row16 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row16_col6\" class=\"data row16 col6\" >{'min_threshold': {'type': 'float', 'default': 0.01}, 'task': {'type': 'str', 'default': 'classification'}}</td>\n",
-       "      <td id=\"T_56dd5_row16_col7\" class=\"data row16 col7\" >['feature_selection', 'data_analysis']</td>\n",
-       "      <td id=\"T_56dd5_row16_col8\" class=\"data row16 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row17_col0\" class=\"data row17 col0\" >validmind.data_validation.PearsonCorrelationMatrix</td>\n",
-       "      <td id=\"T_56dd5_row17_col1\" class=\"data row17 col1\" >Pearson Correlation Matrix</td>\n",
-       "      <td id=\"T_56dd5_row17_col2\" class=\"data row17 col2\" >Evaluates linear dependency between numerical variables in a dataset via a Pearson Correlation coefficient heat map....</td>\n",
-       "      <td id=\"T_56dd5_row17_col3\" class=\"data row17 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row17_col4\" class=\"data row17 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row17_col5\" class=\"data row17 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row17_col6\" class=\"data row17 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row17_col7\" class=\"data row17 col7\" >['tabular_data', 'numerical_data', 'correlation']</td>\n",
-       "      <td id=\"T_56dd5_row17_col8\" class=\"data row17 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row18_col0\" class=\"data row18 col0\" >validmind.data_validation.ProtectedClassesDescription</td>\n",
-       "      <td id=\"T_56dd5_row18_col1\" class=\"data row18 col1\" >Protected Classes Description</td>\n",
-       "      <td id=\"T_56dd5_row18_col2\" class=\"data row18 col2\" >Visualizes the distribution of protected classes in the dataset relative to the target variable...</td>\n",
-       "      <td id=\"T_56dd5_row18_col3\" class=\"data row18 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row18_col4\" class=\"data row18 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row18_col5\" class=\"data row18 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row18_col6\" class=\"data row18 col6\" >{'protected_classes': {'type': '_empty', 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row18_col7\" class=\"data row18 col7\" >['bias_and_fairness', 'descriptive_statistics']</td>\n",
-       "      <td id=\"T_56dd5_row18_col8\" class=\"data row18 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row19_col0\" class=\"data row19 col0\" >validmind.data_validation.RunsTest</td>\n",
-       "      <td id=\"T_56dd5_row19_col1\" class=\"data row19 col1\" >Runs Test</td>\n",
-       "      <td id=\"T_56dd5_row19_col2\" class=\"data row19 col2\" >Executes Runs Test on ML model to detect non-random patterns in output data sequence....</td>\n",
-       "      <td id=\"T_56dd5_row19_col3\" class=\"data row19 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row19_col4\" class=\"data row19 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row19_col5\" class=\"data row19 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row19_col6\" class=\"data row19 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row19_col7\" class=\"data row19 col7\" >['tabular_data', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_56dd5_row19_col8\" class=\"data row19 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row20_col0\" class=\"data row20 col0\" >validmind.data_validation.ScatterPlot</td>\n",
-       "      <td id=\"T_56dd5_row20_col1\" class=\"data row20 col1\" >Scatter Plot</td>\n",
-       "      <td id=\"T_56dd5_row20_col2\" class=\"data row20 col2\" >Assesses visual relationships, patterns, and outliers among features in a dataset through scatter plot matrices....</td>\n",
-       "      <td id=\"T_56dd5_row20_col3\" class=\"data row20 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row20_col4\" class=\"data row20 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row20_col5\" class=\"data row20 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row20_col6\" class=\"data row20 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row20_col7\" class=\"data row20 col7\" >['tabular_data', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row20_col8\" class=\"data row20 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row21_col0\" class=\"data row21 col0\" >validmind.data_validation.ScoreBandDefaultRates</td>\n",
-       "      <td id=\"T_56dd5_row21_col1\" class=\"data row21 col1\" >Score Band Default Rates</td>\n",
-       "      <td id=\"T_56dd5_row21_col2\" class=\"data row21 col2\" >Analyzes default rates and population distribution across credit score bands....</td>\n",
-       "      <td id=\"T_56dd5_row21_col3\" class=\"data row21 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row21_col4\" class=\"data row21 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row21_col5\" class=\"data row21 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row21_col6\" class=\"data row21 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'score_bands': {'type': 'list', 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row21_col7\" class=\"data row21 col7\" >['visualization', 'credit_risk', 'scorecard']</td>\n",
-       "      <td id=\"T_56dd5_row21_col8\" class=\"data row21 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row22_col0\" class=\"data row22 col0\" >validmind.data_validation.ShapiroWilk</td>\n",
-       "      <td id=\"T_56dd5_row22_col1\" class=\"data row22 col1\" >Shapiro Wilk</td>\n",
-       "      <td id=\"T_56dd5_row22_col2\" class=\"data row22 col2\" >Evaluates feature-wise normality of training data using the Shapiro-Wilk test....</td>\n",
-       "      <td id=\"T_56dd5_row22_col3\" class=\"data row22 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row22_col4\" class=\"data row22 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row22_col5\" class=\"data row22 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row22_col6\" class=\"data row22 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row22_col7\" class=\"data row22 col7\" >['tabular_data', 'data_distribution', 'statistical_test']</td>\n",
-       "      <td id=\"T_56dd5_row22_col8\" class=\"data row22 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row23_col0\" class=\"data row23 col0\" >validmind.data_validation.Skewness</td>\n",
-       "      <td id=\"T_56dd5_row23_col1\" class=\"data row23 col1\" >Skewness</td>\n",
-       "      <td id=\"T_56dd5_row23_col2\" class=\"data row23 col2\" >Evaluates the skewness of numerical data in a dataset to check against a defined threshold, aiming to ensure data...</td>\n",
-       "      <td id=\"T_56dd5_row23_col3\" class=\"data row23 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row23_col4\" class=\"data row23 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row23_col5\" class=\"data row23 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row23_col6\" class=\"data row23 col6\" >{'max_threshold': {'type': '_empty', 'default': 1}}</td>\n",
-       "      <td id=\"T_56dd5_row23_col7\" class=\"data row23 col7\" >['data_quality', 'tabular_data']</td>\n",
-       "      <td id=\"T_56dd5_row23_col8\" class=\"data row23 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row24_col0\" class=\"data row24 col0\" >validmind.data_validation.TabularCategoricalBarPlots</td>\n",
-       "      <td id=\"T_56dd5_row24_col1\" class=\"data row24 col1\" >Tabular Categorical Bar Plots</td>\n",
-       "      <td id=\"T_56dd5_row24_col2\" class=\"data row24 col2\" >Generates and visualizes bar plots for each category in categorical features to evaluate the dataset's composition....</td>\n",
-       "      <td id=\"T_56dd5_row24_col3\" class=\"data row24 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row24_col4\" class=\"data row24 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row24_col5\" class=\"data row24 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row24_col6\" class=\"data row24 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row24_col7\" class=\"data row24 col7\" >['tabular_data', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row24_col8\" class=\"data row24 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row25_col0\" class=\"data row25 col0\" >validmind.data_validation.TabularDateTimeHistograms</td>\n",
-       "      <td id=\"T_56dd5_row25_col1\" class=\"data row25 col1\" >Tabular Date Time Histograms</td>\n",
-       "      <td id=\"T_56dd5_row25_col2\" class=\"data row25 col2\" >Generates histograms to provide graphical insight into the distribution of time intervals in a model's datetime...</td>\n",
-       "      <td id=\"T_56dd5_row25_col3\" class=\"data row25 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row25_col4\" class=\"data row25 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row25_col5\" class=\"data row25 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row25_col6\" class=\"data row25 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row25_col7\" class=\"data row25 col7\" >['time_series_data', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row25_col8\" class=\"data row25 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row26_col0\" class=\"data row26 col0\" >validmind.data_validation.TabularDescriptionTables</td>\n",
-       "      <td id=\"T_56dd5_row26_col1\" class=\"data row26 col1\" >Tabular Description Tables</td>\n",
-       "      <td id=\"T_56dd5_row26_col2\" class=\"data row26 col2\" >Summarizes key descriptive statistics for numerical, categorical, and datetime variables in a dataset....</td>\n",
-       "      <td id=\"T_56dd5_row26_col3\" class=\"data row26 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row26_col4\" class=\"data row26 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row26_col5\" class=\"data row26 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row26_col6\" class=\"data row26 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row26_col7\" class=\"data row26 col7\" >['tabular_data']</td>\n",
-       "      <td id=\"T_56dd5_row26_col8\" class=\"data row26 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row27_col0\" class=\"data row27 col0\" >validmind.data_validation.TabularNumericalHistograms</td>\n",
-       "      <td id=\"T_56dd5_row27_col1\" class=\"data row27 col1\" >Tabular Numerical Histograms</td>\n",
-       "      <td id=\"T_56dd5_row27_col2\" class=\"data row27 col2\" >Generates histograms for each numerical feature in a dataset to provide visual insights into data distribution and...</td>\n",
-       "      <td id=\"T_56dd5_row27_col3\" class=\"data row27 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row27_col4\" class=\"data row27 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row27_col5\" class=\"data row27 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row27_col6\" class=\"data row27 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row27_col7\" class=\"data row27 col7\" >['tabular_data', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row27_col8\" class=\"data row27 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row28_col0\" class=\"data row28 col0\" >validmind.data_validation.TargetRateBarPlots</td>\n",
-       "      <td id=\"T_56dd5_row28_col1\" class=\"data row28 col1\" >Target Rate Bar Plots</td>\n",
-       "      <td id=\"T_56dd5_row28_col2\" class=\"data row28 col2\" >Generates bar plots visualizing the default rates of categorical features for a classification machine learning...</td>\n",
-       "      <td id=\"T_56dd5_row28_col3\" class=\"data row28 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row28_col4\" class=\"data row28 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row28_col5\" class=\"data row28 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row28_col6\" class=\"data row28 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row28_col7\" class=\"data row28 col7\" >['tabular_data', 'visualization', 'categorical_data']</td>\n",
-       "      <td id=\"T_56dd5_row28_col8\" class=\"data row28 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row29_col0\" class=\"data row29 col0\" >validmind.data_validation.TooManyZeroValues</td>\n",
-       "      <td id=\"T_56dd5_row29_col1\" class=\"data row29 col1\" >Too Many Zero Values</td>\n",
-       "      <td id=\"T_56dd5_row29_col2\" class=\"data row29 col2\" >Identifies numerical columns in a dataset that contain an excessive number of zero values, defined by a threshold...</td>\n",
-       "      <td id=\"T_56dd5_row29_col3\" class=\"data row29 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row29_col4\" class=\"data row29 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row29_col5\" class=\"data row29 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row29_col6\" class=\"data row29 col6\" >{'max_percent_threshold': {'type': 'float', 'default': 0.03}}</td>\n",
-       "      <td id=\"T_56dd5_row29_col7\" class=\"data row29 col7\" >['tabular_data']</td>\n",
-       "      <td id=\"T_56dd5_row29_col8\" class=\"data row29 col8\" >['regression', 'classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row30_col0\" class=\"data row30 col0\" >validmind.data_validation.UniqueRows</td>\n",
-       "      <td id=\"T_56dd5_row30_col1\" class=\"data row30 col1\" >Unique Rows</td>\n",
-       "      <td id=\"T_56dd5_row30_col2\" class=\"data row30 col2\" >Verifies the diversity of the dataset by ensuring that the count of unique rows exceeds a prescribed threshold....</td>\n",
-       "      <td id=\"T_56dd5_row30_col3\" class=\"data row30 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row30_col4\" class=\"data row30 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row30_col5\" class=\"data row30 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row30_col6\" class=\"data row30 col6\" >{'min_percent_threshold': {'type': 'float', 'default': 1}}</td>\n",
-       "      <td id=\"T_56dd5_row30_col7\" class=\"data row30 col7\" >['tabular_data']</td>\n",
-       "      <td id=\"T_56dd5_row30_col8\" class=\"data row30 col8\" >['regression', 'classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row31_col0\" class=\"data row31 col0\" >validmind.data_validation.WOEBinPlots</td>\n",
-       "      <td id=\"T_56dd5_row31_col1\" class=\"data row31 col1\" >WOE Bin Plots</td>\n",
-       "      <td id=\"T_56dd5_row31_col2\" class=\"data row31 col2\" >Generates visualizations of Weight of Evidence (WoE) and Information Value (IV) for understanding predictive power...</td>\n",
-       "      <td id=\"T_56dd5_row31_col3\" class=\"data row31 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row31_col4\" class=\"data row31 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row31_col5\" class=\"data row31 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row31_col6\" class=\"data row31 col6\" >{'breaks_adj': {'type': 'list', 'default': None}, 'fig_height': {'type': 'int', 'default': 600}, 'fig_width': {'type': 'int', 'default': 500}}</td>\n",
-       "      <td id=\"T_56dd5_row31_col7\" class=\"data row31 col7\" >['tabular_data', 'visualization', 'categorical_data']</td>\n",
-       "      <td id=\"T_56dd5_row31_col8\" class=\"data row31 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row32_col0\" class=\"data row32 col0\" >validmind.data_validation.WOEBinTable</td>\n",
-       "      <td id=\"T_56dd5_row32_col1\" class=\"data row32 col1\" >WOE Bin Table</td>\n",
-       "      <td id=\"T_56dd5_row32_col2\" class=\"data row32 col2\" >Assesses the Weight of Evidence (WoE) and Information Value (IV) of each feature to evaluate its predictive power...</td>\n",
-       "      <td id=\"T_56dd5_row32_col3\" class=\"data row32 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row32_col4\" class=\"data row32 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row32_col5\" class=\"data row32 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row32_col6\" class=\"data row32 col6\" >{'breaks_adj': {'type': 'list', 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row32_col7\" class=\"data row32 col7\" >['tabular_data', 'categorical_data']</td>\n",
-       "      <td id=\"T_56dd5_row32_col8\" class=\"data row32 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row33_col0\" class=\"data row33 col0\" >validmind.model_validation.FeaturesAUC</td>\n",
-       "      <td id=\"T_56dd5_row33_col1\" class=\"data row33 col1\" >Features AUC</td>\n",
-       "      <td id=\"T_56dd5_row33_col2\" class=\"data row33 col2\" >Evaluates the discriminatory power of each individual feature within a binary classification model by calculating...</td>\n",
-       "      <td id=\"T_56dd5_row33_col3\" class=\"data row33 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row33_col4\" class=\"data row33 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row33_col5\" class=\"data row33 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row33_col6\" class=\"data row33 col6\" >{'fontsize': {'type': 'int', 'default': 12}, 'figure_height': {'type': 'int', 'default': 500}}</td>\n",
-       "      <td id=\"T_56dd5_row33_col7\" class=\"data row33 col7\" >['feature_importance', 'AUC', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row33_col8\" class=\"data row33 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row34_col0\" class=\"data row34 col0\" >validmind.model_validation.sklearn.CalibrationCurve</td>\n",
-       "      <td id=\"T_56dd5_row34_col1\" class=\"data row34 col1\" >Calibration Curve</td>\n",
-       "      <td id=\"T_56dd5_row34_col2\" class=\"data row34 col2\" >Evaluates the calibration of probability estimates by comparing predicted probabilities against observed...</td>\n",
-       "      <td id=\"T_56dd5_row34_col3\" class=\"data row34 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row34_col4\" class=\"data row34 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row34_col5\" class=\"data row34 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row34_col6\" class=\"data row34 col6\" >{'n_bins': {'type': 'int', 'default': 10}}</td>\n",
-       "      <td id=\"T_56dd5_row34_col7\" class=\"data row34 col7\" >['sklearn', 'model_performance', 'classification']</td>\n",
-       "      <td id=\"T_56dd5_row34_col8\" class=\"data row34 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row35_col0\" class=\"data row35 col0\" >validmind.model_validation.sklearn.ClassifierPerformance</td>\n",
-       "      <td id=\"T_56dd5_row35_col1\" class=\"data row35 col1\" >Classifier Performance</td>\n",
-       "      <td id=\"T_56dd5_row35_col2\" class=\"data row35 col2\" >Evaluates performance of binary or multiclass classification models using precision, recall, F1-Score, accuracy,...</td>\n",
-       "      <td id=\"T_56dd5_row35_col3\" class=\"data row35 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row35_col4\" class=\"data row35 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row35_col5\" class=\"data row35 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row35_col6\" class=\"data row35 col6\" >{'average': {'type': 'str', 'default': 'macro'}}</td>\n",
-       "      <td id=\"T_56dd5_row35_col7\" class=\"data row35 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row35_col8\" class=\"data row35 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row36_col0\" class=\"data row36 col0\" >validmind.model_validation.sklearn.ClassifierThresholdOptimization</td>\n",
-       "      <td id=\"T_56dd5_row36_col1\" class=\"data row36 col1\" >Classifier Threshold Optimization</td>\n",
-       "      <td id=\"T_56dd5_row36_col2\" class=\"data row36 col2\" >Analyzes and visualizes different threshold optimization methods for binary classification models....</td>\n",
-       "      <td id=\"T_56dd5_row36_col3\" class=\"data row36 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row36_col4\" class=\"data row36 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row36_col5\" class=\"data row36 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row36_col6\" class=\"data row36 col6\" >{'methods': {'type': None, 'default': None}, 'target_recall': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row36_col7\" class=\"data row36 col7\" >['model_validation', 'threshold_optimization', 'classification_metrics']</td>\n",
-       "      <td id=\"T_56dd5_row36_col8\" class=\"data row36 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row37_col0\" class=\"data row37 col0\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
-       "      <td id=\"T_56dd5_row37_col1\" class=\"data row37 col1\" >Confusion Matrix</td>\n",
-       "      <td id=\"T_56dd5_row37_col2\" class=\"data row37 col2\" >Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix...</td>\n",
-       "      <td id=\"T_56dd5_row37_col3\" class=\"data row37 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row37_col4\" class=\"data row37 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row37_col5\" class=\"data row37 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row37_col6\" class=\"data row37 col6\" >{'threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_56dd5_row37_col7\" class=\"data row37 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row37_col8\" class=\"data row37 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row38_col0\" class=\"data row38 col0\" >validmind.model_validation.sklearn.HyperParametersTuning</td>\n",
-       "      <td id=\"T_56dd5_row38_col1\" class=\"data row38 col1\" >Hyper Parameters Tuning</td>\n",
-       "      <td id=\"T_56dd5_row38_col2\" class=\"data row38 col2\" >Performs exhaustive grid search over specified parameter ranges to find optimal model configurations...</td>\n",
-       "      <td id=\"T_56dd5_row38_col3\" class=\"data row38 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row38_col4\" class=\"data row38 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row38_col5\" class=\"data row38 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row38_col6\" class=\"data row38 col6\" >{'param_grid': {'type': 'dict', 'default': None}, 'scoring': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}, 'fit_params': {'type': 'dict', 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row38_col7\" class=\"data row38 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row38_col8\" class=\"data row38 col8\" >['clustering', 'classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row39_col0\" class=\"data row39 col0\" >validmind.model_validation.sklearn.MinimumAccuracy</td>\n",
-       "      <td id=\"T_56dd5_row39_col1\" class=\"data row39 col1\" >Minimum Accuracy</td>\n",
-       "      <td id=\"T_56dd5_row39_col2\" class=\"data row39 col2\" >Checks if the model's prediction accuracy meets or surpasses a specified threshold....</td>\n",
-       "      <td id=\"T_56dd5_row39_col3\" class=\"data row39 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row39_col4\" class=\"data row39 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row39_col5\" class=\"data row39 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row39_col6\" class=\"data row39 col6\" >{'min_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
-       "      <td id=\"T_56dd5_row39_col7\" class=\"data row39 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row39_col8\" class=\"data row39 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row40_col0\" class=\"data row40 col0\" >validmind.model_validation.sklearn.MinimumF1Score</td>\n",
-       "      <td id=\"T_56dd5_row40_col1\" class=\"data row40 col1\" >Minimum F1 Score</td>\n",
-       "      <td id=\"T_56dd5_row40_col2\" class=\"data row40 col2\" >Assesses if the model's F1 score on the validation set meets a predefined minimum threshold, ensuring balanced...</td>\n",
-       "      <td id=\"T_56dd5_row40_col3\" class=\"data row40 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row40_col4\" class=\"data row40 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row40_col5\" class=\"data row40 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row40_col6\" class=\"data row40 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_56dd5_row40_col7\" class=\"data row40 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row40_col8\" class=\"data row40 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row41_col0\" class=\"data row41 col0\" >validmind.model_validation.sklearn.MinimumROCAUCScore</td>\n",
-       "      <td id=\"T_56dd5_row41_col1\" class=\"data row41 col1\" >Minimum ROCAUC Score</td>\n",
-       "      <td id=\"T_56dd5_row41_col2\" class=\"data row41 col2\" >Validates model by checking if the ROC AUC score meets or surpasses a specified threshold....</td>\n",
-       "      <td id=\"T_56dd5_row41_col3\" class=\"data row41 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row41_col4\" class=\"data row41 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row41_col5\" class=\"data row41 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row41_col6\" class=\"data row41 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_56dd5_row41_col7\" class=\"data row41 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row41_col8\" class=\"data row41 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row42_col0\" class=\"data row42 col0\" >validmind.model_validation.sklearn.ModelParameters</td>\n",
-       "      <td id=\"T_56dd5_row42_col1\" class=\"data row42 col1\" >Model Parameters</td>\n",
-       "      <td id=\"T_56dd5_row42_col2\" class=\"data row42 col2\" >Extracts and displays model parameters in a structured format for transparency and reproducibility....</td>\n",
-       "      <td id=\"T_56dd5_row42_col3\" class=\"data row42 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row42_col4\" class=\"data row42 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row42_col5\" class=\"data row42 col5\" >['model']</td>\n",
-       "      <td id=\"T_56dd5_row42_col6\" class=\"data row42 col6\" >{'model_params': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row42_col7\" class=\"data row42 col7\" >['model_training', 'metadata']</td>\n",
-       "      <td id=\"T_56dd5_row42_col8\" class=\"data row42 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row43_col0\" class=\"data row43 col0\" >validmind.model_validation.sklearn.ModelsPerformanceComparison</td>\n",
-       "      <td id=\"T_56dd5_row43_col1\" class=\"data row43 col1\" >Models Performance Comparison</td>\n",
-       "      <td id=\"T_56dd5_row43_col2\" class=\"data row43 col2\" >Evaluates and compares the performance of multiple Machine Learning models using various metrics like accuracy,...</td>\n",
-       "      <td id=\"T_56dd5_row43_col3\" class=\"data row43 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row43_col4\" class=\"data row43 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row43_col5\" class=\"data row43 col5\" >['dataset', 'models']</td>\n",
-       "      <td id=\"T_56dd5_row43_col6\" class=\"data row43 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row43_col7\" class=\"data row43 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'model_comparison']</td>\n",
-       "      <td id=\"T_56dd5_row43_col8\" class=\"data row43 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row44_col0\" class=\"data row44 col0\" >validmind.model_validation.sklearn.OverfitDiagnosis</td>\n",
-       "      <td id=\"T_56dd5_row44_col1\" class=\"data row44 col1\" >Overfit Diagnosis</td>\n",
-       "      <td id=\"T_56dd5_row44_col2\" class=\"data row44 col2\" >Assesses potential overfitting in a model's predictions, identifying regions where performance between training and...</td>\n",
-       "      <td id=\"T_56dd5_row44_col3\" class=\"data row44 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row44_col4\" class=\"data row44 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row44_col5\" class=\"data row44 col5\" >['model', 'datasets']</td>\n",
-       "      <td id=\"T_56dd5_row44_col6\" class=\"data row44 col6\" >{'metric': {'type': 'str', 'default': None}, 'cut_off_threshold': {'type': 'float', 'default': 0.04}}</td>\n",
-       "      <td id=\"T_56dd5_row44_col7\" class=\"data row44 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'linear_regression', 'model_diagnosis']</td>\n",
-       "      <td id=\"T_56dd5_row44_col8\" class=\"data row44 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row45_col0\" class=\"data row45 col0\" >validmind.model_validation.sklearn.PermutationFeatureImportance</td>\n",
-       "      <td id=\"T_56dd5_row45_col1\" class=\"data row45 col1\" >Permutation Feature Importance</td>\n",
-       "      <td id=\"T_56dd5_row45_col2\" class=\"data row45 col2\" >Assesses the significance of each feature in a model by evaluating the impact on model performance when feature...</td>\n",
-       "      <td id=\"T_56dd5_row45_col3\" class=\"data row45 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row45_col4\" class=\"data row45 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row45_col5\" class=\"data row45 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row45_col6\" class=\"data row45 col6\" >{'fontsize': {'type': None, 'default': None}, 'figure_height': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row45_col7\" class=\"data row45 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row45_col8\" class=\"data row45 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row46_col0\" class=\"data row46 col0\" >validmind.model_validation.sklearn.PopulationStabilityIndex</td>\n",
-       "      <td id=\"T_56dd5_row46_col1\" class=\"data row46 col1\" >Population Stability Index</td>\n",
-       "      <td id=\"T_56dd5_row46_col2\" class=\"data row46 col2\" >Assesses the Population Stability Index (PSI) to quantify the stability of an ML model's predictions across...</td>\n",
-       "      <td id=\"T_56dd5_row46_col3\" class=\"data row46 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row46_col4\" class=\"data row46 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row46_col5\" class=\"data row46 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row46_col6\" class=\"data row46 col6\" >{'num_bins': {'type': 'int', 'default': 10}, 'mode': {'type': 'str', 'default': 'fixed'}}</td>\n",
-       "      <td id=\"T_56dd5_row46_col7\" class=\"data row46 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row46_col8\" class=\"data row46 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row47_col0\" class=\"data row47 col0\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
-       "      <td id=\"T_56dd5_row47_col1\" class=\"data row47 col1\" >Precision Recall Curve</td>\n",
-       "      <td id=\"T_56dd5_row47_col2\" class=\"data row47 col2\" >Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve....</td>\n",
-       "      <td id=\"T_56dd5_row47_col3\" class=\"data row47 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row47_col4\" class=\"data row47 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row47_col5\" class=\"data row47 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row47_col6\" class=\"data row47 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row47_col7\" class=\"data row47 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row47_col8\" class=\"data row47 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row48_col0\" class=\"data row48 col0\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
-       "      <td id=\"T_56dd5_row48_col1\" class=\"data row48 col1\" >ROC Curve</td>\n",
-       "      <td id=\"T_56dd5_row48_col2\" class=\"data row48 col2\" >Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic...</td>\n",
-       "      <td id=\"T_56dd5_row48_col3\" class=\"data row48 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row48_col4\" class=\"data row48 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row48_col5\" class=\"data row48 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row48_col6\" class=\"data row48 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row48_col7\" class=\"data row48 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row48_col8\" class=\"data row48 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row49_col0\" class=\"data row49 col0\" >validmind.model_validation.sklearn.RegressionErrors</td>\n",
-       "      <td id=\"T_56dd5_row49_col1\" class=\"data row49 col1\" >Regression Errors</td>\n",
-       "      <td id=\"T_56dd5_row49_col2\" class=\"data row49 col2\" >Assesses the performance and error distribution of a regression model using various error metrics....</td>\n",
-       "      <td id=\"T_56dd5_row49_col3\" class=\"data row49 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row49_col4\" class=\"data row49 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row49_col5\" class=\"data row49 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row49_col6\" class=\"data row49 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row49_col7\" class=\"data row49 col7\" >['sklearn', 'model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row49_col8\" class=\"data row49 col8\" >['regression', 'classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row50_col0\" class=\"data row50 col0\" >validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
-       "      <td id=\"T_56dd5_row50_col1\" class=\"data row50 col1\" >Robustness Diagnosis</td>\n",
-       "      <td id=\"T_56dd5_row50_col2\" class=\"data row50 col2\" >Assesses the robustness of a machine learning model by evaluating performance decay under noisy conditions....</td>\n",
-       "      <td id=\"T_56dd5_row50_col3\" class=\"data row50 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row50_col4\" class=\"data row50 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row50_col5\" class=\"data row50 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row50_col6\" class=\"data row50 col6\" >{'metric': {'type': 'str', 'default': None}, 'scaling_factor_std_dev_list': {'type': None, 'default': [0.1, 0.2, 0.3, 0.4, 0.5]}, 'performance_decay_threshold': {'type': 'float', 'default': 0.05}}</td>\n",
-       "      <td id=\"T_56dd5_row50_col7\" class=\"data row50 col7\" >['sklearn', 'model_diagnosis', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row50_col8\" class=\"data row50 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row51_col0\" class=\"data row51 col0\" >validmind.model_validation.sklearn.SHAPGlobalImportance</td>\n",
-       "      <td id=\"T_56dd5_row51_col1\" class=\"data row51 col1\" >SHAP Global Importance</td>\n",
-       "      <td id=\"T_56dd5_row51_col2\" class=\"data row51 col2\" >Evaluates and visualizes global feature importance using SHAP values for model explanation and risk identification....</td>\n",
-       "      <td id=\"T_56dd5_row51_col3\" class=\"data row51 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row51_col4\" class=\"data row51 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row51_col5\" class=\"data row51 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row51_col6\" class=\"data row51 col6\" >{'kernel_explainer_samples': {'type': 'int', 'default': 10}, 'tree_or_linear_explainer_samples': {'type': 'int', 'default': 200}, 'class_of_interest': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row51_col7\" class=\"data row51 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row51_col8\" class=\"data row51 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row52_col0\" class=\"data row52 col0\" >validmind.model_validation.sklearn.ScoreProbabilityAlignment</td>\n",
-       "      <td id=\"T_56dd5_row52_col1\" class=\"data row52 col1\" >Score Probability Alignment</td>\n",
-       "      <td id=\"T_56dd5_row52_col2\" class=\"data row52 col2\" >Analyzes the alignment between credit scores and predicted probabilities....</td>\n",
-       "      <td id=\"T_56dd5_row52_col3\" class=\"data row52 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row52_col4\" class=\"data row52 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row52_col5\" class=\"data row52 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row52_col6\" class=\"data row52 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'n_bins': {'type': 'int', 'default': 10}}</td>\n",
-       "      <td id=\"T_56dd5_row52_col7\" class=\"data row52 col7\" >['visualization', 'credit_risk', 'calibration']</td>\n",
-       "      <td id=\"T_56dd5_row52_col8\" class=\"data row52 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row53_col0\" class=\"data row53 col0\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
-       "      <td id=\"T_56dd5_row53_col1\" class=\"data row53 col1\" >Training Test Degradation</td>\n",
-       "      <td id=\"T_56dd5_row53_col2\" class=\"data row53 col2\" >Tests if model performance degradation between training and test datasets exceeds a predefined threshold....</td>\n",
-       "      <td id=\"T_56dd5_row53_col3\" class=\"data row53 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row53_col4\" class=\"data row53 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row53_col5\" class=\"data row53 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row53_col6\" class=\"data row53 col6\" >{'max_threshold': {'type': 'float', 'default': 0.1}}</td>\n",
-       "      <td id=\"T_56dd5_row53_col7\" class=\"data row53 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row53_col8\" class=\"data row53 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row54_col0\" class=\"data row54 col0\" >validmind.model_validation.sklearn.WeakspotsDiagnosis</td>\n",
-       "      <td id=\"T_56dd5_row54_col1\" class=\"data row54 col1\" >Weakspots Diagnosis</td>\n",
-       "      <td id=\"T_56dd5_row54_col2\" class=\"data row54 col2\" >Identifies and visualizes weak spots in a machine learning model's performance across various sections of the...</td>\n",
-       "      <td id=\"T_56dd5_row54_col3\" class=\"data row54 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row54_col4\" class=\"data row54 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row54_col5\" class=\"data row54 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row54_col6\" class=\"data row54 col6\" >{'features_columns': {'type': None, 'default': None}, 'metrics': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}}</td>\n",
-       "      <td id=\"T_56dd5_row54_col7\" class=\"data row54 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_diagnosis', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row54_col8\" class=\"data row54 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row55_col0\" class=\"data row55 col0\" >validmind.model_validation.statsmodels.CumulativePredictionProbabilities</td>\n",
-       "      <td id=\"T_56dd5_row55_col1\" class=\"data row55 col1\" >Cumulative Prediction Probabilities</td>\n",
-       "      <td id=\"T_56dd5_row55_col2\" class=\"data row55 col2\" >Visualizes cumulative probabilities of positive and negative classes for both training and testing in classification models....</td>\n",
-       "      <td id=\"T_56dd5_row55_col3\" class=\"data row55 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row55_col4\" class=\"data row55 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row55_col5\" class=\"data row55 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row55_col6\" class=\"data row55 col6\" >{'title': {'type': 'str', 'default': 'Cumulative Probabilities'}}</td>\n",
-       "      <td id=\"T_56dd5_row55_col7\" class=\"data row55 col7\" >['visualization', 'credit_risk']</td>\n",
-       "      <td id=\"T_56dd5_row55_col8\" class=\"data row55 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row56_col0\" class=\"data row56 col0\" >validmind.model_validation.statsmodels.GINITable</td>\n",
-       "      <td id=\"T_56dd5_row56_col1\" class=\"data row56 col1\" >GINI Table</td>\n",
-       "      <td id=\"T_56dd5_row56_col2\" class=\"data row56 col2\" >Evaluates classification model performance using AUC, GINI, and KS metrics for training and test datasets....</td>\n",
-       "      <td id=\"T_56dd5_row56_col3\" class=\"data row56 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row56_col4\" class=\"data row56 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row56_col5\" class=\"data row56 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row56_col6\" class=\"data row56 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row56_col7\" class=\"data row56 col7\" >['model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row56_col8\" class=\"data row56 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row57_col0\" class=\"data row57 col0\" >validmind.model_validation.statsmodels.KolmogorovSmirnov</td>\n",
-       "      <td id=\"T_56dd5_row57_col1\" class=\"data row57 col1\" >Kolmogorov Smirnov</td>\n",
-       "      <td id=\"T_56dd5_row57_col2\" class=\"data row57 col2\" >Assesses whether each feature in the dataset aligns with a normal distribution using the Kolmogorov-Smirnov test....</td>\n",
-       "      <td id=\"T_56dd5_row57_col3\" class=\"data row57 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row57_col4\" class=\"data row57 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row57_col5\" class=\"data row57 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row57_col6\" class=\"data row57 col6\" >{'dist': {'type': 'str', 'default': 'norm'}}</td>\n",
-       "      <td id=\"T_56dd5_row57_col7\" class=\"data row57 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_56dd5_row57_col8\" class=\"data row57 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row58_col0\" class=\"data row58 col0\" >validmind.model_validation.statsmodels.Lilliefors</td>\n",
-       "      <td id=\"T_56dd5_row58_col1\" class=\"data row58 col1\" >Lilliefors</td>\n",
-       "      <td id=\"T_56dd5_row58_col2\" class=\"data row58 col2\" >Assesses the normality of feature distributions in an ML model's training dataset using the Lilliefors test....</td>\n",
-       "      <td id=\"T_56dd5_row58_col3\" class=\"data row58 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row58_col4\" class=\"data row58 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row58_col5\" class=\"data row58 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row58_col6\" class=\"data row58 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row58_col7\" class=\"data row58 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
-       "      <td id=\"T_56dd5_row58_col8\" class=\"data row58 col8\" >['classification', 'regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row59_col0\" class=\"data row59 col0\" >validmind.model_validation.statsmodels.PredictionProbabilitiesHistogram</td>\n",
-       "      <td id=\"T_56dd5_row59_col1\" class=\"data row59 col1\" >Prediction Probabilities Histogram</td>\n",
-       "      <td id=\"T_56dd5_row59_col2\" class=\"data row59 col2\" >Assesses the predictive probability distribution for binary classification to evaluate model performance and...</td>\n",
-       "      <td id=\"T_56dd5_row59_col3\" class=\"data row59 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row59_col4\" class=\"data row59 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row59_col5\" class=\"data row59 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row59_col6\" class=\"data row59 col6\" >{'title': {'type': 'str', 'default': 'Histogram of Predictive Probabilities'}}</td>\n",
-       "      <td id=\"T_56dd5_row59_col7\" class=\"data row59 col7\" >['visualization', 'credit_risk']</td>\n",
-       "      <td id=\"T_56dd5_row59_col8\" class=\"data row59 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row60_col0\" class=\"data row60 col0\" >validmind.model_validation.statsmodels.ScorecardHistogram</td>\n",
-       "      <td id=\"T_56dd5_row60_col1\" class=\"data row60 col1\" >Scorecard Histogram</td>\n",
-       "      <td id=\"T_56dd5_row60_col2\" class=\"data row60 col2\" >The Scorecard Histogram test evaluates the distribution of credit scores between default and non-default instances,...</td>\n",
-       "      <td id=\"T_56dd5_row60_col3\" class=\"data row60 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row60_col4\" class=\"data row60 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row60_col5\" class=\"data row60 col5\" >['dataset']</td>\n",
-       "      <td id=\"T_56dd5_row60_col6\" class=\"data row60 col6\" >{'title': {'type': 'str', 'default': 'Histogram of Scores'}, 'score_column': {'type': 'str', 'default': 'score'}}</td>\n",
-       "      <td id=\"T_56dd5_row60_col7\" class=\"data row60 col7\" >['visualization', 'credit_risk', 'logistic_regression']</td>\n",
-       "      <td id=\"T_56dd5_row60_col8\" class=\"data row60 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row61_col0\" class=\"data row61 col0\" >validmind.ongoing_monitoring.CalibrationCurveDrift</td>\n",
-       "      <td id=\"T_56dd5_row61_col1\" class=\"data row61 col1\" >Calibration Curve Drift</td>\n",
-       "      <td id=\"T_56dd5_row61_col2\" class=\"data row61 col2\" >Evaluates changes in probability calibration between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_56dd5_row61_col3\" class=\"data row61 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row61_col4\" class=\"data row61 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row61_col5\" class=\"data row61 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row61_col6\" class=\"data row61 col6\" >{'n_bins': {'type': 'int', 'default': 10}, 'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
-       "      <td id=\"T_56dd5_row61_col7\" class=\"data row61 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row61_col8\" class=\"data row61 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row62_col0\" class=\"data row62 col0\" >validmind.ongoing_monitoring.ClassDiscriminationDrift</td>\n",
-       "      <td id=\"T_56dd5_row62_col1\" class=\"data row62 col1\" >Class Discrimination Drift</td>\n",
-       "      <td id=\"T_56dd5_row62_col2\" class=\"data row62 col2\" >Compares classification discrimination metrics between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_56dd5_row62_col3\" class=\"data row62 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row62_col4\" class=\"data row62 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row62_col5\" class=\"data row62 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row62_col6\" class=\"data row62 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
-       "      <td id=\"T_56dd5_row62_col7\" class=\"data row62 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row62_col8\" class=\"data row62 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row63_col0\" class=\"data row63 col0\" >validmind.ongoing_monitoring.ClassImbalanceDrift</td>\n",
-       "      <td id=\"T_56dd5_row63_col1\" class=\"data row63 col1\" >Class Imbalance Drift</td>\n",
-       "      <td id=\"T_56dd5_row63_col2\" class=\"data row63 col2\" >Evaluates drift in class distribution between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_56dd5_row63_col3\" class=\"data row63 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row63_col4\" class=\"data row63 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row63_col5\" class=\"data row63 col5\" >['datasets']</td>\n",
-       "      <td id=\"T_56dd5_row63_col6\" class=\"data row63 col6\" >{'drift_pct_threshold': {'type': 'float', 'default': 5.0}, 'title': {'type': 'str', 'default': 'Class Distribution Drift'}}</td>\n",
-       "      <td id=\"T_56dd5_row63_col7\" class=\"data row63 col7\" >['tabular_data', 'binary_classification', 'multiclass_classification']</td>\n",
-       "      <td id=\"T_56dd5_row63_col8\" class=\"data row63 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row64_col0\" class=\"data row64 col0\" >validmind.ongoing_monitoring.ClassificationAccuracyDrift</td>\n",
-       "      <td id=\"T_56dd5_row64_col1\" class=\"data row64 col1\" >Classification Accuracy Drift</td>\n",
-       "      <td id=\"T_56dd5_row64_col2\" class=\"data row64 col2\" >Compares classification accuracy metrics between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_56dd5_row64_col3\" class=\"data row64 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row64_col4\" class=\"data row64 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row64_col5\" class=\"data row64 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row64_col6\" class=\"data row64 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
-       "      <td id=\"T_56dd5_row64_col7\" class=\"data row64 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row64_col8\" class=\"data row64 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row65_col0\" class=\"data row65 col0\" >validmind.ongoing_monitoring.ConfusionMatrixDrift</td>\n",
-       "      <td id=\"T_56dd5_row65_col1\" class=\"data row65 col1\" >Confusion Matrix Drift</td>\n",
-       "      <td id=\"T_56dd5_row65_col2\" class=\"data row65 col2\" >Compares confusion matrix metrics between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_56dd5_row65_col3\" class=\"data row65 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row65_col4\" class=\"data row65 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row65_col5\" class=\"data row65 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row65_col6\" class=\"data row65 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
-       "      <td id=\"T_56dd5_row65_col7\" class=\"data row65 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
-       "      <td id=\"T_56dd5_row65_col8\" class=\"data row65 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row66_col0\" class=\"data row66 col0\" >validmind.ongoing_monitoring.CumulativePredictionProbabilitiesDrift</td>\n",
-       "      <td id=\"T_56dd5_row66_col1\" class=\"data row66 col1\" >Cumulative Prediction Probabilities Drift</td>\n",
-       "      <td id=\"T_56dd5_row66_col2\" class=\"data row66 col2\" >Compares cumulative prediction probability distributions between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_56dd5_row66_col3\" class=\"data row66 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row66_col4\" class=\"data row66 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row66_col5\" class=\"data row66 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row66_col6\" class=\"data row66 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row66_col7\" class=\"data row66 col7\" >['visualization', 'credit_risk']</td>\n",
-       "      <td id=\"T_56dd5_row66_col8\" class=\"data row66 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row67_col0\" class=\"data row67 col0\" >validmind.ongoing_monitoring.PredictionProbabilitiesHistogramDrift</td>\n",
-       "      <td id=\"T_56dd5_row67_col1\" class=\"data row67 col1\" >Prediction Probabilities Histogram Drift</td>\n",
-       "      <td id=\"T_56dd5_row67_col2\" class=\"data row67 col2\" >Compares prediction probability distributions between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_56dd5_row67_col3\" class=\"data row67 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row67_col4\" class=\"data row67 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row67_col5\" class=\"data row67 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row67_col6\" class=\"data row67 col6\" >{'title': {'type': '_empty', 'default': 'Prediction Probabilities Histogram Drift'}, 'drift_pct_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
-       "      <td id=\"T_56dd5_row67_col7\" class=\"data row67 col7\" >['visualization', 'credit_risk']</td>\n",
-       "      <td id=\"T_56dd5_row67_col8\" class=\"data row67 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row68_col0\" class=\"data row68 col0\" >validmind.ongoing_monitoring.ROCCurveDrift</td>\n",
-       "      <td id=\"T_56dd5_row68_col1\" class=\"data row68 col1\" >ROC Curve Drift</td>\n",
-       "      <td id=\"T_56dd5_row68_col2\" class=\"data row68 col2\" >Compares ROC curves between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_56dd5_row68_col3\" class=\"data row68 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row68_col4\" class=\"data row68 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row68_col5\" class=\"data row68 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row68_col6\" class=\"data row68 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row68_col7\" class=\"data row68 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_56dd5_row68_col8\" class=\"data row68 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row69_col0\" class=\"data row69 col0\" >validmind.ongoing_monitoring.ScoreBandsDrift</td>\n",
-       "      <td id=\"T_56dd5_row69_col1\" class=\"data row69 col1\" >Score Bands Drift</td>\n",
-       "      <td id=\"T_56dd5_row69_col2\" class=\"data row69 col2\" >Analyzes drift in population distribution and default rates across score bands....</td>\n",
-       "      <td id=\"T_56dd5_row69_col3\" class=\"data row69 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row69_col4\" class=\"data row69 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row69_col5\" class=\"data row69 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row69_col6\" class=\"data row69 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'score_bands': {'type': 'list', 'default': None}, 'drift_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
-       "      <td id=\"T_56dd5_row69_col7\" class=\"data row69 col7\" >['visualization', 'credit_risk', 'scorecard']</td>\n",
-       "      <td id=\"T_56dd5_row69_col8\" class=\"data row69 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row70_col0\" class=\"data row70 col0\" >validmind.ongoing_monitoring.ScorecardHistogramDrift</td>\n",
-       "      <td id=\"T_56dd5_row70_col1\" class=\"data row70 col1\" >Scorecard Histogram Drift</td>\n",
-       "      <td id=\"T_56dd5_row70_col2\" class=\"data row70 col2\" >Compares score distributions between reference and monitoring datasets for each class....</td>\n",
-       "      <td id=\"T_56dd5_row70_col3\" class=\"data row70 col3\" >True</td>\n",
-       "      <td id=\"T_56dd5_row70_col4\" class=\"data row70 col4\" >True</td>\n",
-       "      <td id=\"T_56dd5_row70_col5\" class=\"data row70 col5\" >['datasets']</td>\n",
-       "      <td id=\"T_56dd5_row70_col6\" class=\"data row70 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'title': {'type': 'str', 'default': 'Scorecard Histogram Drift'}, 'drift_pct_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
-       "      <td id=\"T_56dd5_row70_col7\" class=\"data row70 col7\" >['visualization', 'credit_risk', 'logistic_regression']</td>\n",
-       "      <td id=\"T_56dd5_row70_col8\" class=\"data row70 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row71_col0\" class=\"data row71 col0\" >validmind.unit_metrics.classification.Accuracy</td>\n",
-       "      <td id=\"T_56dd5_row71_col1\" class=\"data row71 col1\" >Accuracy</td>\n",
-       "      <td id=\"T_56dd5_row71_col2\" class=\"data row71 col2\" >Calculates the accuracy of a model</td>\n",
-       "      <td id=\"T_56dd5_row71_col3\" class=\"data row71 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row71_col4\" class=\"data row71 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row71_col5\" class=\"data row71 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_56dd5_row71_col6\" class=\"data row71 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row71_col7\" class=\"data row71 col7\" >['classification']</td>\n",
-       "      <td id=\"T_56dd5_row71_col8\" class=\"data row71 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row72_col0\" class=\"data row72 col0\" >validmind.unit_metrics.classification.F1</td>\n",
-       "      <td id=\"T_56dd5_row72_col1\" class=\"data row72 col1\" >F1</td>\n",
-       "      <td id=\"T_56dd5_row72_col2\" class=\"data row72 col2\" >Calculates the F1 score for a classification model.</td>\n",
-       "      <td id=\"T_56dd5_row72_col3\" class=\"data row72 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row72_col4\" class=\"data row72 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row72_col5\" class=\"data row72 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row72_col6\" class=\"data row72 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row72_col7\" class=\"data row72 col7\" >['classification']</td>\n",
-       "      <td id=\"T_56dd5_row72_col8\" class=\"data row72 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row73_col0\" class=\"data row73 col0\" >validmind.unit_metrics.classification.Precision</td>\n",
-       "      <td id=\"T_56dd5_row73_col1\" class=\"data row73 col1\" >Precision</td>\n",
-       "      <td id=\"T_56dd5_row73_col2\" class=\"data row73 col2\" >Calculates the precision for a classification model.</td>\n",
-       "      <td id=\"T_56dd5_row73_col3\" class=\"data row73 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row73_col4\" class=\"data row73 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row73_col5\" class=\"data row73 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row73_col6\" class=\"data row73 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row73_col7\" class=\"data row73 col7\" >['classification']</td>\n",
-       "      <td id=\"T_56dd5_row73_col8\" class=\"data row73 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row74_col0\" class=\"data row74 col0\" >validmind.unit_metrics.classification.ROC_AUC</td>\n",
-       "      <td id=\"T_56dd5_row74_col1\" class=\"data row74 col1\" >ROC AUC</td>\n",
-       "      <td id=\"T_56dd5_row74_col2\" class=\"data row74 col2\" >Calculates the ROC AUC for a classification model.</td>\n",
-       "      <td id=\"T_56dd5_row74_col3\" class=\"data row74 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row74_col4\" class=\"data row74 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row74_col5\" class=\"data row74 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row74_col6\" class=\"data row74 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row74_col7\" class=\"data row74 col7\" >['classification']</td>\n",
-       "      <td id=\"T_56dd5_row74_col8\" class=\"data row74 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_56dd5_row75_col0\" class=\"data row75 col0\" >validmind.unit_metrics.classification.Recall</td>\n",
-       "      <td id=\"T_56dd5_row75_col1\" class=\"data row75 col1\" >Recall</td>\n",
-       "      <td id=\"T_56dd5_row75_col2\" class=\"data row75 col2\" >Calculates the recall for a classification model.</td>\n",
-       "      <td id=\"T_56dd5_row75_col3\" class=\"data row75 col3\" >False</td>\n",
-       "      <td id=\"T_56dd5_row75_col4\" class=\"data row75 col4\" >False</td>\n",
-       "      <td id=\"T_56dd5_row75_col5\" class=\"data row75 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_56dd5_row75_col6\" class=\"data row75 col6\" >{}</td>\n",
-       "      <td id=\"T_56dd5_row75_col7\" class=\"data row75 col7\" >['classification']</td>\n",
-       "      <td id=\"T_56dd5_row75_col8\" class=\"data row75 col8\" >['classification']</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n"
+      "cell_type": "code",
+      "execution_count": 6,
+      "metadata": {},
+      "outputs": [
+        {
+          "data": {
+            "text/html": [
+              "<style type=\"text/css\">\n",
+              "#T_326c3 th {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "#T_326c3_row0_col0, #T_326c3_row0_col1, #T_326c3_row0_col2, #T_326c3_row0_col3, #T_326c3_row0_col4, #T_326c3_row0_col5, #T_326c3_row0_col6, #T_326c3_row0_col7, #T_326c3_row0_col8, #T_326c3_row1_col0, #T_326c3_row1_col1, #T_326c3_row1_col2, #T_326c3_row1_col3, #T_326c3_row1_col4, #T_326c3_row1_col5, #T_326c3_row1_col6, #T_326c3_row1_col7, #T_326c3_row1_col8, #T_326c3_row2_col0, #T_326c3_row2_col1, #T_326c3_row2_col2, #T_326c3_row2_col3, #T_326c3_row2_col4, #T_326c3_row2_col5, #T_326c3_row2_col6, #T_326c3_row2_col7, #T_326c3_row2_col8, #T_326c3_row3_col0, #T_326c3_row3_col1, #T_326c3_row3_col2, #T_326c3_row3_col3, #T_326c3_row3_col4, #T_326c3_row3_col5, #T_326c3_row3_col6, #T_326c3_row3_col7, #T_326c3_row3_col8, #T_326c3_row4_col0, #T_326c3_row4_col1, #T_326c3_row4_col2, #T_326c3_row4_col3, #T_326c3_row4_col4, #T_326c3_row4_col5, #T_326c3_row4_col6, #T_326c3_row4_col7, #T_326c3_row4_col8, #T_326c3_row5_col0, #T_326c3_row5_col1, #T_326c3_row5_col2, #T_326c3_row5_col3, #T_326c3_row5_col4, #T_326c3_row5_col5, #T_326c3_row5_col6, #T_326c3_row5_col7, #T_326c3_row5_col8, #T_326c3_row6_col0, #T_326c3_row6_col1, #T_326c3_row6_col2, #T_326c3_row6_col3, #T_326c3_row6_col4, #T_326c3_row6_col5, #T_326c3_row6_col6, #T_326c3_row6_col7, #T_326c3_row6_col8, #T_326c3_row7_col0, #T_326c3_row7_col1, #T_326c3_row7_col2, #T_326c3_row7_col3, #T_326c3_row7_col4, #T_326c3_row7_col5, #T_326c3_row7_col6, #T_326c3_row7_col7, #T_326c3_row7_col8, #T_326c3_row8_col0, #T_326c3_row8_col1, #T_326c3_row8_col2, #T_326c3_row8_col3, #T_326c3_row8_col4, #T_326c3_row8_col5, #T_326c3_row8_col6, #T_326c3_row8_col7, #T_326c3_row8_col8, #T_326c3_row9_col0, #T_326c3_row9_col1, #T_326c3_row9_col2, #T_326c3_row9_col3, #T_326c3_row9_col4, #T_326c3_row9_col5, #T_326c3_row9_col6, #T_326c3_row9_col7, #T_326c3_row9_col8, #T_326c3_row10_col0, #T_326c3_row10_col1, #T_326c3_row10_col2, #T_326c3_row10_col3, #T_326c3_row10_col4, #T_326c3_row10_col5, #T_326c3_row10_col6, #T_326c3_row10_col7, 
#T_326c3_row10_col8, #T_326c3_row11_col0, #T_326c3_row11_col1, #T_326c3_row11_col2, #T_326c3_row11_col3, #T_326c3_row11_col4, #T_326c3_row11_col5, #T_326c3_row11_col6, #T_326c3_row11_col7, #T_326c3_row11_col8, #T_326c3_row12_col0, #T_326c3_row12_col1, #T_326c3_row12_col2, #T_326c3_row12_col3, #T_326c3_row12_col4, #T_326c3_row12_col5, #T_326c3_row12_col6, #T_326c3_row12_col7, #T_326c3_row12_col8, #T_326c3_row13_col0, #T_326c3_row13_col1, #T_326c3_row13_col2, #T_326c3_row13_col3, #T_326c3_row13_col4, #T_326c3_row13_col5, #T_326c3_row13_col6, #T_326c3_row13_col7, #T_326c3_row13_col8, #T_326c3_row14_col0, #T_326c3_row14_col1, #T_326c3_row14_col2, #T_326c3_row14_col3, #T_326c3_row14_col4, #T_326c3_row14_col5, #T_326c3_row14_col6, #T_326c3_row14_col7, #T_326c3_row14_col8, #T_326c3_row15_col0, #T_326c3_row15_col1, #T_326c3_row15_col2, #T_326c3_row15_col3, #T_326c3_row15_col4, #T_326c3_row15_col5, #T_326c3_row15_col6, #T_326c3_row15_col7, #T_326c3_row15_col8, #T_326c3_row16_col0, #T_326c3_row16_col1, #T_326c3_row16_col2, #T_326c3_row16_col3, #T_326c3_row16_col4, #T_326c3_row16_col5, #T_326c3_row16_col6, #T_326c3_row16_col7, #T_326c3_row16_col8, #T_326c3_row17_col0, #T_326c3_row17_col1, #T_326c3_row17_col2, #T_326c3_row17_col3, #T_326c3_row17_col4, #T_326c3_row17_col5, #T_326c3_row17_col6, #T_326c3_row17_col7, #T_326c3_row17_col8, #T_326c3_row18_col0, #T_326c3_row18_col1, #T_326c3_row18_col2, #T_326c3_row18_col3, #T_326c3_row18_col4, #T_326c3_row18_col5, #T_326c3_row18_col6, #T_326c3_row18_col7, #T_326c3_row18_col8, #T_326c3_row19_col0, #T_326c3_row19_col1, #T_326c3_row19_col2, #T_326c3_row19_col3, #T_326c3_row19_col4, #T_326c3_row19_col5, #T_326c3_row19_col6, #T_326c3_row19_col7, #T_326c3_row19_col8, #T_326c3_row20_col0, #T_326c3_row20_col1, #T_326c3_row20_col2, #T_326c3_row20_col3, #T_326c3_row20_col4, #T_326c3_row20_col5, #T_326c3_row20_col6, #T_326c3_row20_col7, #T_326c3_row20_col8, #T_326c3_row21_col0, #T_326c3_row21_col1, #T_326c3_row21_col2, #T_326c3_row21_col3, 
#T_326c3_row21_col4, #T_326c3_row21_col5, #T_326c3_row21_col6, #T_326c3_row21_col7, #T_326c3_row21_col8, #T_326c3_row22_col0, #T_326c3_row22_col1, #T_326c3_row22_col2, #T_326c3_row22_col3, #T_326c3_row22_col4, #T_326c3_row22_col5, #T_326c3_row22_col6, #T_326c3_row22_col7, #T_326c3_row22_col8, #T_326c3_row23_col0, #T_326c3_row23_col1, #T_326c3_row23_col2, #T_326c3_row23_col3, #T_326c3_row23_col4, #T_326c3_row23_col5, #T_326c3_row23_col6, #T_326c3_row23_col7, #T_326c3_row23_col8, #T_326c3_row24_col0, #T_326c3_row24_col1, #T_326c3_row24_col2, #T_326c3_row24_col3, #T_326c3_row24_col4, #T_326c3_row24_col5, #T_326c3_row24_col6, #T_326c3_row24_col7, #T_326c3_row24_col8, #T_326c3_row25_col0, #T_326c3_row25_col1, #T_326c3_row25_col2, #T_326c3_row25_col3, #T_326c3_row25_col4, #T_326c3_row25_col5, #T_326c3_row25_col6, #T_326c3_row25_col7, #T_326c3_row25_col8, #T_326c3_row26_col0, #T_326c3_row26_col1, #T_326c3_row26_col2, #T_326c3_row26_col3, #T_326c3_row26_col4, #T_326c3_row26_col5, #T_326c3_row26_col6, #T_326c3_row26_col7, #T_326c3_row26_col8, #T_326c3_row27_col0, #T_326c3_row27_col1, #T_326c3_row27_col2, #T_326c3_row27_col3, #T_326c3_row27_col4, #T_326c3_row27_col5, #T_326c3_row27_col6, #T_326c3_row27_col7, #T_326c3_row27_col8, #T_326c3_row28_col0, #T_326c3_row28_col1, #T_326c3_row28_col2, #T_326c3_row28_col3, #T_326c3_row28_col4, #T_326c3_row28_col5, #T_326c3_row28_col6, #T_326c3_row28_col7, #T_326c3_row28_col8, #T_326c3_row29_col0, #T_326c3_row29_col1, #T_326c3_row29_col2, #T_326c3_row29_col3, #T_326c3_row29_col4, #T_326c3_row29_col5, #T_326c3_row29_col6, #T_326c3_row29_col7, #T_326c3_row29_col8, #T_326c3_row30_col0, #T_326c3_row30_col1, #T_326c3_row30_col2, #T_326c3_row30_col3, #T_326c3_row30_col4, #T_326c3_row30_col5, #T_326c3_row30_col6, #T_326c3_row30_col7, #T_326c3_row30_col8, #T_326c3_row31_col0, #T_326c3_row31_col1, #T_326c3_row31_col2, #T_326c3_row31_col3, #T_326c3_row31_col4, #T_326c3_row31_col5, #T_326c3_row31_col6, #T_326c3_row31_col7, #T_326c3_row31_col8, 
#T_326c3_row32_col0, #T_326c3_row32_col1, #T_326c3_row32_col2, #T_326c3_row32_col3, #T_326c3_row32_col4, #T_326c3_row32_col5, #T_326c3_row32_col6, #T_326c3_row32_col7, #T_326c3_row32_col8, #T_326c3_row33_col0, #T_326c3_row33_col1, #T_326c3_row33_col2, #T_326c3_row33_col3, #T_326c3_row33_col4, #T_326c3_row33_col5, #T_326c3_row33_col6, #T_326c3_row33_col7, #T_326c3_row33_col8, #T_326c3_row34_col0, #T_326c3_row34_col1, #T_326c3_row34_col2, #T_326c3_row34_col3, #T_326c3_row34_col4, #T_326c3_row34_col5, #T_326c3_row34_col6, #T_326c3_row34_col7, #T_326c3_row34_col8, #T_326c3_row35_col0, #T_326c3_row35_col1, #T_326c3_row35_col2, #T_326c3_row35_col3, #T_326c3_row35_col4, #T_326c3_row35_col5, #T_326c3_row35_col6, #T_326c3_row35_col7, #T_326c3_row35_col8, #T_326c3_row36_col0, #T_326c3_row36_col1, #T_326c3_row36_col2, #T_326c3_row36_col3, #T_326c3_row36_col4, #T_326c3_row36_col5, #T_326c3_row36_col6, #T_326c3_row36_col7, #T_326c3_row36_col8, #T_326c3_row37_col0, #T_326c3_row37_col1, #T_326c3_row37_col2, #T_326c3_row37_col3, #T_326c3_row37_col4, #T_326c3_row37_col5, #T_326c3_row37_col6, #T_326c3_row37_col7, #T_326c3_row37_col8, #T_326c3_row38_col0, #T_326c3_row38_col1, #T_326c3_row38_col2, #T_326c3_row38_col3, #T_326c3_row38_col4, #T_326c3_row38_col5, #T_326c3_row38_col6, #T_326c3_row38_col7, #T_326c3_row38_col8, #T_326c3_row39_col0, #T_326c3_row39_col1, #T_326c3_row39_col2, #T_326c3_row39_col3, #T_326c3_row39_col4, #T_326c3_row39_col5, #T_326c3_row39_col6, #T_326c3_row39_col7, #T_326c3_row39_col8, #T_326c3_row40_col0, #T_326c3_row40_col1, #T_326c3_row40_col2, #T_326c3_row40_col3, #T_326c3_row40_col4, #T_326c3_row40_col5, #T_326c3_row40_col6, #T_326c3_row40_col7, #T_326c3_row40_col8, #T_326c3_row41_col0, #T_326c3_row41_col1, #T_326c3_row41_col2, #T_326c3_row41_col3, #T_326c3_row41_col4, #T_326c3_row41_col5, #T_326c3_row41_col6, #T_326c3_row41_col7, #T_326c3_row41_col8, #T_326c3_row42_col0, #T_326c3_row42_col1, #T_326c3_row42_col2, #T_326c3_row42_col3, #T_326c3_row42_col4, 
#T_326c3_row42_col5, #T_326c3_row42_col6, #T_326c3_row42_col7, #T_326c3_row42_col8 {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "</style>\n",
+              "<table id=\"T_326c3\">\n",
+              "  <thead>\n",
+              "    <tr>\n",
+              "      <th id=\"T_326c3_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
+              "      <th id=\"T_326c3_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
+              "      <th id=\"T_326c3_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
+              "      <th id=\"T_326c3_level0_col3\" class=\"col_heading level0 col3\" >Has Figure</th>\n",
+              "      <th id=\"T_326c3_level0_col4\" class=\"col_heading level0 col4\" >Has Table</th>\n",
+              "      <th id=\"T_326c3_level0_col5\" class=\"col_heading level0 col5\" >Required Inputs</th>\n",
+              "      <th id=\"T_326c3_level0_col6\" class=\"col_heading level0 col6\" >Params</th>\n",
+              "      <th id=\"T_326c3_level0_col7\" class=\"col_heading level0 col7\" >Tags</th>\n",
+              "      <th id=\"T_326c3_level0_col8\" class=\"col_heading level0 col8\" >Tasks</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row0_col0\" class=\"data row0 col0\" >validmind.model_validation.ClusterSizeDistribution</td>\n",
+              "      <td id=\"T_326c3_row0_col1\" class=\"data row0 col1\" >Cluster Size Distribution</td>\n",
+              "      <td id=\"T_326c3_row0_col2\" class=\"data row0 col2\" >Assesses the performance of clustering models by comparing the distribution of cluster sizes in model predictions...</td>\n",
+              "      <td id=\"T_326c3_row0_col3\" class=\"data row0 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row0_col4\" class=\"data row0 col4\" >False</td>\n",
+              "      <td id=\"T_326c3_row0_col5\" class=\"data row0 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row0_col6\" class=\"data row0 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row0_col7\" class=\"data row0 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row0_col8\" class=\"data row0 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row1_col0\" class=\"data row1 col0\" >validmind.model_validation.TimeSeriesR2SquareBySegments</td>\n",
+              "      <td id=\"T_326c3_row1_col1\" class=\"data row1 col1\" >Time Series R2 Square By Segments</td>\n",
+              "      <td id=\"T_326c3_row1_col2\" class=\"data row1 col2\" >Evaluates the R-Squared values of regression models over specified time segments in time series data to assess...</td>\n",
+              "      <td id=\"T_326c3_row1_col3\" class=\"data row1 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row1_col4\" class=\"data row1 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row1_col5\" class=\"data row1 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row1_col6\" class=\"data row1 col6\" >{'segments': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_326c3_row1_col7\" class=\"data row1 col7\" >['model_performance', 'sklearn']</td>\n",
+              "      <td id=\"T_326c3_row1_col8\" class=\"data row1 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row2_col0\" class=\"data row2 col0\" >validmind.model_validation.sklearn.AdjustedMutualInformation</td>\n",
+              "      <td id=\"T_326c3_row2_col1\" class=\"data row2 col1\" >Adjusted Mutual Information</td>\n",
+              "      <td id=\"T_326c3_row2_col2\" class=\"data row2 col2\" >Evaluates clustering model performance by measuring mutual information between true and predicted labels, adjusting...</td>\n",
+              "      <td id=\"T_326c3_row2_col3\" class=\"data row2 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row2_col4\" class=\"data row2 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row2_col5\" class=\"data row2 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row2_col6\" class=\"data row2 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row2_col7\" class=\"data row2 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
+              "      <td id=\"T_326c3_row2_col8\" class=\"data row2 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row3_col0\" class=\"data row3 col0\" >validmind.model_validation.sklearn.AdjustedRandIndex</td>\n",
+              "      <td id=\"T_326c3_row3_col1\" class=\"data row3 col1\" >Adjusted Rand Index</td>\n",
+              "      <td id=\"T_326c3_row3_col2\" class=\"data row3 col2\" >Measures the similarity between two data clusters using the Adjusted Rand Index (ARI) metric in clustering machine...</td>\n",
+              "      <td id=\"T_326c3_row3_col3\" class=\"data row3 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row3_col4\" class=\"data row3 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row3_col5\" class=\"data row3 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row3_col6\" class=\"data row3 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row3_col7\" class=\"data row3 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
+              "      <td id=\"T_326c3_row3_col8\" class=\"data row3 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row4_col0\" class=\"data row4 col0\" >validmind.model_validation.sklearn.CalibrationCurve</td>\n",
+              "      <td id=\"T_326c3_row4_col1\" class=\"data row4 col1\" >Calibration Curve</td>\n",
+              "      <td id=\"T_326c3_row4_col2\" class=\"data row4 col2\" >Evaluates the calibration of probability estimates by comparing predicted probabilities against observed...</td>\n",
+              "      <td id=\"T_326c3_row4_col3\" class=\"data row4 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row4_col4\" class=\"data row4 col4\" >False</td>\n",
+              "      <td id=\"T_326c3_row4_col5\" class=\"data row4 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row4_col6\" class=\"data row4 col6\" >{'n_bins': {'type': 'int', 'default': 10}}</td>\n",
+              "      <td id=\"T_326c3_row4_col7\" class=\"data row4 col7\" >['sklearn', 'model_performance', 'classification']</td>\n",
+              "      <td id=\"T_326c3_row4_col8\" class=\"data row4 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row5_col0\" class=\"data row5 col0\" >validmind.model_validation.sklearn.ClassifierPerformance</td>\n",
+              "      <td id=\"T_326c3_row5_col1\" class=\"data row5 col1\" >Classifier Performance</td>\n",
+              "      <td id=\"T_326c3_row5_col2\" class=\"data row5 col2\" >Evaluates performance of binary or multiclass classification models using precision, recall, F1-Score, accuracy,...</td>\n",
+              "      <td id=\"T_326c3_row5_col3\" class=\"data row5 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row5_col4\" class=\"data row5 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row5_col5\" class=\"data row5 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row5_col6\" class=\"data row5 col6\" >{'average': {'type': 'str', 'default': 'macro'}}</td>\n",
+              "      <td id=\"T_326c3_row5_col7\" class=\"data row5 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row5_col8\" class=\"data row5 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row6_col0\" class=\"data row6 col0\" >validmind.model_validation.sklearn.ClassifierThresholdOptimization</td>\n",
+              "      <td id=\"T_326c3_row6_col1\" class=\"data row6 col1\" >Classifier Threshold Optimization</td>\n",
+              "      <td id=\"T_326c3_row6_col2\" class=\"data row6 col2\" >Analyzes and visualizes different threshold optimization methods for binary classification models....</td>\n",
+              "      <td id=\"T_326c3_row6_col3\" class=\"data row6 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row6_col4\" class=\"data row6 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row6_col5\" class=\"data row6 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row6_col6\" class=\"data row6 col6\" >{'methods': {'type': None, 'default': None}, 'target_recall': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_326c3_row6_col7\" class=\"data row6 col7\" >['model_validation', 'threshold_optimization', 'classification_metrics']</td>\n",
+              "      <td id=\"T_326c3_row6_col8\" class=\"data row6 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row7_col0\" class=\"data row7 col0\" >validmind.model_validation.sklearn.ClusterCosineSimilarity</td>\n",
+              "      <td id=\"T_326c3_row7_col1\" class=\"data row7 col1\" >Cluster Cosine Similarity</td>\n",
+              "      <td id=\"T_326c3_row7_col2\" class=\"data row7 col2\" >Measures the intra-cluster similarity of a clustering model using cosine similarity....</td>\n",
+              "      <td id=\"T_326c3_row7_col3\" class=\"data row7 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row7_col4\" class=\"data row7 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row7_col5\" class=\"data row7 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row7_col6\" class=\"data row7 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row7_col7\" class=\"data row7 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
+              "      <td id=\"T_326c3_row7_col8\" class=\"data row7 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row8_col0\" class=\"data row8 col0\" >validmind.model_validation.sklearn.ClusterPerformanceMetrics</td>\n",
+              "      <td id=\"T_326c3_row8_col1\" class=\"data row8 col1\" >Cluster Performance Metrics</td>\n",
+              "      <td id=\"T_326c3_row8_col2\" class=\"data row8 col2\" >Evaluates the performance of clustering machine learning models using multiple established metrics....</td>\n",
+              "      <td id=\"T_326c3_row8_col3\" class=\"data row8 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row8_col4\" class=\"data row8 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row8_col5\" class=\"data row8 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row8_col6\" class=\"data row8 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row8_col7\" class=\"data row8 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
+              "      <td id=\"T_326c3_row8_col8\" class=\"data row8 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row9_col0\" class=\"data row9 col0\" >validmind.model_validation.sklearn.CompletenessScore</td>\n",
+              "      <td id=\"T_326c3_row9_col1\" class=\"data row9 col1\" >Completeness Score</td>\n",
+              "      <td id=\"T_326c3_row9_col2\" class=\"data row9 col2\" >Evaluates a clustering model's capacity to categorize instances from a single class into the same cluster....</td>\n",
+              "      <td id=\"T_326c3_row9_col3\" class=\"data row9 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row9_col4\" class=\"data row9 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row9_col5\" class=\"data row9 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row9_col6\" class=\"data row9 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row9_col7\" class=\"data row9 col7\" >['sklearn', 'model_performance', 'clustering']</td>\n",
+              "      <td id=\"T_326c3_row9_col8\" class=\"data row9 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row10_col0\" class=\"data row10 col0\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
+              "      <td id=\"T_326c3_row10_col1\" class=\"data row10 col1\" >Confusion Matrix</td>\n",
+              "      <td id=\"T_326c3_row10_col2\" class=\"data row10 col2\" >Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix...</td>\n",
+              "      <td id=\"T_326c3_row10_col3\" class=\"data row10 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row10_col4\" class=\"data row10 col4\" >False</td>\n",
+              "      <td id=\"T_326c3_row10_col5\" class=\"data row10 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row10_col6\" class=\"data row10 col6\" >{'threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_326c3_row10_col7\" class=\"data row10 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_326c3_row10_col8\" class=\"data row10 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row11_col0\" class=\"data row11 col0\" >validmind.model_validation.sklearn.FeatureImportance</td>\n",
+              "      <td id=\"T_326c3_row11_col1\" class=\"data row11 col1\" >Feature Importance</td>\n",
+              "      <td id=\"T_326c3_row11_col2\" class=\"data row11 col2\" >Compute feature importance scores for a given model and generate a summary table...</td>\n",
+              "      <td id=\"T_326c3_row11_col3\" class=\"data row11 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row11_col4\" class=\"data row11 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row11_col5\" class=\"data row11 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row11_col6\" class=\"data row11 col6\" >{'num_features': {'type': 'int', 'default': 3}}</td>\n",
+              "      <td id=\"T_326c3_row11_col7\" class=\"data row11 col7\" >['model_explainability', 'sklearn']</td>\n",
+              "      <td id=\"T_326c3_row11_col8\" class=\"data row11 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row12_col0\" class=\"data row12 col0\" >validmind.model_validation.sklearn.FowlkesMallowsScore</td>\n",
+              "      <td id=\"T_326c3_row12_col1\" class=\"data row12 col1\" >Fowlkes Mallows Score</td>\n",
+              "      <td id=\"T_326c3_row12_col2\" class=\"data row12 col2\" >Evaluates the similarity between predicted and actual cluster assignments in a model using the Fowlkes-Mallows...</td>\n",
+              "      <td id=\"T_326c3_row12_col3\" class=\"data row12 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row12_col4\" class=\"data row12 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row12_col5\" class=\"data row12 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row12_col6\" class=\"data row12 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row12_col7\" class=\"data row12 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row12_col8\" class=\"data row12 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row13_col0\" class=\"data row13 col0\" >validmind.model_validation.sklearn.HomogeneityScore</td>\n",
+              "      <td id=\"T_326c3_row13_col1\" class=\"data row13 col1\" >Homogeneity Score</td>\n",
+              "      <td id=\"T_326c3_row13_col2\" class=\"data row13 col2\" >Assesses clustering homogeneity by comparing true and predicted labels, scoring from 0 (heterogeneous) to 1...</td>\n",
+              "      <td id=\"T_326c3_row13_col3\" class=\"data row13 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row13_col4\" class=\"data row13 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row13_col5\" class=\"data row13 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row13_col6\" class=\"data row13 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row13_col7\" class=\"data row13 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row13_col8\" class=\"data row13 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row14_col0\" class=\"data row14 col0\" >validmind.model_validation.sklearn.HyperParametersTuning</td>\n",
+              "      <td id=\"T_326c3_row14_col1\" class=\"data row14 col1\" >Hyper Parameters Tuning</td>\n",
+              "      <td id=\"T_326c3_row14_col2\" class=\"data row14 col2\" >Performs exhaustive grid search over specified parameter ranges to find optimal model configurations...</td>\n",
+              "      <td id=\"T_326c3_row14_col3\" class=\"data row14 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row14_col4\" class=\"data row14 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row14_col5\" class=\"data row14 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row14_col6\" class=\"data row14 col6\" >{'param_grid': {'type': 'dict', 'default': None}, 'scoring': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}, 'fit_params': {'type': 'dict', 'default': None}}</td>\n",
+              "      <td id=\"T_326c3_row14_col7\" class=\"data row14 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row14_col8\" class=\"data row14 col8\" >['clustering', 'classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row15_col0\" class=\"data row15 col0\" >validmind.model_validation.sklearn.KMeansClustersOptimization</td>\n",
+              "      <td id=\"T_326c3_row15_col1\" class=\"data row15 col1\" >K Means Clusters Optimization</td>\n",
+              "      <td id=\"T_326c3_row15_col2\" class=\"data row15 col2\" >Optimizes the number of clusters in K-means models using Elbow and Silhouette methods....</td>\n",
+              "      <td id=\"T_326c3_row15_col3\" class=\"data row15 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row15_col4\" class=\"data row15 col4\" >False</td>\n",
+              "      <td id=\"T_326c3_row15_col5\" class=\"data row15 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row15_col6\" class=\"data row15 col6\" >{'n_clusters': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_326c3_row15_col7\" class=\"data row15 col7\" >['sklearn', 'model_performance', 'kmeans']</td>\n",
+              "      <td id=\"T_326c3_row15_col8\" class=\"data row15 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row16_col0\" class=\"data row16 col0\" >validmind.model_validation.sklearn.MinimumAccuracy</td>\n",
+              "      <td id=\"T_326c3_row16_col1\" class=\"data row16 col1\" >Minimum Accuracy</td>\n",
+              "      <td id=\"T_326c3_row16_col2\" class=\"data row16 col2\" >Checks if the model's prediction accuracy meets or surpasses a specified threshold....</td>\n",
+              "      <td id=\"T_326c3_row16_col3\" class=\"data row16 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row16_col4\" class=\"data row16 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row16_col5\" class=\"data row16 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row16_col6\" class=\"data row16 col6\" >{'min_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
+              "      <td id=\"T_326c3_row16_col7\" class=\"data row16 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row16_col8\" class=\"data row16 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row17_col0\" class=\"data row17 col0\" >validmind.model_validation.sklearn.MinimumF1Score</td>\n",
+              "      <td id=\"T_326c3_row17_col1\" class=\"data row17 col1\" >Minimum F1 Score</td>\n",
+              "      <td id=\"T_326c3_row17_col2\" class=\"data row17 col2\" >Assesses if the model's F1 score on the validation set meets a predefined minimum threshold, ensuring balanced...</td>\n",
+              "      <td id=\"T_326c3_row17_col3\" class=\"data row17 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row17_col4\" class=\"data row17 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row17_col5\" class=\"data row17 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row17_col6\" class=\"data row17 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_326c3_row17_col7\" class=\"data row17 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row17_col8\" class=\"data row17 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row18_col0\" class=\"data row18 col0\" >validmind.model_validation.sklearn.MinimumROCAUCScore</td>\n",
+              "      <td id=\"T_326c3_row18_col1\" class=\"data row18 col1\" >Minimum ROCAUC Score</td>\n",
+              "      <td id=\"T_326c3_row18_col2\" class=\"data row18 col2\" >Validates model by checking if the ROC AUC score meets or surpasses a specified threshold....</td>\n",
+              "      <td id=\"T_326c3_row18_col3\" class=\"data row18 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row18_col4\" class=\"data row18 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row18_col5\" class=\"data row18 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row18_col6\" class=\"data row18 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_326c3_row18_col7\" class=\"data row18 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row18_col8\" class=\"data row18 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row19_col0\" class=\"data row19 col0\" >validmind.model_validation.sklearn.ModelParameters</td>\n",
+              "      <td id=\"T_326c3_row19_col1\" class=\"data row19 col1\" >Model Parameters</td>\n",
+              "      <td id=\"T_326c3_row19_col2\" class=\"data row19 col2\" >Extracts and displays model parameters in a structured format for transparency and reproducibility....</td>\n",
+              "      <td id=\"T_326c3_row19_col3\" class=\"data row19 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row19_col4\" class=\"data row19 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row19_col5\" class=\"data row19 col5\" >['model']</td>\n",
+              "      <td id=\"T_326c3_row19_col6\" class=\"data row19 col6\" >{'model_params': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_326c3_row19_col7\" class=\"data row19 col7\" >['model_training', 'metadata']</td>\n",
+              "      <td id=\"T_326c3_row19_col8\" class=\"data row19 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row20_col0\" class=\"data row20 col0\" >validmind.model_validation.sklearn.ModelsPerformanceComparison</td>\n",
+              "      <td id=\"T_326c3_row20_col1\" class=\"data row20 col1\" >Models Performance Comparison</td>\n",
+              "      <td id=\"T_326c3_row20_col2\" class=\"data row20 col2\" >Evaluates and compares the performance of multiple Machine Learning models using various metrics like accuracy,...</td>\n",
+              "      <td id=\"T_326c3_row20_col3\" class=\"data row20 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row20_col4\" class=\"data row20 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row20_col5\" class=\"data row20 col5\" >['dataset', 'models']</td>\n",
+              "      <td id=\"T_326c3_row20_col6\" class=\"data row20 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row20_col7\" class=\"data row20 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'model_comparison']</td>\n",
+              "      <td id=\"T_326c3_row20_col8\" class=\"data row20 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row21_col0\" class=\"data row21 col0\" >validmind.model_validation.sklearn.OverfitDiagnosis</td>\n",
+              "      <td id=\"T_326c3_row21_col1\" class=\"data row21 col1\" >Overfit Diagnosis</td>\n",
+              "      <td id=\"T_326c3_row21_col2\" class=\"data row21 col2\" >Assesses potential overfitting in a model's predictions, identifying regions where performance between training and...</td>\n",
+              "      <td id=\"T_326c3_row21_col3\" class=\"data row21 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row21_col4\" class=\"data row21 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row21_col5\" class=\"data row21 col5\" >['model', 'datasets']</td>\n",
+              "      <td id=\"T_326c3_row21_col6\" class=\"data row21 col6\" >{'metric': {'type': 'str', 'default': None}, 'cut_off_threshold': {'type': 'float', 'default': 0.04}}</td>\n",
+              "      <td id=\"T_326c3_row21_col7\" class=\"data row21 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'linear_regression', 'model_diagnosis']</td>\n",
+              "      <td id=\"T_326c3_row21_col8\" class=\"data row21 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row22_col0\" class=\"data row22 col0\" >validmind.model_validation.sklearn.PermutationFeatureImportance</td>\n",
+              "      <td id=\"T_326c3_row22_col1\" class=\"data row22 col1\" >Permutation Feature Importance</td>\n",
+              "      <td id=\"T_326c3_row22_col2\" class=\"data row22 col2\" >Assesses the significance of each feature in a model by evaluating the impact on model performance when feature...</td>\n",
+              "      <td id=\"T_326c3_row22_col3\" class=\"data row22 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row22_col4\" class=\"data row22 col4\" >False</td>\n",
+              "      <td id=\"T_326c3_row22_col5\" class=\"data row22 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row22_col6\" class=\"data row22 col6\" >{'fontsize': {'type': None, 'default': None}, 'figure_height': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_326c3_row22_col7\" class=\"data row22 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
+              "      <td id=\"T_326c3_row22_col8\" class=\"data row22 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row23_col0\" class=\"data row23 col0\" >validmind.model_validation.sklearn.PopulationStabilityIndex</td>\n",
+              "      <td id=\"T_326c3_row23_col1\" class=\"data row23 col1\" >Population Stability Index</td>\n",
+              "      <td id=\"T_326c3_row23_col2\" class=\"data row23 col2\" >Assesses the Population Stability Index (PSI) to quantify the stability of an ML model's predictions across...</td>\n",
+              "      <td id=\"T_326c3_row23_col3\" class=\"data row23 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row23_col4\" class=\"data row23 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row23_col5\" class=\"data row23 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_326c3_row23_col6\" class=\"data row23 col6\" >{'num_bins': {'type': 'int', 'default': 10}, 'mode': {'type': 'str', 'default': 'fixed'}}</td>\n",
+              "      <td id=\"T_326c3_row23_col7\" class=\"data row23 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row23_col8\" class=\"data row23 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row24_col0\" class=\"data row24 col0\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
+              "      <td id=\"T_326c3_row24_col1\" class=\"data row24 col1\" >Precision Recall Curve</td>\n",
+              "      <td id=\"T_326c3_row24_col2\" class=\"data row24 col2\" >Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve....</td>\n",
+              "      <td id=\"T_326c3_row24_col3\" class=\"data row24 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row24_col4\" class=\"data row24 col4\" >False</td>\n",
+              "      <td id=\"T_326c3_row24_col5\" class=\"data row24 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row24_col6\" class=\"data row24 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row24_col7\" class=\"data row24 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_326c3_row24_col8\" class=\"data row24 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row25_col0\" class=\"data row25 col0\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
+              "      <td id=\"T_326c3_row25_col1\" class=\"data row25 col1\" >ROC Curve</td>\n",
+              "      <td id=\"T_326c3_row25_col2\" class=\"data row25 col2\" >Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic...</td>\n",
+              "      <td id=\"T_326c3_row25_col3\" class=\"data row25 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row25_col4\" class=\"data row25 col4\" >False</td>\n",
+              "      <td id=\"T_326c3_row25_col5\" class=\"data row25 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row25_col6\" class=\"data row25 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row25_col7\" class=\"data row25 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_326c3_row25_col8\" class=\"data row25 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row26_col0\" class=\"data row26 col0\" >validmind.model_validation.sklearn.RegressionErrors</td>\n",
+              "      <td id=\"T_326c3_row26_col1\" class=\"data row26 col1\" >Regression Errors</td>\n",
+              "      <td id=\"T_326c3_row26_col2\" class=\"data row26 col2\" >Assesses the performance and error distribution of a regression model using various error metrics....</td>\n",
+              "      <td id=\"T_326c3_row26_col3\" class=\"data row26 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row26_col4\" class=\"data row26 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row26_col5\" class=\"data row26 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row26_col6\" class=\"data row26 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row26_col7\" class=\"data row26 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row26_col8\" class=\"data row26 col8\" >['regression', 'classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row27_col0\" class=\"data row27 col0\" >validmind.model_validation.sklearn.RegressionErrorsComparison</td>\n",
+              "      <td id=\"T_326c3_row27_col1\" class=\"data row27 col1\" >Regression Errors Comparison</td>\n",
+              "      <td id=\"T_326c3_row27_col2\" class=\"data row27 col2\" >Assesses multiple regression error metrics to compare model performance across different datasets, emphasizing...</td>\n",
+              "      <td id=\"T_326c3_row27_col3\" class=\"data row27 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row27_col4\" class=\"data row27 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row27_col5\" class=\"data row27 col5\" >['datasets', 'models']</td>\n",
+              "      <td id=\"T_326c3_row27_col6\" class=\"data row27 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row27_col7\" class=\"data row27 col7\" >['model_performance', 'sklearn']</td>\n",
+              "      <td id=\"T_326c3_row27_col8\" class=\"data row27 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row28_col0\" class=\"data row28 col0\" >validmind.model_validation.sklearn.RegressionPerformance</td>\n",
+              "      <td id=\"T_326c3_row28_col1\" class=\"data row28 col1\" >Regression Performance</td>\n",
+              "      <td id=\"T_326c3_row28_col2\" class=\"data row28 col2\" >Evaluates the performance of a regression model using five different metrics: MAE, MSE, RMSE, MAPE, and MBD....</td>\n",
+              "      <td id=\"T_326c3_row28_col3\" class=\"data row28 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row28_col4\" class=\"data row28 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row28_col5\" class=\"data row28 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row28_col6\" class=\"data row28 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row28_col7\" class=\"data row28 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row28_col8\" class=\"data row28 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row29_col0\" class=\"data row29 col0\" >validmind.model_validation.sklearn.RegressionR2Square</td>\n",
+              "      <td id=\"T_326c3_row29_col1\" class=\"data row29 col1\" >Regression R2 Square</td>\n",
+              "      <td id=\"T_326c3_row29_col2\" class=\"data row29 col2\" >Assesses the overall goodness-of-fit of a regression model by evaluating R-squared (R2) and Adjusted R-squared (Adj...</td>\n",
+              "      <td id=\"T_326c3_row29_col3\" class=\"data row29 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row29_col4\" class=\"data row29 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row29_col5\" class=\"data row29 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row29_col6\" class=\"data row29 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row29_col7\" class=\"data row29 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row29_col8\" class=\"data row29 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row30_col0\" class=\"data row30 col0\" >validmind.model_validation.sklearn.RegressionR2SquareComparison</td>\n",
+              "      <td id=\"T_326c3_row30_col1\" class=\"data row30 col1\" >Regression R2 Square Comparison</td>\n",
+              "      <td id=\"T_326c3_row30_col2\" class=\"data row30 col2\" >Compares R-Squared and Adjusted R-Squared values for different regression models across multiple datasets to assess...</td>\n",
+              "      <td id=\"T_326c3_row30_col3\" class=\"data row30 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row30_col4\" class=\"data row30 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row30_col5\" class=\"data row30 col5\" >['datasets', 'models']</td>\n",
+              "      <td id=\"T_326c3_row30_col6\" class=\"data row30 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row30_col7\" class=\"data row30 col7\" >['model_performance', 'sklearn']</td>\n",
+              "      <td id=\"T_326c3_row30_col8\" class=\"data row30 col8\" >['regression', 'time_series_forecasting']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row31_col0\" class=\"data row31 col0\" >validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
+              "      <td id=\"T_326c3_row31_col1\" class=\"data row31 col1\" >Robustness Diagnosis</td>\n",
+              "      <td id=\"T_326c3_row31_col2\" class=\"data row31 col2\" >Assesses the robustness of a machine learning model by evaluating performance decay under noisy conditions....</td>\n",
+              "      <td id=\"T_326c3_row31_col3\" class=\"data row31 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row31_col4\" class=\"data row31 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row31_col5\" class=\"data row31 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_326c3_row31_col6\" class=\"data row31 col6\" >{'metric': {'type': 'str', 'default': None}, 'scaling_factor_std_dev_list': {'type': None, 'default': [0.1, 0.2, 0.3, 0.4, 0.5]}, 'performance_decay_threshold': {'type': 'float', 'default': 0.05}}</td>\n",
+              "      <td id=\"T_326c3_row31_col7\" class=\"data row31 col7\" >['sklearn', 'model_diagnosis', 'visualization']</td>\n",
+              "      <td id=\"T_326c3_row31_col8\" class=\"data row31 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row32_col0\" class=\"data row32 col0\" >validmind.model_validation.sklearn.SHAPGlobalImportance</td>\n",
+              "      <td id=\"T_326c3_row32_col1\" class=\"data row32 col1\" >SHAP Global Importance</td>\n",
+              "      <td id=\"T_326c3_row32_col2\" class=\"data row32 col2\" >Evaluates and visualizes global feature importance using SHAP values for model explanation and risk identification....</td>\n",
+              "      <td id=\"T_326c3_row32_col3\" class=\"data row32 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row32_col4\" class=\"data row32 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row32_col5\" class=\"data row32 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row32_col6\" class=\"data row32 col6\" >{'kernel_explainer_samples': {'type': 'int', 'default': 10}, 'tree_or_linear_explainer_samples': {'type': 'int', 'default': 200}, 'class_of_interest': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_326c3_row32_col7\" class=\"data row32 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
+              "      <td id=\"T_326c3_row32_col8\" class=\"data row32 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row33_col0\" class=\"data row33 col0\" >validmind.model_validation.sklearn.ScoreProbabilityAlignment</td>\n",
+              "      <td id=\"T_326c3_row33_col1\" class=\"data row33 col1\" >Score Probability Alignment</td>\n",
+              "      <td id=\"T_326c3_row33_col2\" class=\"data row33 col2\" >Analyzes the alignment between credit scores and predicted probabilities....</td>\n",
+              "      <td id=\"T_326c3_row33_col3\" class=\"data row33 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row33_col4\" class=\"data row33 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row33_col5\" class=\"data row33 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row33_col6\" class=\"data row33 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'n_bins': {'type': 'int', 'default': 10}}</td>\n",
+              "      <td id=\"T_326c3_row33_col7\" class=\"data row33 col7\" >['visualization', 'credit_risk', 'calibration']</td>\n",
+              "      <td id=\"T_326c3_row33_col8\" class=\"data row33 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row34_col0\" class=\"data row34 col0\" >validmind.model_validation.sklearn.SilhouettePlot</td>\n",
+              "      <td id=\"T_326c3_row34_col1\" class=\"data row34 col1\" >Silhouette Plot</td>\n",
+              "      <td id=\"T_326c3_row34_col2\" class=\"data row34 col2\" >Calculates and visualizes Silhouette Score, assessing the degree of data point suitability to its cluster in ML...</td>\n",
+              "      <td id=\"T_326c3_row34_col3\" class=\"data row34 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row34_col4\" class=\"data row34 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row34_col5\" class=\"data row34 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_326c3_row34_col6\" class=\"data row34 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row34_col7\" class=\"data row34 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row34_col8\" class=\"data row34 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row35_col0\" class=\"data row35 col0\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
+              "      <td id=\"T_326c3_row35_col1\" class=\"data row35 col1\" >Training Test Degradation</td>\n",
+              "      <td id=\"T_326c3_row35_col2\" class=\"data row35 col2\" >Tests if model performance degradation between training and test datasets exceeds a predefined threshold....</td>\n",
+              "      <td id=\"T_326c3_row35_col3\" class=\"data row35 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row35_col4\" class=\"data row35 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row35_col5\" class=\"data row35 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_326c3_row35_col6\" class=\"data row35 col6\" >{'max_threshold': {'type': 'float', 'default': 0.1}}</td>\n",
+              "      <td id=\"T_326c3_row35_col7\" class=\"data row35 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_326c3_row35_col8\" class=\"data row35 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row36_col0\" class=\"data row36 col0\" >validmind.model_validation.sklearn.VMeasure</td>\n",
+              "      <td id=\"T_326c3_row36_col1\" class=\"data row36 col1\" >V Measure</td>\n",
+              "      <td id=\"T_326c3_row36_col2\" class=\"data row36 col2\" >Evaluates homogeneity and completeness of a clustering model using the V Measure Score....</td>\n",
+              "      <td id=\"T_326c3_row36_col3\" class=\"data row36 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row36_col4\" class=\"data row36 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row36_col5\" class=\"data row36 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_326c3_row36_col6\" class=\"data row36 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row36_col7\" class=\"data row36 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row36_col8\" class=\"data row36 col8\" >['clustering']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row37_col0\" class=\"data row37 col0\" >validmind.model_validation.sklearn.WeakspotsDiagnosis</td>\n",
+              "      <td id=\"T_326c3_row37_col1\" class=\"data row37 col1\" >Weakspots Diagnosis</td>\n",
+              "      <td id=\"T_326c3_row37_col2\" class=\"data row37 col2\" >Identifies and visualizes weak spots in a machine learning model's performance across various sections of the...</td>\n",
+              "      <td id=\"T_326c3_row37_col3\" class=\"data row37 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row37_col4\" class=\"data row37 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row37_col5\" class=\"data row37 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_326c3_row37_col6\" class=\"data row37 col6\" >{'features_columns': {'type': None, 'default': None}, 'metrics': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_326c3_row37_col7\" class=\"data row37 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_diagnosis', 'visualization']</td>\n",
+              "      <td id=\"T_326c3_row37_col8\" class=\"data row37 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row38_col0\" class=\"data row38 col0\" >validmind.ongoing_monitoring.CalibrationCurveDrift</td>\n",
+              "      <td id=\"T_326c3_row38_col1\" class=\"data row38 col1\" >Calibration Curve Drift</td>\n",
+              "      <td id=\"T_326c3_row38_col2\" class=\"data row38 col2\" >Evaluates changes in probability calibration between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_326c3_row38_col3\" class=\"data row38 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row38_col4\" class=\"data row38 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row38_col5\" class=\"data row38 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_326c3_row38_col6\" class=\"data row38 col6\" >{'n_bins': {'type': 'int', 'default': 10}, 'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
+              "      <td id=\"T_326c3_row38_col7\" class=\"data row38 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_326c3_row38_col8\" class=\"data row38 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row39_col0\" class=\"data row39 col0\" >validmind.ongoing_monitoring.ClassDiscriminationDrift</td>\n",
+              "      <td id=\"T_326c3_row39_col1\" class=\"data row39 col1\" >Class Discrimination Drift</td>\n",
+              "      <td id=\"T_326c3_row39_col2\" class=\"data row39 col2\" >Compares classification discrimination metrics between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_326c3_row39_col3\" class=\"data row39 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row39_col4\" class=\"data row39 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row39_col5\" class=\"data row39 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_326c3_row39_col6\" class=\"data row39 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
+              "      <td id=\"T_326c3_row39_col7\" class=\"data row39 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row39_col8\" class=\"data row39 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row40_col0\" class=\"data row40 col0\" >validmind.ongoing_monitoring.ClassificationAccuracyDrift</td>\n",
+              "      <td id=\"T_326c3_row40_col1\" class=\"data row40 col1\" >Classification Accuracy Drift</td>\n",
+              "      <td id=\"T_326c3_row40_col2\" class=\"data row40 col2\" >Compares classification accuracy metrics between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_326c3_row40_col3\" class=\"data row40 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row40_col4\" class=\"data row40 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row40_col5\" class=\"data row40 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_326c3_row40_col6\" class=\"data row40 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
+              "      <td id=\"T_326c3_row40_col7\" class=\"data row40 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row40_col8\" class=\"data row40 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row41_col0\" class=\"data row41 col0\" >validmind.ongoing_monitoring.ConfusionMatrixDrift</td>\n",
+              "      <td id=\"T_326c3_row41_col1\" class=\"data row41 col1\" >Confusion Matrix Drift</td>\n",
+              "      <td id=\"T_326c3_row41_col2\" class=\"data row41 col2\" >Compares confusion matrix metrics between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_326c3_row41_col3\" class=\"data row41 col3\" >False</td>\n",
+              "      <td id=\"T_326c3_row41_col4\" class=\"data row41 col4\" >True</td>\n",
+              "      <td id=\"T_326c3_row41_col5\" class=\"data row41 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_326c3_row41_col6\" class=\"data row41 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
+              "      <td id=\"T_326c3_row41_col7\" class=\"data row41 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_326c3_row41_col8\" class=\"data row41 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_326c3_row42_col0\" class=\"data row42 col0\" >validmind.ongoing_monitoring.ROCCurveDrift</td>\n",
+              "      <td id=\"T_326c3_row42_col1\" class=\"data row42 col1\" >ROC Curve Drift</td>\n",
+              "      <td id=\"T_326c3_row42_col2\" class=\"data row42 col2\" >Compares ROC curves between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_326c3_row42_col3\" class=\"data row42 col3\" >True</td>\n",
+              "      <td id=\"T_326c3_row42_col4\" class=\"data row42 col4\" >False</td>\n",
+              "      <td id=\"T_326c3_row42_col5\" class=\"data row42 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_326c3_row42_col6\" class=\"data row42 col6\" >{}</td>\n",
+              "      <td id=\"T_326c3_row42_col7\" class=\"data row42 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_326c3_row42_col8\" class=\"data row42 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n"
+            ],
+            "text/plain": [
+              "<pandas.io.formats.style.Styler at 0x1052e6790>"
+            ]
+          },
+          "execution_count": null,
+          "metadata": {},
+          "output_type": "execute_result"
+        }
       ],
-      "text/plain": [
-       "<pandas.io.formats.style.Styler at 0x10516c880>"
+      "source": [
+        "list_tests(filter=\"sklearn\")"
       ]
-     },
-     "execution_count": 7,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "list_tests(task=\"classification\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Use the `tags` parameter to find tests based on their tags, such as `model_performance` or `visualization`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Use the `task` parameter to find tests that match a specific task type, such as `classification`:"
+      ]
+    },
     {
-     "data": {
-      "text/html": [
-       "<style type=\"text/css\">\n",
-       "#T_4d8bf th {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "#T_4d8bf_row0_col0, #T_4d8bf_row0_col1, #T_4d8bf_row0_col2, #T_4d8bf_row0_col3, #T_4d8bf_row0_col4, #T_4d8bf_row0_col5, #T_4d8bf_row0_col6, #T_4d8bf_row0_col7, #T_4d8bf_row0_col8, #T_4d8bf_row1_col0, #T_4d8bf_row1_col1, #T_4d8bf_row1_col2, #T_4d8bf_row1_col3, #T_4d8bf_row1_col4, #T_4d8bf_row1_col5, #T_4d8bf_row1_col6, #T_4d8bf_row1_col7, #T_4d8bf_row1_col8, #T_4d8bf_row2_col0, #T_4d8bf_row2_col1, #T_4d8bf_row2_col2, #T_4d8bf_row2_col3, #T_4d8bf_row2_col4, #T_4d8bf_row2_col5, #T_4d8bf_row2_col6, #T_4d8bf_row2_col7, #T_4d8bf_row2_col8, #T_4d8bf_row3_col0, #T_4d8bf_row3_col1, #T_4d8bf_row3_col2, #T_4d8bf_row3_col3, #T_4d8bf_row3_col4, #T_4d8bf_row3_col5, #T_4d8bf_row3_col6, #T_4d8bf_row3_col7, #T_4d8bf_row3_col8, #T_4d8bf_row4_col0, #T_4d8bf_row4_col1, #T_4d8bf_row4_col2, #T_4d8bf_row4_col3, #T_4d8bf_row4_col4, #T_4d8bf_row4_col5, #T_4d8bf_row4_col6, #T_4d8bf_row4_col7, #T_4d8bf_row4_col8, #T_4d8bf_row5_col0, #T_4d8bf_row5_col1, #T_4d8bf_row5_col2, #T_4d8bf_row5_col3, #T_4d8bf_row5_col4, #T_4d8bf_row5_col5, #T_4d8bf_row5_col6, #T_4d8bf_row5_col7, #T_4d8bf_row5_col8, #T_4d8bf_row6_col0, #T_4d8bf_row6_col1, #T_4d8bf_row6_col2, #T_4d8bf_row6_col3, #T_4d8bf_row6_col4, #T_4d8bf_row6_col5, #T_4d8bf_row6_col6, #T_4d8bf_row6_col7, #T_4d8bf_row6_col8 {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "</style>\n",
-       "<table id=\"T_4d8bf\">\n",
-       "  <thead>\n",
-       "    <tr>\n",
-       "      <th id=\"T_4d8bf_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
-       "      <th id=\"T_4d8bf_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
-       "      <th id=\"T_4d8bf_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
-       "      <th id=\"T_4d8bf_level0_col3\" class=\"col_heading level0 col3\" >Has Figure</th>\n",
-       "      <th id=\"T_4d8bf_level0_col4\" class=\"col_heading level0 col4\" >Has Table</th>\n",
-       "      <th id=\"T_4d8bf_level0_col5\" class=\"col_heading level0 col5\" >Required Inputs</th>\n",
-       "      <th id=\"T_4d8bf_level0_col6\" class=\"col_heading level0 col6\" >Params</th>\n",
-       "      <th id=\"T_4d8bf_level0_col7\" class=\"col_heading level0 col7\" >Tags</th>\n",
-       "      <th id=\"T_4d8bf_level0_col8\" class=\"col_heading level0 col8\" >Tasks</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <td id=\"T_4d8bf_row0_col0\" class=\"data row0 col0\" >validmind.model_validation.RegressionResidualsPlot</td>\n",
-       "      <td id=\"T_4d8bf_row0_col1\" class=\"data row0 col1\" >Regression Residuals Plot</td>\n",
-       "      <td id=\"T_4d8bf_row0_col2\" class=\"data row0 col2\" >Evaluates regression model performance using residual distribution and actual vs. predicted plots....</td>\n",
-       "      <td id=\"T_4d8bf_row0_col3\" class=\"data row0 col3\" >True</td>\n",
-       "      <td id=\"T_4d8bf_row0_col4\" class=\"data row0 col4\" >False</td>\n",
-       "      <td id=\"T_4d8bf_row0_col5\" class=\"data row0 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_4d8bf_row0_col6\" class=\"data row0 col6\" >{'bin_size': {'type': 'float', 'default': 0.1}}</td>\n",
-       "      <td id=\"T_4d8bf_row0_col7\" class=\"data row0 col7\" >['model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_4d8bf_row0_col8\" class=\"data row0 col8\" >['regression']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_4d8bf_row1_col0\" class=\"data row1 col0\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
-       "      <td id=\"T_4d8bf_row1_col1\" class=\"data row1 col1\" >Confusion Matrix</td>\n",
-       "      <td id=\"T_4d8bf_row1_col2\" class=\"data row1 col2\" >Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix...</td>\n",
-       "      <td id=\"T_4d8bf_row1_col3\" class=\"data row1 col3\" >True</td>\n",
-       "      <td id=\"T_4d8bf_row1_col4\" class=\"data row1 col4\" >False</td>\n",
-       "      <td id=\"T_4d8bf_row1_col5\" class=\"data row1 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_4d8bf_row1_col6\" class=\"data row1 col6\" >{'threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_4d8bf_row1_col7\" class=\"data row1 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_4d8bf_row1_col8\" class=\"data row1 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_4d8bf_row2_col0\" class=\"data row2 col0\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
-       "      <td id=\"T_4d8bf_row2_col1\" class=\"data row2 col1\" >Precision Recall Curve</td>\n",
-       "      <td id=\"T_4d8bf_row2_col2\" class=\"data row2 col2\" >Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve....</td>\n",
-       "      <td id=\"T_4d8bf_row2_col3\" class=\"data row2 col3\" >True</td>\n",
-       "      <td id=\"T_4d8bf_row2_col4\" class=\"data row2 col4\" >False</td>\n",
-       "      <td id=\"T_4d8bf_row2_col5\" class=\"data row2 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_4d8bf_row2_col6\" class=\"data row2 col6\" >{}</td>\n",
-       "      <td id=\"T_4d8bf_row2_col7\" class=\"data row2 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_4d8bf_row2_col8\" class=\"data row2 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_4d8bf_row3_col0\" class=\"data row3 col0\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
-       "      <td id=\"T_4d8bf_row3_col1\" class=\"data row3 col1\" >ROC Curve</td>\n",
-       "      <td id=\"T_4d8bf_row3_col2\" class=\"data row3 col2\" >Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic...</td>\n",
-       "      <td id=\"T_4d8bf_row3_col3\" class=\"data row3 col3\" >True</td>\n",
-       "      <td id=\"T_4d8bf_row3_col4\" class=\"data row3 col4\" >False</td>\n",
-       "      <td id=\"T_4d8bf_row3_col5\" class=\"data row3 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_4d8bf_row3_col6\" class=\"data row3 col6\" >{}</td>\n",
-       "      <td id=\"T_4d8bf_row3_col7\" class=\"data row3 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_4d8bf_row3_col8\" class=\"data row3 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_4d8bf_row4_col0\" class=\"data row4 col0\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
-       "      <td id=\"T_4d8bf_row4_col1\" class=\"data row4 col1\" >Training Test Degradation</td>\n",
-       "      <td id=\"T_4d8bf_row4_col2\" class=\"data row4 col2\" >Tests if model performance degradation between training and test datasets exceeds a predefined threshold....</td>\n",
-       "      <td id=\"T_4d8bf_row4_col3\" class=\"data row4 col3\" >False</td>\n",
-       "      <td id=\"T_4d8bf_row4_col4\" class=\"data row4 col4\" >True</td>\n",
-       "      <td id=\"T_4d8bf_row4_col5\" class=\"data row4 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_4d8bf_row4_col6\" class=\"data row4 col6\" >{'max_threshold': {'type': 'float', 'default': 0.1}}</td>\n",
-       "      <td id=\"T_4d8bf_row4_col7\" class=\"data row4 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_4d8bf_row4_col8\" class=\"data row4 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_4d8bf_row5_col0\" class=\"data row5 col0\" >validmind.ongoing_monitoring.CalibrationCurveDrift</td>\n",
-       "      <td id=\"T_4d8bf_row5_col1\" class=\"data row5 col1\" >Calibration Curve Drift</td>\n",
-       "      <td id=\"T_4d8bf_row5_col2\" class=\"data row5 col2\" >Evaluates changes in probability calibration between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_4d8bf_row5_col3\" class=\"data row5 col3\" >True</td>\n",
-       "      <td id=\"T_4d8bf_row5_col4\" class=\"data row5 col4\" >True</td>\n",
-       "      <td id=\"T_4d8bf_row5_col5\" class=\"data row5 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_4d8bf_row5_col6\" class=\"data row5 col6\" >{'n_bins': {'type': 'int', 'default': 10}, 'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
-       "      <td id=\"T_4d8bf_row5_col7\" class=\"data row5 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_4d8bf_row5_col8\" class=\"data row5 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_4d8bf_row6_col0\" class=\"data row6 col0\" >validmind.ongoing_monitoring.ROCCurveDrift</td>\n",
-       "      <td id=\"T_4d8bf_row6_col1\" class=\"data row6 col1\" >ROC Curve Drift</td>\n",
-       "      <td id=\"T_4d8bf_row6_col2\" class=\"data row6 col2\" >Compares ROC curves between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_4d8bf_row6_col3\" class=\"data row6 col3\" >True</td>\n",
-       "      <td id=\"T_4d8bf_row6_col4\" class=\"data row6 col4\" >False</td>\n",
-       "      <td id=\"T_4d8bf_row6_col5\" class=\"data row6 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_4d8bf_row6_col6\" class=\"data row6 col6\" >{}</td>\n",
-       "      <td id=\"T_4d8bf_row6_col7\" class=\"data row6 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_4d8bf_row6_col8\" class=\"data row6 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n"
+      "cell_type": "code",
+      "execution_count": 7,
+      "metadata": {},
+      "outputs": [
+        {
+          "data": {
+            "text/html": [
+              "<style type=\"text/css\">\n",
+              "#T_56dd5 th {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "#T_56dd5_row0_col0, #T_56dd5_row0_col1, #T_56dd5_row0_col2, #T_56dd5_row0_col3, #T_56dd5_row0_col4, #T_56dd5_row0_col5, #T_56dd5_row0_col6, #T_56dd5_row0_col7, #T_56dd5_row0_col8, #T_56dd5_row1_col0, #T_56dd5_row1_col1, #T_56dd5_row1_col2, #T_56dd5_row1_col3, #T_56dd5_row1_col4, #T_56dd5_row1_col5, #T_56dd5_row1_col6, #T_56dd5_row1_col7, #T_56dd5_row1_col8, #T_56dd5_row2_col0, #T_56dd5_row2_col1, #T_56dd5_row2_col2, #T_56dd5_row2_col3, #T_56dd5_row2_col4, #T_56dd5_row2_col5, #T_56dd5_row2_col6, #T_56dd5_row2_col7, #T_56dd5_row2_col8, #T_56dd5_row3_col0, #T_56dd5_row3_col1, #T_56dd5_row3_col2, #T_56dd5_row3_col3, #T_56dd5_row3_col4, #T_56dd5_row3_col5, #T_56dd5_row3_col6, #T_56dd5_row3_col7, #T_56dd5_row3_col8, #T_56dd5_row4_col0, #T_56dd5_row4_col1, #T_56dd5_row4_col2, #T_56dd5_row4_col3, #T_56dd5_row4_col4, #T_56dd5_row4_col5, #T_56dd5_row4_col6, #T_56dd5_row4_col7, #T_56dd5_row4_col8, #T_56dd5_row5_col0, #T_56dd5_row5_col1, #T_56dd5_row5_col2, #T_56dd5_row5_col3, #T_56dd5_row5_col4, #T_56dd5_row5_col5, #T_56dd5_row5_col6, #T_56dd5_row5_col7, #T_56dd5_row5_col8, #T_56dd5_row6_col0, #T_56dd5_row6_col1, #T_56dd5_row6_col2, #T_56dd5_row6_col3, #T_56dd5_row6_col4, #T_56dd5_row6_col5, #T_56dd5_row6_col6, #T_56dd5_row6_col7, #T_56dd5_row6_col8, #T_56dd5_row7_col0, #T_56dd5_row7_col1, #T_56dd5_row7_col2, #T_56dd5_row7_col3, #T_56dd5_row7_col4, #T_56dd5_row7_col5, #T_56dd5_row7_col6, #T_56dd5_row7_col7, #T_56dd5_row7_col8, #T_56dd5_row8_col0, #T_56dd5_row8_col1, #T_56dd5_row8_col2, #T_56dd5_row8_col3, #T_56dd5_row8_col4, #T_56dd5_row8_col5, #T_56dd5_row8_col6, #T_56dd5_row8_col7, #T_56dd5_row8_col8, #T_56dd5_row9_col0, #T_56dd5_row9_col1, #T_56dd5_row9_col2, #T_56dd5_row9_col3, #T_56dd5_row9_col4, #T_56dd5_row9_col5, #T_56dd5_row9_col6, #T_56dd5_row9_col7, #T_56dd5_row9_col8, #T_56dd5_row10_col0, #T_56dd5_row10_col1, #T_56dd5_row10_col2, #T_56dd5_row10_col3, #T_56dd5_row10_col4, #T_56dd5_row10_col5, #T_56dd5_row10_col6, #T_56dd5_row10_col7, 
#T_56dd5_row10_col8, #T_56dd5_row11_col0, #T_56dd5_row11_col1, #T_56dd5_row11_col2, #T_56dd5_row11_col3, #T_56dd5_row11_col4, #T_56dd5_row11_col5, #T_56dd5_row11_col6, #T_56dd5_row11_col7, #T_56dd5_row11_col8, #T_56dd5_row12_col0, #T_56dd5_row12_col1, #T_56dd5_row12_col2, #T_56dd5_row12_col3, #T_56dd5_row12_col4, #T_56dd5_row12_col5, #T_56dd5_row12_col6, #T_56dd5_row12_col7, #T_56dd5_row12_col8, #T_56dd5_row13_col0, #T_56dd5_row13_col1, #T_56dd5_row13_col2, #T_56dd5_row13_col3, #T_56dd5_row13_col4, #T_56dd5_row13_col5, #T_56dd5_row13_col6, #T_56dd5_row13_col7, #T_56dd5_row13_col8, #T_56dd5_row14_col0, #T_56dd5_row14_col1, #T_56dd5_row14_col2, #T_56dd5_row14_col3, #T_56dd5_row14_col4, #T_56dd5_row14_col5, #T_56dd5_row14_col6, #T_56dd5_row14_col7, #T_56dd5_row14_col8, #T_56dd5_row15_col0, #T_56dd5_row15_col1, #T_56dd5_row15_col2, #T_56dd5_row15_col3, #T_56dd5_row15_col4, #T_56dd5_row15_col5, #T_56dd5_row15_col6, #T_56dd5_row15_col7, #T_56dd5_row15_col8, #T_56dd5_row16_col0, #T_56dd5_row16_col1, #T_56dd5_row16_col2, #T_56dd5_row16_col3, #T_56dd5_row16_col4, #T_56dd5_row16_col5, #T_56dd5_row16_col6, #T_56dd5_row16_col7, #T_56dd5_row16_col8, #T_56dd5_row17_col0, #T_56dd5_row17_col1, #T_56dd5_row17_col2, #T_56dd5_row17_col3, #T_56dd5_row17_col4, #T_56dd5_row17_col5, #T_56dd5_row17_col6, #T_56dd5_row17_col7, #T_56dd5_row17_col8, #T_56dd5_row18_col0, #T_56dd5_row18_col1, #T_56dd5_row18_col2, #T_56dd5_row18_col3, #T_56dd5_row18_col4, #T_56dd5_row18_col5, #T_56dd5_row18_col6, #T_56dd5_row18_col7, #T_56dd5_row18_col8, #T_56dd5_row19_col0, #T_56dd5_row19_col1, #T_56dd5_row19_col2, #T_56dd5_row19_col3, #T_56dd5_row19_col4, #T_56dd5_row19_col5, #T_56dd5_row19_col6, #T_56dd5_row19_col7, #T_56dd5_row19_col8, #T_56dd5_row20_col0, #T_56dd5_row20_col1, #T_56dd5_row20_col2, #T_56dd5_row20_col3, #T_56dd5_row20_col4, #T_56dd5_row20_col5, #T_56dd5_row20_col6, #T_56dd5_row20_col7, #T_56dd5_row20_col8, #T_56dd5_row21_col0, #T_56dd5_row21_col1, #T_56dd5_row21_col2, #T_56dd5_row21_col3, 
#T_56dd5_row21_col4, #T_56dd5_row21_col5, #T_56dd5_row21_col6, #T_56dd5_row21_col7, #T_56dd5_row21_col8, #T_56dd5_row22_col0, #T_56dd5_row22_col1, #T_56dd5_row22_col2, #T_56dd5_row22_col3, #T_56dd5_row22_col4, #T_56dd5_row22_col5, #T_56dd5_row22_col6, #T_56dd5_row22_col7, #T_56dd5_row22_col8, #T_56dd5_row23_col0, #T_56dd5_row23_col1, #T_56dd5_row23_col2, #T_56dd5_row23_col3, #T_56dd5_row23_col4, #T_56dd5_row23_col5, #T_56dd5_row23_col6, #T_56dd5_row23_col7, #T_56dd5_row23_col8, #T_56dd5_row24_col0, #T_56dd5_row24_col1, #T_56dd5_row24_col2, #T_56dd5_row24_col3, #T_56dd5_row24_col4, #T_56dd5_row24_col5, #T_56dd5_row24_col6, #T_56dd5_row24_col7, #T_56dd5_row24_col8, #T_56dd5_row25_col0, #T_56dd5_row25_col1, #T_56dd5_row25_col2, #T_56dd5_row25_col3, #T_56dd5_row25_col4, #T_56dd5_row25_col5, #T_56dd5_row25_col6, #T_56dd5_row25_col7, #T_56dd5_row25_col8, #T_56dd5_row26_col0, #T_56dd5_row26_col1, #T_56dd5_row26_col2, #T_56dd5_row26_col3, #T_56dd5_row26_col4, #T_56dd5_row26_col5, #T_56dd5_row26_col6, #T_56dd5_row26_col7, #T_56dd5_row26_col8, #T_56dd5_row27_col0, #T_56dd5_row27_col1, #T_56dd5_row27_col2, #T_56dd5_row27_col3, #T_56dd5_row27_col4, #T_56dd5_row27_col5, #T_56dd5_row27_col6, #T_56dd5_row27_col7, #T_56dd5_row27_col8, #T_56dd5_row28_col0, #T_56dd5_row28_col1, #T_56dd5_row28_col2, #T_56dd5_row28_col3, #T_56dd5_row28_col4, #T_56dd5_row28_col5, #T_56dd5_row28_col6, #T_56dd5_row28_col7, #T_56dd5_row28_col8, #T_56dd5_row29_col0, #T_56dd5_row29_col1, #T_56dd5_row29_col2, #T_56dd5_row29_col3, #T_56dd5_row29_col4, #T_56dd5_row29_col5, #T_56dd5_row29_col6, #T_56dd5_row29_col7, #T_56dd5_row29_col8, #T_56dd5_row30_col0, #T_56dd5_row30_col1, #T_56dd5_row30_col2, #T_56dd5_row30_col3, #T_56dd5_row30_col4, #T_56dd5_row30_col5, #T_56dd5_row30_col6, #T_56dd5_row30_col7, #T_56dd5_row30_col8, #T_56dd5_row31_col0, #T_56dd5_row31_col1, #T_56dd5_row31_col2, #T_56dd5_row31_col3, #T_56dd5_row31_col4, #T_56dd5_row31_col5, #T_56dd5_row31_col6, #T_56dd5_row31_col7, #T_56dd5_row31_col8, 
#T_56dd5_row32_col0, #T_56dd5_row32_col1, #T_56dd5_row32_col2, #T_56dd5_row32_col3, #T_56dd5_row32_col4, #T_56dd5_row32_col5, #T_56dd5_row32_col6, #T_56dd5_row32_col7, #T_56dd5_row32_col8, #T_56dd5_row33_col0, #T_56dd5_row33_col1, #T_56dd5_row33_col2, #T_56dd5_row33_col3, #T_56dd5_row33_col4, #T_56dd5_row33_col5, #T_56dd5_row33_col6, #T_56dd5_row33_col7, #T_56dd5_row33_col8, #T_56dd5_row34_col0, #T_56dd5_row34_col1, #T_56dd5_row34_col2, #T_56dd5_row34_col3, #T_56dd5_row34_col4, #T_56dd5_row34_col5, #T_56dd5_row34_col6, #T_56dd5_row34_col7, #T_56dd5_row34_col8, #T_56dd5_row35_col0, #T_56dd5_row35_col1, #T_56dd5_row35_col2, #T_56dd5_row35_col3, #T_56dd5_row35_col4, #T_56dd5_row35_col5, #T_56dd5_row35_col6, #T_56dd5_row35_col7, #T_56dd5_row35_col8, #T_56dd5_row36_col0, #T_56dd5_row36_col1, #T_56dd5_row36_col2, #T_56dd5_row36_col3, #T_56dd5_row36_col4, #T_56dd5_row36_col5, #T_56dd5_row36_col6, #T_56dd5_row36_col7, #T_56dd5_row36_col8, #T_56dd5_row37_col0, #T_56dd5_row37_col1, #T_56dd5_row37_col2, #T_56dd5_row37_col3, #T_56dd5_row37_col4, #T_56dd5_row37_col5, #T_56dd5_row37_col6, #T_56dd5_row37_col7, #T_56dd5_row37_col8, #T_56dd5_row38_col0, #T_56dd5_row38_col1, #T_56dd5_row38_col2, #T_56dd5_row38_col3, #T_56dd5_row38_col4, #T_56dd5_row38_col5, #T_56dd5_row38_col6, #T_56dd5_row38_col7, #T_56dd5_row38_col8, #T_56dd5_row39_col0, #T_56dd5_row39_col1, #T_56dd5_row39_col2, #T_56dd5_row39_col3, #T_56dd5_row39_col4, #T_56dd5_row39_col5, #T_56dd5_row39_col6, #T_56dd5_row39_col7, #T_56dd5_row39_col8, #T_56dd5_row40_col0, #T_56dd5_row40_col1, #T_56dd5_row40_col2, #T_56dd5_row40_col3, #T_56dd5_row40_col4, #T_56dd5_row40_col5, #T_56dd5_row40_col6, #T_56dd5_row40_col7, #T_56dd5_row40_col8, #T_56dd5_row41_col0, #T_56dd5_row41_col1, #T_56dd5_row41_col2, #T_56dd5_row41_col3, #T_56dd5_row41_col4, #T_56dd5_row41_col5, #T_56dd5_row41_col6, #T_56dd5_row41_col7, #T_56dd5_row41_col8, #T_56dd5_row42_col0, #T_56dd5_row42_col1, #T_56dd5_row42_col2, #T_56dd5_row42_col3, #T_56dd5_row42_col4, 
#T_56dd5_row42_col5, #T_56dd5_row42_col6, #T_56dd5_row42_col7, #T_56dd5_row42_col8, #T_56dd5_row43_col0, #T_56dd5_row43_col1, #T_56dd5_row43_col2, #T_56dd5_row43_col3, #T_56dd5_row43_col4, #T_56dd5_row43_col5, #T_56dd5_row43_col6, #T_56dd5_row43_col7, #T_56dd5_row43_col8, #T_56dd5_row44_col0, #T_56dd5_row44_col1, #T_56dd5_row44_col2, #T_56dd5_row44_col3, #T_56dd5_row44_col4, #T_56dd5_row44_col5, #T_56dd5_row44_col6, #T_56dd5_row44_col7, #T_56dd5_row44_col8, #T_56dd5_row45_col0, #T_56dd5_row45_col1, #T_56dd5_row45_col2, #T_56dd5_row45_col3, #T_56dd5_row45_col4, #T_56dd5_row45_col5, #T_56dd5_row45_col6, #T_56dd5_row45_col7, #T_56dd5_row45_col8, #T_56dd5_row46_col0, #T_56dd5_row46_col1, #T_56dd5_row46_col2, #T_56dd5_row46_col3, #T_56dd5_row46_col4, #T_56dd5_row46_col5, #T_56dd5_row46_col6, #T_56dd5_row46_col7, #T_56dd5_row46_col8, #T_56dd5_row47_col0, #T_56dd5_row47_col1, #T_56dd5_row47_col2, #T_56dd5_row47_col3, #T_56dd5_row47_col4, #T_56dd5_row47_col5, #T_56dd5_row47_col6, #T_56dd5_row47_col7, #T_56dd5_row47_col8, #T_56dd5_row48_col0, #T_56dd5_row48_col1, #T_56dd5_row48_col2, #T_56dd5_row48_col3, #T_56dd5_row48_col4, #T_56dd5_row48_col5, #T_56dd5_row48_col6, #T_56dd5_row48_col7, #T_56dd5_row48_col8, #T_56dd5_row49_col0, #T_56dd5_row49_col1, #T_56dd5_row49_col2, #T_56dd5_row49_col3, #T_56dd5_row49_col4, #T_56dd5_row49_col5, #T_56dd5_row49_col6, #T_56dd5_row49_col7, #T_56dd5_row49_col8, #T_56dd5_row50_col0, #T_56dd5_row50_col1, #T_56dd5_row50_col2, #T_56dd5_row50_col3, #T_56dd5_row50_col4, #T_56dd5_row50_col5, #T_56dd5_row50_col6, #T_56dd5_row50_col7, #T_56dd5_row50_col8, #T_56dd5_row51_col0, #T_56dd5_row51_col1, #T_56dd5_row51_col2, #T_56dd5_row51_col3, #T_56dd5_row51_col4, #T_56dd5_row51_col5, #T_56dd5_row51_col6, #T_56dd5_row51_col7, #T_56dd5_row51_col8, #T_56dd5_row52_col0, #T_56dd5_row52_col1, #T_56dd5_row52_col2, #T_56dd5_row52_col3, #T_56dd5_row52_col4, #T_56dd5_row52_col5, #T_56dd5_row52_col6, #T_56dd5_row52_col7, #T_56dd5_row52_col8, #T_56dd5_row53_col0, 
#T_56dd5_row53_col1, #T_56dd5_row53_col2, #T_56dd5_row53_col3, #T_56dd5_row53_col4, #T_56dd5_row53_col5, #T_56dd5_row53_col6, #T_56dd5_row53_col7, #T_56dd5_row53_col8, #T_56dd5_row54_col0, #T_56dd5_row54_col1, #T_56dd5_row54_col2, #T_56dd5_row54_col3, #T_56dd5_row54_col4, #T_56dd5_row54_col5, #T_56dd5_row54_col6, #T_56dd5_row54_col7, #T_56dd5_row54_col8, #T_56dd5_row55_col0, #T_56dd5_row55_col1, #T_56dd5_row55_col2, #T_56dd5_row55_col3, #T_56dd5_row55_col4, #T_56dd5_row55_col5, #T_56dd5_row55_col6, #T_56dd5_row55_col7, #T_56dd5_row55_col8, #T_56dd5_row56_col0, #T_56dd5_row56_col1, #T_56dd5_row56_col2, #T_56dd5_row56_col3, #T_56dd5_row56_col4, #T_56dd5_row56_col5, #T_56dd5_row56_col6, #T_56dd5_row56_col7, #T_56dd5_row56_col8, #T_56dd5_row57_col0, #T_56dd5_row57_col1, #T_56dd5_row57_col2, #T_56dd5_row57_col3, #T_56dd5_row57_col4, #T_56dd5_row57_col5, #T_56dd5_row57_col6, #T_56dd5_row57_col7, #T_56dd5_row57_col8, #T_56dd5_row58_col0, #T_56dd5_row58_col1, #T_56dd5_row58_col2, #T_56dd5_row58_col3, #T_56dd5_row58_col4, #T_56dd5_row58_col5, #T_56dd5_row58_col6, #T_56dd5_row58_col7, #T_56dd5_row58_col8, #T_56dd5_row59_col0, #T_56dd5_row59_col1, #T_56dd5_row59_col2, #T_56dd5_row59_col3, #T_56dd5_row59_col4, #T_56dd5_row59_col5, #T_56dd5_row59_col6, #T_56dd5_row59_col7, #T_56dd5_row59_col8, #T_56dd5_row60_col0, #T_56dd5_row60_col1, #T_56dd5_row60_col2, #T_56dd5_row60_col3, #T_56dd5_row60_col4, #T_56dd5_row60_col5, #T_56dd5_row60_col6, #T_56dd5_row60_col7, #T_56dd5_row60_col8, #T_56dd5_row61_col0, #T_56dd5_row61_col1, #T_56dd5_row61_col2, #T_56dd5_row61_col3, #T_56dd5_row61_col4, #T_56dd5_row61_col5, #T_56dd5_row61_col6, #T_56dd5_row61_col7, #T_56dd5_row61_col8, #T_56dd5_row62_col0, #T_56dd5_row62_col1, #T_56dd5_row62_col2, #T_56dd5_row62_col3, #T_56dd5_row62_col4, #T_56dd5_row62_col5, #T_56dd5_row62_col6, #T_56dd5_row62_col7, #T_56dd5_row62_col8, #T_56dd5_row63_col0, #T_56dd5_row63_col1, #T_56dd5_row63_col2, #T_56dd5_row63_col3, #T_56dd5_row63_col4, #T_56dd5_row63_col5, 
#T_56dd5_row63_col6, #T_56dd5_row63_col7, #T_56dd5_row63_col8, #T_56dd5_row64_col0, #T_56dd5_row64_col1, #T_56dd5_row64_col2, #T_56dd5_row64_col3, #T_56dd5_row64_col4, #T_56dd5_row64_col5, #T_56dd5_row64_col6, #T_56dd5_row64_col7, #T_56dd5_row64_col8, #T_56dd5_row65_col0, #T_56dd5_row65_col1, #T_56dd5_row65_col2, #T_56dd5_row65_col3, #T_56dd5_row65_col4, #T_56dd5_row65_col5, #T_56dd5_row65_col6, #T_56dd5_row65_col7, #T_56dd5_row65_col8, #T_56dd5_row66_col0, #T_56dd5_row66_col1, #T_56dd5_row66_col2, #T_56dd5_row66_col3, #T_56dd5_row66_col4, #T_56dd5_row66_col5, #T_56dd5_row66_col6, #T_56dd5_row66_col7, #T_56dd5_row66_col8, #T_56dd5_row67_col0, #T_56dd5_row67_col1, #T_56dd5_row67_col2, #T_56dd5_row67_col3, #T_56dd5_row67_col4, #T_56dd5_row67_col5, #T_56dd5_row67_col6, #T_56dd5_row67_col7, #T_56dd5_row67_col8, #T_56dd5_row68_col0, #T_56dd5_row68_col1, #T_56dd5_row68_col2, #T_56dd5_row68_col3, #T_56dd5_row68_col4, #T_56dd5_row68_col5, #T_56dd5_row68_col6, #T_56dd5_row68_col7, #T_56dd5_row68_col8, #T_56dd5_row69_col0, #T_56dd5_row69_col1, #T_56dd5_row69_col2, #T_56dd5_row69_col3, #T_56dd5_row69_col4, #T_56dd5_row69_col5, #T_56dd5_row69_col6, #T_56dd5_row69_col7, #T_56dd5_row69_col8, #T_56dd5_row70_col0, #T_56dd5_row70_col1, #T_56dd5_row70_col2, #T_56dd5_row70_col3, #T_56dd5_row70_col4, #T_56dd5_row70_col5, #T_56dd5_row70_col6, #T_56dd5_row70_col7, #T_56dd5_row70_col8, #T_56dd5_row71_col0, #T_56dd5_row71_col1, #T_56dd5_row71_col2, #T_56dd5_row71_col3, #T_56dd5_row71_col4, #T_56dd5_row71_col5, #T_56dd5_row71_col6, #T_56dd5_row71_col7, #T_56dd5_row71_col8, #T_56dd5_row72_col0, #T_56dd5_row72_col1, #T_56dd5_row72_col2, #T_56dd5_row72_col3, #T_56dd5_row72_col4, #T_56dd5_row72_col5, #T_56dd5_row72_col6, #T_56dd5_row72_col7, #T_56dd5_row72_col8, #T_56dd5_row73_col0, #T_56dd5_row73_col1, #T_56dd5_row73_col2, #T_56dd5_row73_col3, #T_56dd5_row73_col4, #T_56dd5_row73_col5, #T_56dd5_row73_col6, #T_56dd5_row73_col7, #T_56dd5_row73_col8, #T_56dd5_row74_col0, #T_56dd5_row74_col1, 
#T_56dd5_row74_col2, #T_56dd5_row74_col3, #T_56dd5_row74_col4, #T_56dd5_row74_col5, #T_56dd5_row74_col6, #T_56dd5_row74_col7, #T_56dd5_row74_col8, #T_56dd5_row75_col0, #T_56dd5_row75_col1, #T_56dd5_row75_col2, #T_56dd5_row75_col3, #T_56dd5_row75_col4, #T_56dd5_row75_col5, #T_56dd5_row75_col6, #T_56dd5_row75_col7, #T_56dd5_row75_col8 {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "</style>\n",
+              "<table id=\"T_56dd5\">\n",
+              "  <thead>\n",
+              "    <tr>\n",
+              "      <th id=\"T_56dd5_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
+              "      <th id=\"T_56dd5_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
+              "      <th id=\"T_56dd5_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
+              "      <th id=\"T_56dd5_level0_col3\" class=\"col_heading level0 col3\" >Has Figure</th>\n",
+              "      <th id=\"T_56dd5_level0_col4\" class=\"col_heading level0 col4\" >Has Table</th>\n",
+              "      <th id=\"T_56dd5_level0_col5\" class=\"col_heading level0 col5\" >Required Inputs</th>\n",
+              "      <th id=\"T_56dd5_level0_col6\" class=\"col_heading level0 col6\" >Params</th>\n",
+              "      <th id=\"T_56dd5_level0_col7\" class=\"col_heading level0 col7\" >Tags</th>\n",
+              "      <th id=\"T_56dd5_level0_col8\" class=\"col_heading level0 col8\" >Tasks</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row0_col0\" class=\"data row0 col0\" >validmind.data_validation.BivariateScatterPlots</td>\n",
+              "      <td id=\"T_56dd5_row0_col1\" class=\"data row0 col1\" >Bivariate Scatter Plots</td>\n",
+              "      <td id=\"T_56dd5_row0_col2\" class=\"data row0 col2\" >Generates bivariate scatterplots to visually inspect relationships between pairs of numerical predictor variables...</td>\n",
+              "      <td id=\"T_56dd5_row0_col3\" class=\"data row0 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row0_col4\" class=\"data row0 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row0_col5\" class=\"data row0 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row0_col6\" class=\"data row0 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row0_col7\" class=\"data row0 col7\" >['tabular_data', 'numerical_data', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row0_col8\" class=\"data row0 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row1_col0\" class=\"data row1 col0\" >validmind.data_validation.ChiSquaredFeaturesTable</td>\n",
+              "      <td id=\"T_56dd5_row1_col1\" class=\"data row1 col1\" >Chi Squared Features Table</td>\n",
+              "      <td id=\"T_56dd5_row1_col2\" class=\"data row1 col2\" >Assesses the statistical association between categorical features and a target variable using the Chi-Squared test....</td>\n",
+              "      <td id=\"T_56dd5_row1_col3\" class=\"data row1 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row1_col4\" class=\"data row1 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row1_col5\" class=\"data row1 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row1_col6\" class=\"data row1 col6\" >{'p_threshold': {'type': '_empty', 'default': 0.05}}</td>\n",
+              "      <td id=\"T_56dd5_row1_col7\" class=\"data row1 col7\" >['tabular_data', 'categorical_data', 'statistical_test']</td>\n",
+              "      <td id=\"T_56dd5_row1_col8\" class=\"data row1 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row2_col0\" class=\"data row2 col0\" >validmind.data_validation.ClassImbalance</td>\n",
+              "      <td id=\"T_56dd5_row2_col1\" class=\"data row2 col1\" >Class Imbalance</td>\n",
+              "      <td id=\"T_56dd5_row2_col2\" class=\"data row2 col2\" >Evaluates and quantifies class distribution imbalance in a dataset used by a machine learning model....</td>\n",
+              "      <td id=\"T_56dd5_row2_col3\" class=\"data row2 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row2_col4\" class=\"data row2 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row2_col5\" class=\"data row2 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row2_col6\" class=\"data row2 col6\" >{'min_percent_threshold': {'type': 'int', 'default': 10}}</td>\n",
+              "      <td id=\"T_56dd5_row2_col7\" class=\"data row2 col7\" >['tabular_data', 'binary_classification', 'multiclass_classification', 'data_quality']</td>\n",
+              "      <td id=\"T_56dd5_row2_col8\" class=\"data row2 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row3_col0\" class=\"data row3 col0\" >validmind.data_validation.DatasetDescription</td>\n",
+              "      <td id=\"T_56dd5_row3_col1\" class=\"data row3 col1\" >Dataset Description</td>\n",
+              "      <td id=\"T_56dd5_row3_col2\" class=\"data row3 col2\" >Provides comprehensive analysis and statistical summaries of each column in a machine learning model's dataset....</td>\n",
+              "      <td id=\"T_56dd5_row3_col3\" class=\"data row3 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row3_col4\" class=\"data row3 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row3_col5\" class=\"data row3 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row3_col6\" class=\"data row3 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row3_col7\" class=\"data row3 col7\" >['tabular_data', 'time_series_data', 'text_data']</td>\n",
+              "      <td id=\"T_56dd5_row3_col8\" class=\"data row3 col8\" >['classification', 'regression', 'text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row4_col0\" class=\"data row4 col0\" >validmind.data_validation.DatasetSplit</td>\n",
+              "      <td id=\"T_56dd5_row4_col1\" class=\"data row4 col1\" >Dataset Split</td>\n",
+              "      <td id=\"T_56dd5_row4_col2\" class=\"data row4 col2\" >Evaluates and visualizes the distribution proportions among training, testing, and validation datasets of an ML...</td>\n",
+              "      <td id=\"T_56dd5_row4_col3\" class=\"data row4 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row4_col4\" class=\"data row4 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row4_col5\" class=\"data row4 col5\" >['datasets']</td>\n",
+              "      <td id=\"T_56dd5_row4_col6\" class=\"data row4 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row4_col7\" class=\"data row4 col7\" >['tabular_data', 'time_series_data', 'text_data']</td>\n",
+              "      <td id=\"T_56dd5_row4_col8\" class=\"data row4 col8\" >['classification', 'regression', 'text_classification', 'text_summarization']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row5_col0\" class=\"data row5 col0\" >validmind.data_validation.DescriptiveStatistics</td>\n",
+              "      <td id=\"T_56dd5_row5_col1\" class=\"data row5 col1\" >Descriptive Statistics</td>\n",
+              "      <td id=\"T_56dd5_row5_col2\" class=\"data row5 col2\" >Performs a detailed descriptive statistical analysis of both numerical and categorical data within a model's...</td>\n",
+              "      <td id=\"T_56dd5_row5_col3\" class=\"data row5 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row5_col4\" class=\"data row5 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row5_col5\" class=\"data row5 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row5_col6\" class=\"data row5 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row5_col7\" class=\"data row5 col7\" >['tabular_data', 'time_series_data', 'data_quality']</td>\n",
+              "      <td id=\"T_56dd5_row5_col8\" class=\"data row5 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row6_col0\" class=\"data row6 col0\" >validmind.data_validation.Duplicates</td>\n",
+              "      <td id=\"T_56dd5_row6_col1\" class=\"data row6 col1\" >Duplicates</td>\n",
+              "      <td id=\"T_56dd5_row6_col2\" class=\"data row6 col2\" >Tests dataset for duplicate entries, ensuring model reliability via data quality verification....</td>\n",
+              "      <td id=\"T_56dd5_row6_col3\" class=\"data row6 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row6_col4\" class=\"data row6 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row6_col5\" class=\"data row6 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row6_col6\" class=\"data row6 col6\" >{'min_threshold': {'type': '_empty', 'default': 1}}</td>\n",
+              "      <td id=\"T_56dd5_row6_col7\" class=\"data row6 col7\" >['tabular_data', 'data_quality', 'text_data']</td>\n",
+              "      <td id=\"T_56dd5_row6_col8\" class=\"data row6 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row7_col0\" class=\"data row7 col0\" >validmind.data_validation.FeatureTargetCorrelationPlot</td>\n",
+              "      <td id=\"T_56dd5_row7_col1\" class=\"data row7 col1\" >Feature Target Correlation Plot</td>\n",
+              "      <td id=\"T_56dd5_row7_col2\" class=\"data row7 col2\" >Visualizes the correlation between input features and the model's target output in a color-coded horizontal bar...</td>\n",
+              "      <td id=\"T_56dd5_row7_col3\" class=\"data row7 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row7_col4\" class=\"data row7 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row7_col5\" class=\"data row7 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row7_col6\" class=\"data row7 col6\" >{'fig_height': {'type': '_empty', 'default': 600}}</td>\n",
+              "      <td id=\"T_56dd5_row7_col7\" class=\"data row7 col7\" >['tabular_data', 'visualization', 'correlation']</td>\n",
+              "      <td id=\"T_56dd5_row7_col8\" class=\"data row7 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row8_col0\" class=\"data row8 col0\" >validmind.data_validation.HighCardinality</td>\n",
+              "      <td id=\"T_56dd5_row8_col1\" class=\"data row8 col1\" >High Cardinality</td>\n",
+              "      <td id=\"T_56dd5_row8_col2\" class=\"data row8 col2\" >Assesses the number of unique values in categorical columns to detect high cardinality and potential overfitting....</td>\n",
+              "      <td id=\"T_56dd5_row8_col3\" class=\"data row8 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row8_col4\" class=\"data row8 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row8_col5\" class=\"data row8 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row8_col6\" class=\"data row8 col6\" >{'num_threshold': {'type': 'int', 'default': 100}, 'percent_threshold': {'type': 'float', 'default': 0.1}, 'threshold_type': {'type': 'str', 'default': 'percent'}}</td>\n",
+              "      <td id=\"T_56dd5_row8_col7\" class=\"data row8 col7\" >['tabular_data', 'data_quality', 'categorical_data']</td>\n",
+              "      <td id=\"T_56dd5_row8_col8\" class=\"data row8 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row9_col0\" class=\"data row9 col0\" >validmind.data_validation.HighPearsonCorrelation</td>\n",
+              "      <td id=\"T_56dd5_row9_col1\" class=\"data row9 col1\" >High Pearson Correlation</td>\n",
+              "      <td id=\"T_56dd5_row9_col2\" class=\"data row9 col2\" >Identifies highly correlated feature pairs in a dataset suggesting feature redundancy or multicollinearity....</td>\n",
+              "      <td id=\"T_56dd5_row9_col3\" class=\"data row9 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row9_col4\" class=\"data row9 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row9_col5\" class=\"data row9 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row9_col6\" class=\"data row9 col6\" >{'max_threshold': {'type': 'float', 'default': 0.3}, 'top_n_correlations': {'type': 'int', 'default': 10}, 'feature_columns': {'type': 'list', 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row9_col7\" class=\"data row9 col7\" >['tabular_data', 'data_quality', 'correlation']</td>\n",
+              "      <td id=\"T_56dd5_row9_col8\" class=\"data row9 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row10_col0\" class=\"data row10 col0\" >validmind.data_validation.IQROutliersBarPlot</td>\n",
+              "      <td id=\"T_56dd5_row10_col1\" class=\"data row10 col1\" >IQR Outliers Bar Plot</td>\n",
+              "      <td id=\"T_56dd5_row10_col2\" class=\"data row10 col2\" >Visualizes outlier distribution across percentiles in numerical data using the Interquartile Range (IQR) method....</td>\n",
+              "      <td id=\"T_56dd5_row10_col3\" class=\"data row10 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row10_col4\" class=\"data row10 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row10_col5\" class=\"data row10 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row10_col6\" class=\"data row10 col6\" >{'threshold': {'type': 'float', 'default': 1.5}, 'fig_width': {'type': 'int', 'default': 800}}</td>\n",
+              "      <td id=\"T_56dd5_row10_col7\" class=\"data row10 col7\" >['tabular_data', 'visualization', 'numerical_data']</td>\n",
+              "      <td id=\"T_56dd5_row10_col8\" class=\"data row10 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row11_col0\" class=\"data row11 col0\" >validmind.data_validation.IQROutliersTable</td>\n",
+              "      <td id=\"T_56dd5_row11_col1\" class=\"data row11 col1\" >IQR Outliers Table</td>\n",
+              "      <td id=\"T_56dd5_row11_col2\" class=\"data row11 col2\" >Determines and summarizes outliers in numerical features using the Interquartile Range method....</td>\n",
+              "      <td id=\"T_56dd5_row11_col3\" class=\"data row11 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row11_col4\" class=\"data row11 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row11_col5\" class=\"data row11 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row11_col6\" class=\"data row11 col6\" >{'threshold': {'type': 'float', 'default': 1.5}}</td>\n",
+              "      <td id=\"T_56dd5_row11_col7\" class=\"data row11 col7\" >['tabular_data', 'numerical_data']</td>\n",
+              "      <td id=\"T_56dd5_row11_col8\" class=\"data row11 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row12_col0\" class=\"data row12 col0\" >validmind.data_validation.IsolationForestOutliers</td>\n",
+              "      <td id=\"T_56dd5_row12_col1\" class=\"data row12 col1\" >Isolation Forest Outliers</td>\n",
+              "      <td id=\"T_56dd5_row12_col2\" class=\"data row12 col2\" >Detects outliers in a dataset using the Isolation Forest algorithm and visualizes results through scatter plots....</td>\n",
+              "      <td id=\"T_56dd5_row12_col3\" class=\"data row12 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row12_col4\" class=\"data row12 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row12_col5\" class=\"data row12 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row12_col6\" class=\"data row12 col6\" >{'random_state': {'type': 'int', 'default': 0}, 'contamination': {'type': 'float', 'default': 0.1}, 'feature_columns': {'type': 'list', 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row12_col7\" class=\"data row12 col7\" >['tabular_data', 'anomaly_detection']</td>\n",
+              "      <td id=\"T_56dd5_row12_col8\" class=\"data row12 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row13_col0\" class=\"data row13 col0\" >validmind.data_validation.JarqueBera</td>\n",
+              "      <td id=\"T_56dd5_row13_col1\" class=\"data row13 col1\" >Jarque Bera</td>\n",
+              "      <td id=\"T_56dd5_row13_col2\" class=\"data row13 col2\" >Assesses normality of dataset features in an ML model using the Jarque-Bera test....</td>\n",
+              "      <td id=\"T_56dd5_row13_col3\" class=\"data row13 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row13_col4\" class=\"data row13 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row13_col5\" class=\"data row13 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row13_col6\" class=\"data row13 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row13_col7\" class=\"data row13 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_56dd5_row13_col8\" class=\"data row13 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row14_col0\" class=\"data row14 col0\" >validmind.data_validation.MissingValues</td>\n",
+              "      <td id=\"T_56dd5_row14_col1\" class=\"data row14 col1\" >Missing Values</td>\n",
+              "      <td id=\"T_56dd5_row14_col2\" class=\"data row14 col2\" >Evaluates dataset quality by ensuring missing value ratio across all features does not exceed a set threshold....</td>\n",
+              "      <td id=\"T_56dd5_row14_col3\" class=\"data row14 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row14_col4\" class=\"data row14 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row14_col5\" class=\"data row14 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row14_col6\" class=\"data row14 col6\" >{'min_threshold': {'type': 'int', 'default': 1}}</td>\n",
+              "      <td id=\"T_56dd5_row14_col7\" class=\"data row14 col7\" >['tabular_data', 'data_quality']</td>\n",
+              "      <td id=\"T_56dd5_row14_col8\" class=\"data row14 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row15_col0\" class=\"data row15 col0\" >validmind.data_validation.MissingValuesBarPlot</td>\n",
+              "      <td id=\"T_56dd5_row15_col1\" class=\"data row15 col1\" >Missing Values Bar Plot</td>\n",
+              "      <td id=\"T_56dd5_row15_col2\" class=\"data row15 col2\" >Assesses the percentage and distribution of missing values in the dataset via a bar plot, with emphasis on...</td>\n",
+              "      <td id=\"T_56dd5_row15_col3\" class=\"data row15 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row15_col4\" class=\"data row15 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row15_col5\" class=\"data row15 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row15_col6\" class=\"data row15 col6\" >{'threshold': {'type': 'int', 'default': 80}, 'fig_height': {'type': 'int', 'default': 600}}</td>\n",
+              "      <td id=\"T_56dd5_row15_col7\" class=\"data row15 col7\" >['tabular_data', 'data_quality', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row15_col8\" class=\"data row15 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row16_col0\" class=\"data row16 col0\" >validmind.data_validation.MutualInformation</td>\n",
+              "      <td id=\"T_56dd5_row16_col1\" class=\"data row16 col1\" >Mutual Information</td>\n",
+              "      <td id=\"T_56dd5_row16_col2\" class=\"data row16 col2\" >Calculates mutual information scores between features and target variable to evaluate feature relevance....</td>\n",
+              "      <td id=\"T_56dd5_row16_col3\" class=\"data row16 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row16_col4\" class=\"data row16 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row16_col5\" class=\"data row16 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row16_col6\" class=\"data row16 col6\" >{'min_threshold': {'type': 'float', 'default': 0.01}, 'task': {'type': 'str', 'default': 'classification'}}</td>\n",
+              "      <td id=\"T_56dd5_row16_col7\" class=\"data row16 col7\" >['feature_selection', 'data_analysis']</td>\n",
+              "      <td id=\"T_56dd5_row16_col8\" class=\"data row16 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row17_col0\" class=\"data row17 col0\" >validmind.data_validation.PearsonCorrelationMatrix</td>\n",
+              "      <td id=\"T_56dd5_row17_col1\" class=\"data row17 col1\" >Pearson Correlation Matrix</td>\n",
+              "      <td id=\"T_56dd5_row17_col2\" class=\"data row17 col2\" >Evaluates linear dependency between numerical variables in a dataset via a Pearson Correlation coefficient heat map....</td>\n",
+              "      <td id=\"T_56dd5_row17_col3\" class=\"data row17 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row17_col4\" class=\"data row17 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row17_col5\" class=\"data row17 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row17_col6\" class=\"data row17 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row17_col7\" class=\"data row17 col7\" >['tabular_data', 'numerical_data', 'correlation']</td>\n",
+              "      <td id=\"T_56dd5_row17_col8\" class=\"data row17 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row18_col0\" class=\"data row18 col0\" >validmind.data_validation.ProtectedClassesDescription</td>\n",
+              "      <td id=\"T_56dd5_row18_col1\" class=\"data row18 col1\" >Protected Classes Description</td>\n",
+              "      <td id=\"T_56dd5_row18_col2\" class=\"data row18 col2\" >Visualizes the distribution of protected classes in the dataset relative to the target variable...</td>\n",
+              "      <td id=\"T_56dd5_row18_col3\" class=\"data row18 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row18_col4\" class=\"data row18 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row18_col5\" class=\"data row18 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row18_col6\" class=\"data row18 col6\" >{'protected_classes': {'type': '_empty', 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row18_col7\" class=\"data row18 col7\" >['bias_and_fairness', 'descriptive_statistics']</td>\n",
+              "      <td id=\"T_56dd5_row18_col8\" class=\"data row18 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row19_col0\" class=\"data row19 col0\" >validmind.data_validation.RunsTest</td>\n",
+              "      <td id=\"T_56dd5_row19_col1\" class=\"data row19 col1\" >Runs Test</td>\n",
+              "      <td id=\"T_56dd5_row19_col2\" class=\"data row19 col2\" >Executes Runs Test on ML model to detect non-random patterns in output data sequence....</td>\n",
+              "      <td id=\"T_56dd5_row19_col3\" class=\"data row19 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row19_col4\" class=\"data row19 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row19_col5\" class=\"data row19 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row19_col6\" class=\"data row19 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row19_col7\" class=\"data row19 col7\" >['tabular_data', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_56dd5_row19_col8\" class=\"data row19 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row20_col0\" class=\"data row20 col0\" >validmind.data_validation.ScatterPlot</td>\n",
+              "      <td id=\"T_56dd5_row20_col1\" class=\"data row20 col1\" >Scatter Plot</td>\n",
+              "      <td id=\"T_56dd5_row20_col2\" class=\"data row20 col2\" >Assesses visual relationships, patterns, and outliers among features in a dataset through scatter plot matrices....</td>\n",
+              "      <td id=\"T_56dd5_row20_col3\" class=\"data row20 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row20_col4\" class=\"data row20 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row20_col5\" class=\"data row20 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row20_col6\" class=\"data row20 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row20_col7\" class=\"data row20 col7\" >['tabular_data', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row20_col8\" class=\"data row20 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row21_col0\" class=\"data row21 col0\" >validmind.data_validation.ScoreBandDefaultRates</td>\n",
+              "      <td id=\"T_56dd5_row21_col1\" class=\"data row21 col1\" >Score Band Default Rates</td>\n",
+              "      <td id=\"T_56dd5_row21_col2\" class=\"data row21 col2\" >Analyzes default rates and population distribution across credit score bands....</td>\n",
+              "      <td id=\"T_56dd5_row21_col3\" class=\"data row21 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row21_col4\" class=\"data row21 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row21_col5\" class=\"data row21 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row21_col6\" class=\"data row21 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'score_bands': {'type': 'list', 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row21_col7\" class=\"data row21 col7\" >['visualization', 'credit_risk', 'scorecard']</td>\n",
+              "      <td id=\"T_56dd5_row21_col8\" class=\"data row21 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row22_col0\" class=\"data row22 col0\" >validmind.data_validation.ShapiroWilk</td>\n",
+              "      <td id=\"T_56dd5_row22_col1\" class=\"data row22 col1\" >Shapiro Wilk</td>\n",
+              "      <td id=\"T_56dd5_row22_col2\" class=\"data row22 col2\" >Evaluates feature-wise normality of training data using the Shapiro-Wilk test....</td>\n",
+              "      <td id=\"T_56dd5_row22_col3\" class=\"data row22 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row22_col4\" class=\"data row22 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row22_col5\" class=\"data row22 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row22_col6\" class=\"data row22 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row22_col7\" class=\"data row22 col7\" >['tabular_data', 'data_distribution', 'statistical_test']</td>\n",
+              "      <td id=\"T_56dd5_row22_col8\" class=\"data row22 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row23_col0\" class=\"data row23 col0\" >validmind.data_validation.Skewness</td>\n",
+              "      <td id=\"T_56dd5_row23_col1\" class=\"data row23 col1\" >Skewness</td>\n",
+              "      <td id=\"T_56dd5_row23_col2\" class=\"data row23 col2\" >Evaluates the skewness of numerical data in a dataset to check against a defined threshold, aiming to ensure data...</td>\n",
+              "      <td id=\"T_56dd5_row23_col3\" class=\"data row23 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row23_col4\" class=\"data row23 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row23_col5\" class=\"data row23 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row23_col6\" class=\"data row23 col6\" >{'max_threshold': {'type': '_empty', 'default': 1}}</td>\n",
+              "      <td id=\"T_56dd5_row23_col7\" class=\"data row23 col7\" >['data_quality', 'tabular_data']</td>\n",
+              "      <td id=\"T_56dd5_row23_col8\" class=\"data row23 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row24_col0\" class=\"data row24 col0\" >validmind.data_validation.TabularCategoricalBarPlots</td>\n",
+              "      <td id=\"T_56dd5_row24_col1\" class=\"data row24 col1\" >Tabular Categorical Bar Plots</td>\n",
+              "      <td id=\"T_56dd5_row24_col2\" class=\"data row24 col2\" >Generates and visualizes bar plots for each category in categorical features to evaluate the dataset's composition....</td>\n",
+              "      <td id=\"T_56dd5_row24_col3\" class=\"data row24 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row24_col4\" class=\"data row24 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row24_col5\" class=\"data row24 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row24_col6\" class=\"data row24 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row24_col7\" class=\"data row24 col7\" >['tabular_data', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row24_col8\" class=\"data row24 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row25_col0\" class=\"data row25 col0\" >validmind.data_validation.TabularDateTimeHistograms</td>\n",
+              "      <td id=\"T_56dd5_row25_col1\" class=\"data row25 col1\" >Tabular Date Time Histograms</td>\n",
+              "      <td id=\"T_56dd5_row25_col2\" class=\"data row25 col2\" >Generates histograms to provide graphical insight into the distribution of time intervals in a model's datetime...</td>\n",
+              "      <td id=\"T_56dd5_row25_col3\" class=\"data row25 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row25_col4\" class=\"data row25 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row25_col5\" class=\"data row25 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row25_col6\" class=\"data row25 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row25_col7\" class=\"data row25 col7\" >['time_series_data', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row25_col8\" class=\"data row25 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row26_col0\" class=\"data row26 col0\" >validmind.data_validation.TabularDescriptionTables</td>\n",
+              "      <td id=\"T_56dd5_row26_col1\" class=\"data row26 col1\" >Tabular Description Tables</td>\n",
+              "      <td id=\"T_56dd5_row26_col2\" class=\"data row26 col2\" >Summarizes key descriptive statistics for numerical, categorical, and datetime variables in a dataset....</td>\n",
+              "      <td id=\"T_56dd5_row26_col3\" class=\"data row26 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row26_col4\" class=\"data row26 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row26_col5\" class=\"data row26 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row26_col6\" class=\"data row26 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row26_col7\" class=\"data row26 col7\" >['tabular_data']</td>\n",
+              "      <td id=\"T_56dd5_row26_col8\" class=\"data row26 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row27_col0\" class=\"data row27 col0\" >validmind.data_validation.TabularNumericalHistograms</td>\n",
+              "      <td id=\"T_56dd5_row27_col1\" class=\"data row27 col1\" >Tabular Numerical Histograms</td>\n",
+              "      <td id=\"T_56dd5_row27_col2\" class=\"data row27 col2\" >Generates histograms for each numerical feature in a dataset to provide visual insights into data distribution and...</td>\n",
+              "      <td id=\"T_56dd5_row27_col3\" class=\"data row27 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row27_col4\" class=\"data row27 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row27_col5\" class=\"data row27 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row27_col6\" class=\"data row27 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row27_col7\" class=\"data row27 col7\" >['tabular_data', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row27_col8\" class=\"data row27 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row28_col0\" class=\"data row28 col0\" >validmind.data_validation.TargetRateBarPlots</td>\n",
+              "      <td id=\"T_56dd5_row28_col1\" class=\"data row28 col1\" >Target Rate Bar Plots</td>\n",
+              "      <td id=\"T_56dd5_row28_col2\" class=\"data row28 col2\" >Generates bar plots visualizing the default rates of categorical features for a classification machine learning...</td>\n",
+              "      <td id=\"T_56dd5_row28_col3\" class=\"data row28 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row28_col4\" class=\"data row28 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row28_col5\" class=\"data row28 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row28_col6\" class=\"data row28 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row28_col7\" class=\"data row28 col7\" >['tabular_data', 'visualization', 'categorical_data']</td>\n",
+              "      <td id=\"T_56dd5_row28_col8\" class=\"data row28 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row29_col0\" class=\"data row29 col0\" >validmind.data_validation.TooManyZeroValues</td>\n",
+              "      <td id=\"T_56dd5_row29_col1\" class=\"data row29 col1\" >Too Many Zero Values</td>\n",
+              "      <td id=\"T_56dd5_row29_col2\" class=\"data row29 col2\" >Identifies numerical columns in a dataset that contain an excessive number of zero values, defined by a threshold...</td>\n",
+              "      <td id=\"T_56dd5_row29_col3\" class=\"data row29 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row29_col4\" class=\"data row29 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row29_col5\" class=\"data row29 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row29_col6\" class=\"data row29 col6\" >{'max_percent_threshold': {'type': 'float', 'default': 0.03}}</td>\n",
+              "      <td id=\"T_56dd5_row29_col7\" class=\"data row29 col7\" >['tabular_data']</td>\n",
+              "      <td id=\"T_56dd5_row29_col8\" class=\"data row29 col8\" >['regression', 'classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row30_col0\" class=\"data row30 col0\" >validmind.data_validation.UniqueRows</td>\n",
+              "      <td id=\"T_56dd5_row30_col1\" class=\"data row30 col1\" >Unique Rows</td>\n",
+              "      <td id=\"T_56dd5_row30_col2\" class=\"data row30 col2\" >Verifies the diversity of the dataset by ensuring that the count of unique rows exceeds a prescribed threshold....</td>\n",
+              "      <td id=\"T_56dd5_row30_col3\" class=\"data row30 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row30_col4\" class=\"data row30 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row30_col5\" class=\"data row30 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row30_col6\" class=\"data row30 col6\" >{'min_percent_threshold': {'type': 'float', 'default': 1}}</td>\n",
+              "      <td id=\"T_56dd5_row30_col7\" class=\"data row30 col7\" >['tabular_data']</td>\n",
+              "      <td id=\"T_56dd5_row30_col8\" class=\"data row30 col8\" >['regression', 'classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row31_col0\" class=\"data row31 col0\" >validmind.data_validation.WOEBinPlots</td>\n",
+              "      <td id=\"T_56dd5_row31_col1\" class=\"data row31 col1\" >WOE Bin Plots</td>\n",
+              "      <td id=\"T_56dd5_row31_col2\" class=\"data row31 col2\" >Generates visualizations of Weight of Evidence (WoE) and Information Value (IV) for understanding predictive power...</td>\n",
+              "      <td id=\"T_56dd5_row31_col3\" class=\"data row31 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row31_col4\" class=\"data row31 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row31_col5\" class=\"data row31 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row31_col6\" class=\"data row31 col6\" >{'breaks_adj': {'type': 'list', 'default': None}, 'fig_height': {'type': 'int', 'default': 600}, 'fig_width': {'type': 'int', 'default': 500}}</td>\n",
+              "      <td id=\"T_56dd5_row31_col7\" class=\"data row31 col7\" >['tabular_data', 'visualization', 'categorical_data']</td>\n",
+              "      <td id=\"T_56dd5_row31_col8\" class=\"data row31 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row32_col0\" class=\"data row32 col0\" >validmind.data_validation.WOEBinTable</td>\n",
+              "      <td id=\"T_56dd5_row32_col1\" class=\"data row32 col1\" >WOE Bin Table</td>\n",
+              "      <td id=\"T_56dd5_row32_col2\" class=\"data row32 col2\" >Assesses the Weight of Evidence (WoE) and Information Value (IV) of each feature to evaluate its predictive power...</td>\n",
+              "      <td id=\"T_56dd5_row32_col3\" class=\"data row32 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row32_col4\" class=\"data row32 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row32_col5\" class=\"data row32 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row32_col6\" class=\"data row32 col6\" >{'breaks_adj': {'type': 'list', 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row32_col7\" class=\"data row32 col7\" >['tabular_data', 'categorical_data']</td>\n",
+              "      <td id=\"T_56dd5_row32_col8\" class=\"data row32 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row33_col0\" class=\"data row33 col0\" >validmind.model_validation.FeaturesAUC</td>\n",
+              "      <td id=\"T_56dd5_row33_col1\" class=\"data row33 col1\" >Features AUC</td>\n",
+              "      <td id=\"T_56dd5_row33_col2\" class=\"data row33 col2\" >Evaluates the discriminatory power of each individual feature within a binary classification model by calculating...</td>\n",
+              "      <td id=\"T_56dd5_row33_col3\" class=\"data row33 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row33_col4\" class=\"data row33 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row33_col5\" class=\"data row33 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row33_col6\" class=\"data row33 col6\" >{'fontsize': {'type': 'int', 'default': 12}, 'figure_height': {'type': 'int', 'default': 500}}</td>\n",
+              "      <td id=\"T_56dd5_row33_col7\" class=\"data row33 col7\" >['feature_importance', 'AUC', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row33_col8\" class=\"data row33 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row34_col0\" class=\"data row34 col0\" >validmind.model_validation.sklearn.CalibrationCurve</td>\n",
+              "      <td id=\"T_56dd5_row34_col1\" class=\"data row34 col1\" >Calibration Curve</td>\n",
+              "      <td id=\"T_56dd5_row34_col2\" class=\"data row34 col2\" >Evaluates the calibration of probability estimates by comparing predicted probabilities against observed...</td>\n",
+              "      <td id=\"T_56dd5_row34_col3\" class=\"data row34 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row34_col4\" class=\"data row34 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row34_col5\" class=\"data row34 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row34_col6\" class=\"data row34 col6\" >{'n_bins': {'type': 'int', 'default': 10}}</td>\n",
+              "      <td id=\"T_56dd5_row34_col7\" class=\"data row34 col7\" >['sklearn', 'model_performance', 'classification']</td>\n",
+              "      <td id=\"T_56dd5_row34_col8\" class=\"data row34 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row35_col0\" class=\"data row35 col0\" >validmind.model_validation.sklearn.ClassifierPerformance</td>\n",
+              "      <td id=\"T_56dd5_row35_col1\" class=\"data row35 col1\" >Classifier Performance</td>\n",
+              "      <td id=\"T_56dd5_row35_col2\" class=\"data row35 col2\" >Evaluates performance of binary or multiclass classification models using precision, recall, F1-Score, accuracy,...</td>\n",
+              "      <td id=\"T_56dd5_row35_col3\" class=\"data row35 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row35_col4\" class=\"data row35 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row35_col5\" class=\"data row35 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row35_col6\" class=\"data row35 col6\" >{'average': {'type': 'str', 'default': 'macro'}}</td>\n",
+              "      <td id=\"T_56dd5_row35_col7\" class=\"data row35 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row35_col8\" class=\"data row35 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row36_col0\" class=\"data row36 col0\" >validmind.model_validation.sklearn.ClassifierThresholdOptimization</td>\n",
+              "      <td id=\"T_56dd5_row36_col1\" class=\"data row36 col1\" >Classifier Threshold Optimization</td>\n",
+              "      <td id=\"T_56dd5_row36_col2\" class=\"data row36 col2\" >Analyzes and visualizes different threshold optimization methods for binary classification models....</td>\n",
+              "      <td id=\"T_56dd5_row36_col3\" class=\"data row36 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row36_col4\" class=\"data row36 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row36_col5\" class=\"data row36 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row36_col6\" class=\"data row36 col6\" >{'methods': {'type': None, 'default': None}, 'target_recall': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row36_col7\" class=\"data row36 col7\" >['model_validation', 'threshold_optimization', 'classification_metrics']</td>\n",
+              "      <td id=\"T_56dd5_row36_col8\" class=\"data row36 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row37_col0\" class=\"data row37 col0\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
+              "      <td id=\"T_56dd5_row37_col1\" class=\"data row37 col1\" >Confusion Matrix</td>\n",
+              "      <td id=\"T_56dd5_row37_col2\" class=\"data row37 col2\" >Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix...</td>\n",
+              "      <td id=\"T_56dd5_row37_col3\" class=\"data row37 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row37_col4\" class=\"data row37 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row37_col5\" class=\"data row37 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row37_col6\" class=\"data row37 col6\" >{'threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_56dd5_row37_col7\" class=\"data row37 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row37_col8\" class=\"data row37 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row38_col0\" class=\"data row38 col0\" >validmind.model_validation.sklearn.HyperParametersTuning</td>\n",
+              "      <td id=\"T_56dd5_row38_col1\" class=\"data row38 col1\" >Hyper Parameters Tuning</td>\n",
+              "      <td id=\"T_56dd5_row38_col2\" class=\"data row38 col2\" >Performs exhaustive grid search over specified parameter ranges to find optimal model configurations...</td>\n",
+              "      <td id=\"T_56dd5_row38_col3\" class=\"data row38 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row38_col4\" class=\"data row38 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row38_col5\" class=\"data row38 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row38_col6\" class=\"data row38 col6\" >{'param_grid': {'type': 'dict', 'default': None}, 'scoring': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}, 'fit_params': {'type': 'dict', 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row38_col7\" class=\"data row38 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row38_col8\" class=\"data row38 col8\" >['clustering', 'classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row39_col0\" class=\"data row39 col0\" >validmind.model_validation.sklearn.MinimumAccuracy</td>\n",
+              "      <td id=\"T_56dd5_row39_col1\" class=\"data row39 col1\" >Minimum Accuracy</td>\n",
+              "      <td id=\"T_56dd5_row39_col2\" class=\"data row39 col2\" >Checks if the model's prediction accuracy meets or surpasses a specified threshold....</td>\n",
+              "      <td id=\"T_56dd5_row39_col3\" class=\"data row39 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row39_col4\" class=\"data row39 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row39_col5\" class=\"data row39 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row39_col6\" class=\"data row39 col6\" >{'min_threshold': {'type': 'float', 'default': 0.7}}</td>\n",
+              "      <td id=\"T_56dd5_row39_col7\" class=\"data row39 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row39_col8\" class=\"data row39 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row40_col0\" class=\"data row40 col0\" >validmind.model_validation.sklearn.MinimumF1Score</td>\n",
+              "      <td id=\"T_56dd5_row40_col1\" class=\"data row40 col1\" >Minimum F1 Score</td>\n",
+              "      <td id=\"T_56dd5_row40_col2\" class=\"data row40 col2\" >Assesses if the model's F1 score on the validation set meets a predefined minimum threshold, ensuring balanced...</td>\n",
+              "      <td id=\"T_56dd5_row40_col3\" class=\"data row40 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row40_col4\" class=\"data row40 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row40_col5\" class=\"data row40 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row40_col6\" class=\"data row40 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_56dd5_row40_col7\" class=\"data row40 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row40_col8\" class=\"data row40 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row41_col0\" class=\"data row41 col0\" >validmind.model_validation.sklearn.MinimumROCAUCScore</td>\n",
+              "      <td id=\"T_56dd5_row41_col1\" class=\"data row41 col1\" >Minimum ROCAUC Score</td>\n",
+              "      <td id=\"T_56dd5_row41_col2\" class=\"data row41 col2\" >Validates model by checking if the ROC AUC score meets or surpasses a specified threshold....</td>\n",
+              "      <td id=\"T_56dd5_row41_col3\" class=\"data row41 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row41_col4\" class=\"data row41 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row41_col5\" class=\"data row41 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row41_col6\" class=\"data row41 col6\" >{'min_threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_56dd5_row41_col7\" class=\"data row41 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row41_col8\" class=\"data row41 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row42_col0\" class=\"data row42 col0\" >validmind.model_validation.sklearn.ModelParameters</td>\n",
+              "      <td id=\"T_56dd5_row42_col1\" class=\"data row42 col1\" >Model Parameters</td>\n",
+              "      <td id=\"T_56dd5_row42_col2\" class=\"data row42 col2\" >Extracts and displays model parameters in a structured format for transparency and reproducibility....</td>\n",
+              "      <td id=\"T_56dd5_row42_col3\" class=\"data row42 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row42_col4\" class=\"data row42 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row42_col5\" class=\"data row42 col5\" >['model']</td>\n",
+              "      <td id=\"T_56dd5_row42_col6\" class=\"data row42 col6\" >{'model_params': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row42_col7\" class=\"data row42 col7\" >['model_training', 'metadata']</td>\n",
+              "      <td id=\"T_56dd5_row42_col8\" class=\"data row42 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row43_col0\" class=\"data row43 col0\" >validmind.model_validation.sklearn.ModelsPerformanceComparison</td>\n",
+              "      <td id=\"T_56dd5_row43_col1\" class=\"data row43 col1\" >Models Performance Comparison</td>\n",
+              "      <td id=\"T_56dd5_row43_col2\" class=\"data row43 col2\" >Evaluates and compares the performance of multiple Machine Learning models using various metrics like accuracy,...</td>\n",
+              "      <td id=\"T_56dd5_row43_col3\" class=\"data row43 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row43_col4\" class=\"data row43 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row43_col5\" class=\"data row43 col5\" >['dataset', 'models']</td>\n",
+              "      <td id=\"T_56dd5_row43_col6\" class=\"data row43 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row43_col7\" class=\"data row43 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'model_comparison']</td>\n",
+              "      <td id=\"T_56dd5_row43_col8\" class=\"data row43 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row44_col0\" class=\"data row44 col0\" >validmind.model_validation.sklearn.OverfitDiagnosis</td>\n",
+              "      <td id=\"T_56dd5_row44_col1\" class=\"data row44 col1\" >Overfit Diagnosis</td>\n",
+              "      <td id=\"T_56dd5_row44_col2\" class=\"data row44 col2\" >Assesses potential overfitting in a model's predictions, identifying regions where performance between training and...</td>\n",
+              "      <td id=\"T_56dd5_row44_col3\" class=\"data row44 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row44_col4\" class=\"data row44 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row44_col5\" class=\"data row44 col5\" >['model', 'datasets']</td>\n",
+              "      <td id=\"T_56dd5_row44_col6\" class=\"data row44 col6\" >{'metric': {'type': 'str', 'default': None}, 'cut_off_threshold': {'type': 'float', 'default': 0.04}}</td>\n",
+              "      <td id=\"T_56dd5_row44_col7\" class=\"data row44 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'linear_regression', 'model_diagnosis']</td>\n",
+              "      <td id=\"T_56dd5_row44_col8\" class=\"data row44 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row45_col0\" class=\"data row45 col0\" >validmind.model_validation.sklearn.PermutationFeatureImportance</td>\n",
+              "      <td id=\"T_56dd5_row45_col1\" class=\"data row45 col1\" >Permutation Feature Importance</td>\n",
+              "      <td id=\"T_56dd5_row45_col2\" class=\"data row45 col2\" >Assesses the significance of each feature in a model by evaluating the impact on model performance when feature...</td>\n",
+              "      <td id=\"T_56dd5_row45_col3\" class=\"data row45 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row45_col4\" class=\"data row45 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row45_col5\" class=\"data row45 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row45_col6\" class=\"data row45 col6\" >{'fontsize': {'type': None, 'default': None}, 'figure_height': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row45_col7\" class=\"data row45 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row45_col8\" class=\"data row45 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row46_col0\" class=\"data row46 col0\" >validmind.model_validation.sklearn.PopulationStabilityIndex</td>\n",
+              "      <td id=\"T_56dd5_row46_col1\" class=\"data row46 col1\" >Population Stability Index</td>\n",
+              "      <td id=\"T_56dd5_row46_col2\" class=\"data row46 col2\" >Assesses the Population Stability Index (PSI) to quantify the stability of an ML model's predictions across...</td>\n",
+              "      <td id=\"T_56dd5_row46_col3\" class=\"data row46 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row46_col4\" class=\"data row46 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row46_col5\" class=\"data row46 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row46_col6\" class=\"data row46 col6\" >{'num_bins': {'type': 'int', 'default': 10}, 'mode': {'type': 'str', 'default': 'fixed'}}</td>\n",
+              "      <td id=\"T_56dd5_row46_col7\" class=\"data row46 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row46_col8\" class=\"data row46 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row47_col0\" class=\"data row47 col0\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
+              "      <td id=\"T_56dd5_row47_col1\" class=\"data row47 col1\" >Precision Recall Curve</td>\n",
+              "      <td id=\"T_56dd5_row47_col2\" class=\"data row47 col2\" >Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve....</td>\n",
+              "      <td id=\"T_56dd5_row47_col3\" class=\"data row47 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row47_col4\" class=\"data row47 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row47_col5\" class=\"data row47 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row47_col6\" class=\"data row47 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row47_col7\" class=\"data row47 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row47_col8\" class=\"data row47 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row48_col0\" class=\"data row48 col0\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
+              "      <td id=\"T_56dd5_row48_col1\" class=\"data row48 col1\" >ROC Curve</td>\n",
+              "      <td id=\"T_56dd5_row48_col2\" class=\"data row48 col2\" >Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic...</td>\n",
+              "      <td id=\"T_56dd5_row48_col3\" class=\"data row48 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row48_col4\" class=\"data row48 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row48_col5\" class=\"data row48 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row48_col6\" class=\"data row48 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row48_col7\" class=\"data row48 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row48_col8\" class=\"data row48 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row49_col0\" class=\"data row49 col0\" >validmind.model_validation.sklearn.RegressionErrors</td>\n",
+              "      <td id=\"T_56dd5_row49_col1\" class=\"data row49 col1\" >Regression Errors</td>\n",
+              "      <td id=\"T_56dd5_row49_col2\" class=\"data row49 col2\" >Assesses the performance and error distribution of a regression model using various error metrics....</td>\n",
+              "      <td id=\"T_56dd5_row49_col3\" class=\"data row49 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row49_col4\" class=\"data row49 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row49_col5\" class=\"data row49 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row49_col6\" class=\"data row49 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row49_col7\" class=\"data row49 col7\" >['sklearn', 'model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row49_col8\" class=\"data row49 col8\" >['regression', 'classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row50_col0\" class=\"data row50 col0\" >validmind.model_validation.sklearn.RobustnessDiagnosis</td>\n",
+              "      <td id=\"T_56dd5_row50_col1\" class=\"data row50 col1\" >Robustness Diagnosis</td>\n",
+              "      <td id=\"T_56dd5_row50_col2\" class=\"data row50 col2\" >Assesses the robustness of a machine learning model by evaluating performance decay under noisy conditions....</td>\n",
+              "      <td id=\"T_56dd5_row50_col3\" class=\"data row50 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row50_col4\" class=\"data row50 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row50_col5\" class=\"data row50 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row50_col6\" class=\"data row50 col6\" >{'metric': {'type': 'str', 'default': None}, 'scaling_factor_std_dev_list': {'type': None, 'default': [0.1, 0.2, 0.3, 0.4, 0.5]}, 'performance_decay_threshold': {'type': 'float', 'default': 0.05}}</td>\n",
+              "      <td id=\"T_56dd5_row50_col7\" class=\"data row50 col7\" >['sklearn', 'model_diagnosis', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row50_col8\" class=\"data row50 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row51_col0\" class=\"data row51 col0\" >validmind.model_validation.sklearn.SHAPGlobalImportance</td>\n",
+              "      <td id=\"T_56dd5_row51_col1\" class=\"data row51 col1\" >SHAP Global Importance</td>\n",
+              "      <td id=\"T_56dd5_row51_col2\" class=\"data row51 col2\" >Evaluates and visualizes global feature importance using SHAP values for model explanation and risk identification....</td>\n",
+              "      <td id=\"T_56dd5_row51_col3\" class=\"data row51 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row51_col4\" class=\"data row51 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row51_col5\" class=\"data row51 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row51_col6\" class=\"data row51 col6\" >{'kernel_explainer_samples': {'type': 'int', 'default': 10}, 'tree_or_linear_explainer_samples': {'type': 'int', 'default': 200}, 'class_of_interest': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row51_col7\" class=\"data row51 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'feature_importance', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row51_col8\" class=\"data row51 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row52_col0\" class=\"data row52 col0\" >validmind.model_validation.sklearn.ScoreProbabilityAlignment</td>\n",
+              "      <td id=\"T_56dd5_row52_col1\" class=\"data row52 col1\" >Score Probability Alignment</td>\n",
+              "      <td id=\"T_56dd5_row52_col2\" class=\"data row52 col2\" >Analyzes the alignment between credit scores and predicted probabilities....</td>\n",
+              "      <td id=\"T_56dd5_row52_col3\" class=\"data row52 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row52_col4\" class=\"data row52 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row52_col5\" class=\"data row52 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row52_col6\" class=\"data row52 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'n_bins': {'type': 'int', 'default': 10}}</td>\n",
+              "      <td id=\"T_56dd5_row52_col7\" class=\"data row52 col7\" >['visualization', 'credit_risk', 'calibration']</td>\n",
+              "      <td id=\"T_56dd5_row52_col8\" class=\"data row52 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row53_col0\" class=\"data row53 col0\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
+              "      <td id=\"T_56dd5_row53_col1\" class=\"data row53 col1\" >Training Test Degradation</td>\n",
+              "      <td id=\"T_56dd5_row53_col2\" class=\"data row53 col2\" >Tests if model performance degradation between training and test datasets exceeds a predefined threshold....</td>\n",
+              "      <td id=\"T_56dd5_row53_col3\" class=\"data row53 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row53_col4\" class=\"data row53 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row53_col5\" class=\"data row53 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row53_col6\" class=\"data row53 col6\" >{'max_threshold': {'type': 'float', 'default': 0.1}}</td>\n",
+              "      <td id=\"T_56dd5_row53_col7\" class=\"data row53 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row53_col8\" class=\"data row53 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row54_col0\" class=\"data row54 col0\" >validmind.model_validation.sklearn.WeakspotsDiagnosis</td>\n",
+              "      <td id=\"T_56dd5_row54_col1\" class=\"data row54 col1\" >Weakspots Diagnosis</td>\n",
+              "      <td id=\"T_56dd5_row54_col2\" class=\"data row54 col2\" >Identifies and visualizes weak spots in a machine learning model's performance across various sections of the...</td>\n",
+              "      <td id=\"T_56dd5_row54_col3\" class=\"data row54 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row54_col4\" class=\"data row54 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row54_col5\" class=\"data row54 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row54_col6\" class=\"data row54 col6\" >{'features_columns': {'type': None, 'default': None}, 'metrics': {'type': None, 'default': None}, 'thresholds': {'type': None, 'default': None}}</td>\n",
+              "      <td id=\"T_56dd5_row54_col7\" class=\"data row54 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_diagnosis', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row54_col8\" class=\"data row54 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row55_col0\" class=\"data row55 col0\" >validmind.model_validation.statsmodels.CumulativePredictionProbabilities</td>\n",
+              "      <td id=\"T_56dd5_row55_col1\" class=\"data row55 col1\" >Cumulative Prediction Probabilities</td>\n",
+              "      <td id=\"T_56dd5_row55_col2\" class=\"data row55 col2\" >Visualizes cumulative probabilities of positive and negative classes for both training and testing in classification models....</td>\n",
+              "      <td id=\"T_56dd5_row55_col3\" class=\"data row55 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row55_col4\" class=\"data row55 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row55_col5\" class=\"data row55 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row55_col6\" class=\"data row55 col6\" >{'title': {'type': 'str', 'default': 'Cumulative Probabilities'}}</td>\n",
+              "      <td id=\"T_56dd5_row55_col7\" class=\"data row55 col7\" >['visualization', 'credit_risk']</td>\n",
+              "      <td id=\"T_56dd5_row55_col8\" class=\"data row55 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row56_col0\" class=\"data row56 col0\" >validmind.model_validation.statsmodels.GINITable</td>\n",
+              "      <td id=\"T_56dd5_row56_col1\" class=\"data row56 col1\" >GINI Table</td>\n",
+              "      <td id=\"T_56dd5_row56_col2\" class=\"data row56 col2\" >Evaluates classification model performance using AUC, GINI, and KS metrics for training and test datasets....</td>\n",
+              "      <td id=\"T_56dd5_row56_col3\" class=\"data row56 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row56_col4\" class=\"data row56 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row56_col5\" class=\"data row56 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row56_col6\" class=\"data row56 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row56_col7\" class=\"data row56 col7\" >['model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row56_col8\" class=\"data row56 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row57_col0\" class=\"data row57 col0\" >validmind.model_validation.statsmodels.KolmogorovSmirnov</td>\n",
+              "      <td id=\"T_56dd5_row57_col1\" class=\"data row57 col1\" >Kolmogorov Smirnov</td>\n",
+              "      <td id=\"T_56dd5_row57_col2\" class=\"data row57 col2\" >Assesses whether each feature in the dataset aligns with a normal distribution using the Kolmogorov-Smirnov test....</td>\n",
+              "      <td id=\"T_56dd5_row57_col3\" class=\"data row57 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row57_col4\" class=\"data row57 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row57_col5\" class=\"data row57 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row57_col6\" class=\"data row57 col6\" >{'dist': {'type': 'str', 'default': 'norm'}}</td>\n",
+              "      <td id=\"T_56dd5_row57_col7\" class=\"data row57 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_56dd5_row57_col8\" class=\"data row57 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row58_col0\" class=\"data row58 col0\" >validmind.model_validation.statsmodels.Lilliefors</td>\n",
+              "      <td id=\"T_56dd5_row58_col1\" class=\"data row58 col1\" >Lilliefors</td>\n",
+              "      <td id=\"T_56dd5_row58_col2\" class=\"data row58 col2\" >Assesses the normality of feature distributions in an ML model's training dataset using the Lilliefors test....</td>\n",
+              "      <td id=\"T_56dd5_row58_col3\" class=\"data row58 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row58_col4\" class=\"data row58 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row58_col5\" class=\"data row58 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row58_col6\" class=\"data row58 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row58_col7\" class=\"data row58 col7\" >['tabular_data', 'data_distribution', 'statistical_test', 'statsmodels']</td>\n",
+              "      <td id=\"T_56dd5_row58_col8\" class=\"data row58 col8\" >['classification', 'regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row59_col0\" class=\"data row59 col0\" >validmind.model_validation.statsmodels.PredictionProbabilitiesHistogram</td>\n",
+              "      <td id=\"T_56dd5_row59_col1\" class=\"data row59 col1\" >Prediction Probabilities Histogram</td>\n",
+              "      <td id=\"T_56dd5_row59_col2\" class=\"data row59 col2\" >Assesses the predictive probability distribution for binary classification to evaluate model performance and...</td>\n",
+              "      <td id=\"T_56dd5_row59_col3\" class=\"data row59 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row59_col4\" class=\"data row59 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row59_col5\" class=\"data row59 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row59_col6\" class=\"data row59 col6\" >{'title': {'type': 'str', 'default': 'Histogram of Predictive Probabilities'}}</td>\n",
+              "      <td id=\"T_56dd5_row59_col7\" class=\"data row59 col7\" >['visualization', 'credit_risk']</td>\n",
+              "      <td id=\"T_56dd5_row59_col8\" class=\"data row59 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row60_col0\" class=\"data row60 col0\" >validmind.model_validation.statsmodels.ScorecardHistogram</td>\n",
+              "      <td id=\"T_56dd5_row60_col1\" class=\"data row60 col1\" >Scorecard Histogram</td>\n",
+              "      <td id=\"T_56dd5_row60_col2\" class=\"data row60 col2\" >The Scorecard Histogram test evaluates the distribution of credit scores between default and non-default instances,...</td>\n",
+              "      <td id=\"T_56dd5_row60_col3\" class=\"data row60 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row60_col4\" class=\"data row60 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row60_col5\" class=\"data row60 col5\" >['dataset']</td>\n",
+              "      <td id=\"T_56dd5_row60_col6\" class=\"data row60 col6\" >{'title': {'type': 'str', 'default': 'Histogram of Scores'}, 'score_column': {'type': 'str', 'default': 'score'}}</td>\n",
+              "      <td id=\"T_56dd5_row60_col7\" class=\"data row60 col7\" >['visualization', 'credit_risk', 'logistic_regression']</td>\n",
+              "      <td id=\"T_56dd5_row60_col8\" class=\"data row60 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row61_col0\" class=\"data row61 col0\" >validmind.ongoing_monitoring.CalibrationCurveDrift</td>\n",
+              "      <td id=\"T_56dd5_row61_col1\" class=\"data row61 col1\" >Calibration Curve Drift</td>\n",
+              "      <td id=\"T_56dd5_row61_col2\" class=\"data row61 col2\" >Evaluates changes in probability calibration between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_56dd5_row61_col3\" class=\"data row61 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row61_col4\" class=\"data row61 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row61_col5\" class=\"data row61 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row61_col6\" class=\"data row61 col6\" >{'n_bins': {'type': 'int', 'default': 10}, 'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
+              "      <td id=\"T_56dd5_row61_col7\" class=\"data row61 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row61_col8\" class=\"data row61 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row62_col0\" class=\"data row62 col0\" >validmind.ongoing_monitoring.ClassDiscriminationDrift</td>\n",
+              "      <td id=\"T_56dd5_row62_col1\" class=\"data row62 col1\" >Class Discrimination Drift</td>\n",
+              "      <td id=\"T_56dd5_row62_col2\" class=\"data row62 col2\" >Compares classification discrimination metrics between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_56dd5_row62_col3\" class=\"data row62 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row62_col4\" class=\"data row62 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row62_col5\" class=\"data row62 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row62_col6\" class=\"data row62 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
+              "      <td id=\"T_56dd5_row62_col7\" class=\"data row62 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row62_col8\" class=\"data row62 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row63_col0\" class=\"data row63 col0\" >validmind.ongoing_monitoring.ClassImbalanceDrift</td>\n",
+              "      <td id=\"T_56dd5_row63_col1\" class=\"data row63 col1\" >Class Imbalance Drift</td>\n",
+              "      <td id=\"T_56dd5_row63_col2\" class=\"data row63 col2\" >Evaluates drift in class distribution between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_56dd5_row63_col3\" class=\"data row63 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row63_col4\" class=\"data row63 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row63_col5\" class=\"data row63 col5\" >['datasets']</td>\n",
+              "      <td id=\"T_56dd5_row63_col6\" class=\"data row63 col6\" >{'drift_pct_threshold': {'type': 'float', 'default': 5.0}, 'title': {'type': 'str', 'default': 'Class Distribution Drift'}}</td>\n",
+              "      <td id=\"T_56dd5_row63_col7\" class=\"data row63 col7\" >['tabular_data', 'binary_classification', 'multiclass_classification']</td>\n",
+              "      <td id=\"T_56dd5_row63_col8\" class=\"data row63 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row64_col0\" class=\"data row64 col0\" >validmind.ongoing_monitoring.ClassificationAccuracyDrift</td>\n",
+              "      <td id=\"T_56dd5_row64_col1\" class=\"data row64 col1\" >Classification Accuracy Drift</td>\n",
+              "      <td id=\"T_56dd5_row64_col2\" class=\"data row64 col2\" >Compares classification accuracy metrics between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_56dd5_row64_col3\" class=\"data row64 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row64_col4\" class=\"data row64 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row64_col5\" class=\"data row64 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row64_col6\" class=\"data row64 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
+              "      <td id=\"T_56dd5_row64_col7\" class=\"data row64 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row64_col8\" class=\"data row64 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row65_col0\" class=\"data row65 col0\" >validmind.ongoing_monitoring.ConfusionMatrixDrift</td>\n",
+              "      <td id=\"T_56dd5_row65_col1\" class=\"data row65 col1\" >Confusion Matrix Drift</td>\n",
+              "      <td id=\"T_56dd5_row65_col2\" class=\"data row65 col2\" >Compares confusion matrix metrics between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_56dd5_row65_col3\" class=\"data row65 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row65_col4\" class=\"data row65 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row65_col5\" class=\"data row65 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row65_col6\" class=\"data row65 col6\" >{'drift_pct_threshold': {'type': '_empty', 'default': 20}}</td>\n",
+              "      <td id=\"T_56dd5_row65_col7\" class=\"data row65 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance']</td>\n",
+              "      <td id=\"T_56dd5_row65_col8\" class=\"data row65 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row66_col0\" class=\"data row66 col0\" >validmind.ongoing_monitoring.CumulativePredictionProbabilitiesDrift</td>\n",
+              "      <td id=\"T_56dd5_row66_col1\" class=\"data row66 col1\" >Cumulative Prediction Probabilities Drift</td>\n",
+              "      <td id=\"T_56dd5_row66_col2\" class=\"data row66 col2\" >Compares cumulative prediction probability distributions between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_56dd5_row66_col3\" class=\"data row66 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row66_col4\" class=\"data row66 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row66_col5\" class=\"data row66 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row66_col6\" class=\"data row66 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row66_col7\" class=\"data row66 col7\" >['visualization', 'credit_risk']</td>\n",
+              "      <td id=\"T_56dd5_row66_col8\" class=\"data row66 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row67_col0\" class=\"data row67 col0\" >validmind.ongoing_monitoring.PredictionProbabilitiesHistogramDrift</td>\n",
+              "      <td id=\"T_56dd5_row67_col1\" class=\"data row67 col1\" >Prediction Probabilities Histogram Drift</td>\n",
+              "      <td id=\"T_56dd5_row67_col2\" class=\"data row67 col2\" >Compares prediction probability distributions between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_56dd5_row67_col3\" class=\"data row67 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row67_col4\" class=\"data row67 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row67_col5\" class=\"data row67 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row67_col6\" class=\"data row67 col6\" >{'title': {'type': '_empty', 'default': 'Prediction Probabilities Histogram Drift'}, 'drift_pct_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
+              "      <td id=\"T_56dd5_row67_col7\" class=\"data row67 col7\" >['visualization', 'credit_risk']</td>\n",
+              "      <td id=\"T_56dd5_row67_col8\" class=\"data row67 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row68_col0\" class=\"data row68 col0\" >validmind.ongoing_monitoring.ROCCurveDrift</td>\n",
+              "      <td id=\"T_56dd5_row68_col1\" class=\"data row68 col1\" >ROC Curve Drift</td>\n",
+              "      <td id=\"T_56dd5_row68_col2\" class=\"data row68 col2\" >Compares ROC curves between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_56dd5_row68_col3\" class=\"data row68 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row68_col4\" class=\"data row68 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row68_col5\" class=\"data row68 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row68_col6\" class=\"data row68 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row68_col7\" class=\"data row68 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_56dd5_row68_col8\" class=\"data row68 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row69_col0\" class=\"data row69 col0\" >validmind.ongoing_monitoring.ScoreBandsDrift</td>\n",
+              "      <td id=\"T_56dd5_row69_col1\" class=\"data row69 col1\" >Score Bands Drift</td>\n",
+              "      <td id=\"T_56dd5_row69_col2\" class=\"data row69 col2\" >Analyzes drift in population distribution and default rates across score bands....</td>\n",
+              "      <td id=\"T_56dd5_row69_col3\" class=\"data row69 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row69_col4\" class=\"data row69 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row69_col5\" class=\"data row69 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row69_col6\" class=\"data row69 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'score_bands': {'type': 'list', 'default': None}, 'drift_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
+              "      <td id=\"T_56dd5_row69_col7\" class=\"data row69 col7\" >['visualization', 'credit_risk', 'scorecard']</td>\n",
+              "      <td id=\"T_56dd5_row69_col8\" class=\"data row69 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row70_col0\" class=\"data row70 col0\" >validmind.ongoing_monitoring.ScorecardHistogramDrift</td>\n",
+              "      <td id=\"T_56dd5_row70_col1\" class=\"data row70 col1\" >Scorecard Histogram Drift</td>\n",
+              "      <td id=\"T_56dd5_row70_col2\" class=\"data row70 col2\" >Compares score distributions between reference and monitoring datasets for each class....</td>\n",
+              "      <td id=\"T_56dd5_row70_col3\" class=\"data row70 col3\" >True</td>\n",
+              "      <td id=\"T_56dd5_row70_col4\" class=\"data row70 col4\" >True</td>\n",
+              "      <td id=\"T_56dd5_row70_col5\" class=\"data row70 col5\" >['datasets']</td>\n",
+              "      <td id=\"T_56dd5_row70_col6\" class=\"data row70 col6\" >{'score_column': {'type': 'str', 'default': 'score'}, 'title': {'type': 'str', 'default': 'Scorecard Histogram Drift'}, 'drift_pct_threshold': {'type': 'float', 'default': 20.0}}</td>\n",
+              "      <td id=\"T_56dd5_row70_col7\" class=\"data row70 col7\" >['visualization', 'credit_risk', 'logistic_regression']</td>\n",
+              "      <td id=\"T_56dd5_row70_col8\" class=\"data row70 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row71_col0\" class=\"data row71 col0\" >validmind.unit_metrics.classification.Accuracy</td>\n",
+              "      <td id=\"T_56dd5_row71_col1\" class=\"data row71 col1\" >Accuracy</td>\n",
+              "      <td id=\"T_56dd5_row71_col2\" class=\"data row71 col2\" >Calculates the accuracy of a model</td>\n",
+              "      <td id=\"T_56dd5_row71_col3\" class=\"data row71 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row71_col4\" class=\"data row71 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row71_col5\" class=\"data row71 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_56dd5_row71_col6\" class=\"data row71 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row71_col7\" class=\"data row71 col7\" >['classification']</td>\n",
+              "      <td id=\"T_56dd5_row71_col8\" class=\"data row71 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row72_col0\" class=\"data row72 col0\" >validmind.unit_metrics.classification.F1</td>\n",
+              "      <td id=\"T_56dd5_row72_col1\" class=\"data row72 col1\" >F1</td>\n",
+              "      <td id=\"T_56dd5_row72_col2\" class=\"data row72 col2\" >Calculates the F1 score for a classification model.</td>\n",
+              "      <td id=\"T_56dd5_row72_col3\" class=\"data row72 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row72_col4\" class=\"data row72 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row72_col5\" class=\"data row72 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row72_col6\" class=\"data row72 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row72_col7\" class=\"data row72 col7\" >['classification']</td>\n",
+              "      <td id=\"T_56dd5_row72_col8\" class=\"data row72 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row73_col0\" class=\"data row73 col0\" >validmind.unit_metrics.classification.Precision</td>\n",
+              "      <td id=\"T_56dd5_row73_col1\" class=\"data row73 col1\" >Precision</td>\n",
+              "      <td id=\"T_56dd5_row73_col2\" class=\"data row73 col2\" >Calculates the precision for a classification model.</td>\n",
+              "      <td id=\"T_56dd5_row73_col3\" class=\"data row73 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row73_col4\" class=\"data row73 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row73_col5\" class=\"data row73 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row73_col6\" class=\"data row73 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row73_col7\" class=\"data row73 col7\" >['classification']</td>\n",
+              "      <td id=\"T_56dd5_row73_col8\" class=\"data row73 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row74_col0\" class=\"data row74 col0\" >validmind.unit_metrics.classification.ROC_AUC</td>\n",
+              "      <td id=\"T_56dd5_row74_col1\" class=\"data row74 col1\" >ROC AUC</td>\n",
+              "      <td id=\"T_56dd5_row74_col2\" class=\"data row74 col2\" >Calculates the ROC AUC for a classification model.</td>\n",
+              "      <td id=\"T_56dd5_row74_col3\" class=\"data row74 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row74_col4\" class=\"data row74 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row74_col5\" class=\"data row74 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row74_col6\" class=\"data row74 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row74_col7\" class=\"data row74 col7\" >['classification']</td>\n",
+              "      <td id=\"T_56dd5_row74_col8\" class=\"data row74 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_56dd5_row75_col0\" class=\"data row75 col0\" >validmind.unit_metrics.classification.Recall</td>\n",
+              "      <td id=\"T_56dd5_row75_col1\" class=\"data row75 col1\" >Recall</td>\n",
+              "      <td id=\"T_56dd5_row75_col2\" class=\"data row75 col2\" >Calculates the recall for a classification model.</td>\n",
+              "      <td id=\"T_56dd5_row75_col3\" class=\"data row75 col3\" >False</td>\n",
+              "      <td id=\"T_56dd5_row75_col4\" class=\"data row75 col4\" >False</td>\n",
+              "      <td id=\"T_56dd5_row75_col5\" class=\"data row75 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_56dd5_row75_col6\" class=\"data row75 col6\" >{}</td>\n",
+              "      <td id=\"T_56dd5_row75_col7\" class=\"data row75 col7\" >['classification']</td>\n",
+              "      <td id=\"T_56dd5_row75_col8\" class=\"data row75 col8\" >['classification']</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n"
+            ],
+            "text/plain": [
+              "<pandas.io.formats.style.Styler at 0x10516c880>"
+            ]
+          },
+          "execution_count": null,
+          "metadata": {},
+          "output_type": "execute_result"
+        }
       ],
-      "text/plain": [
-       "<pandas.io.formats.style.Styler at 0x36a280f40>"
+      "source": [
+        "list_tests(task=\"classification\")"
       ]
-     },
-     "execution_count": 8,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "list_tests(tags=[\"model_performance\", \"visualization\"])"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Use `filter`, `task`, and `tags` together to create more specific queries.\n",
-    "\n",
-    "For example, apply all three to find tests compatible with `sklearn` models, designed for `classification` tasks:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Use the `tags` parameter to find tests based on their tags, such as `model_performance` or `visualization`:"
+      ]
+    },
     {
-     "data": {
-      "text/html": [
-       "<style type=\"text/css\">\n",
-       "#T_36394 th {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "#T_36394_row0_col0, #T_36394_row0_col1, #T_36394_row0_col2, #T_36394_row0_col3, #T_36394_row0_col4, #T_36394_row0_col5, #T_36394_row0_col6, #T_36394_row0_col7, #T_36394_row0_col8, #T_36394_row1_col0, #T_36394_row1_col1, #T_36394_row1_col2, #T_36394_row1_col3, #T_36394_row1_col4, #T_36394_row1_col5, #T_36394_row1_col6, #T_36394_row1_col7, #T_36394_row1_col8, #T_36394_row2_col0, #T_36394_row2_col1, #T_36394_row2_col2, #T_36394_row2_col3, #T_36394_row2_col4, #T_36394_row2_col5, #T_36394_row2_col6, #T_36394_row2_col7, #T_36394_row2_col8, #T_36394_row3_col0, #T_36394_row3_col1, #T_36394_row3_col2, #T_36394_row3_col3, #T_36394_row3_col4, #T_36394_row3_col5, #T_36394_row3_col6, #T_36394_row3_col7, #T_36394_row3_col8, #T_36394_row4_col0, #T_36394_row4_col1, #T_36394_row4_col2, #T_36394_row4_col3, #T_36394_row4_col4, #T_36394_row4_col5, #T_36394_row4_col6, #T_36394_row4_col7, #T_36394_row4_col8, #T_36394_row5_col0, #T_36394_row5_col1, #T_36394_row5_col2, #T_36394_row5_col3, #T_36394_row5_col4, #T_36394_row5_col5, #T_36394_row5_col6, #T_36394_row5_col7, #T_36394_row5_col8 {\n",
-       "  text-align: left;\n",
-       "}\n",
-       "</style>\n",
-       "<table id=\"T_36394\">\n",
-       "  <thead>\n",
-       "    <tr>\n",
-       "      <th id=\"T_36394_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
-       "      <th id=\"T_36394_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
-       "      <th id=\"T_36394_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
-       "      <th id=\"T_36394_level0_col3\" class=\"col_heading level0 col3\" >Has Figure</th>\n",
-       "      <th id=\"T_36394_level0_col4\" class=\"col_heading level0 col4\" >Has Table</th>\n",
-       "      <th id=\"T_36394_level0_col5\" class=\"col_heading level0 col5\" >Required Inputs</th>\n",
-       "      <th id=\"T_36394_level0_col6\" class=\"col_heading level0 col6\" >Params</th>\n",
-       "      <th id=\"T_36394_level0_col7\" class=\"col_heading level0 col7\" >Tags</th>\n",
-       "      <th id=\"T_36394_level0_col8\" class=\"col_heading level0 col8\" >Tasks</th>\n",
-       "    </tr>\n",
-       "  </thead>\n",
-       "  <tbody>\n",
-       "    <tr>\n",
-       "      <td id=\"T_36394_row0_col0\" class=\"data row0 col0\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
-       "      <td id=\"T_36394_row0_col1\" class=\"data row0 col1\" >Confusion Matrix</td>\n",
-       "      <td id=\"T_36394_row0_col2\" class=\"data row0 col2\" >Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix...</td>\n",
-       "      <td id=\"T_36394_row0_col3\" class=\"data row0 col3\" >True</td>\n",
-       "      <td id=\"T_36394_row0_col4\" class=\"data row0 col4\" >False</td>\n",
-       "      <td id=\"T_36394_row0_col5\" class=\"data row0 col5\" >['dataset', 'model']</td>\n",
-       "      <td id=\"T_36394_row0_col6\" class=\"data row0 col6\" >{'threshold': {'type': 'float', 'default': 0.5}}</td>\n",
-       "      <td id=\"T_36394_row0_col7\" class=\"data row0 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_36394_row0_col8\" class=\"data row0 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_36394_row1_col0\" class=\"data row1 col0\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
-       "      <td id=\"T_36394_row1_col1\" class=\"data row1 col1\" >Precision Recall Curve</td>\n",
-       "      <td id=\"T_36394_row1_col2\" class=\"data row1 col2\" >Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve....</td>\n",
-       "      <td id=\"T_36394_row1_col3\" class=\"data row1 col3\" >True</td>\n",
-       "      <td id=\"T_36394_row1_col4\" class=\"data row1 col4\" >False</td>\n",
-       "      <td id=\"T_36394_row1_col5\" class=\"data row1 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_36394_row1_col6\" class=\"data row1 col6\" >{}</td>\n",
-       "      <td id=\"T_36394_row1_col7\" class=\"data row1 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_36394_row1_col8\" class=\"data row1 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_36394_row2_col0\" class=\"data row2 col0\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
-       "      <td id=\"T_36394_row2_col1\" class=\"data row2 col1\" >ROC Curve</td>\n",
-       "      <td id=\"T_36394_row2_col2\" class=\"data row2 col2\" >Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic...</td>\n",
-       "      <td id=\"T_36394_row2_col3\" class=\"data row2 col3\" >True</td>\n",
-       "      <td id=\"T_36394_row2_col4\" class=\"data row2 col4\" >False</td>\n",
-       "      <td id=\"T_36394_row2_col5\" class=\"data row2 col5\" >['model', 'dataset']</td>\n",
-       "      <td id=\"T_36394_row2_col6\" class=\"data row2 col6\" >{}</td>\n",
-       "      <td id=\"T_36394_row2_col7\" class=\"data row2 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_36394_row2_col8\" class=\"data row2 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_36394_row3_col0\" class=\"data row3 col0\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
-       "      <td id=\"T_36394_row3_col1\" class=\"data row3 col1\" >Training Test Degradation</td>\n",
-       "      <td id=\"T_36394_row3_col2\" class=\"data row3 col2\" >Tests if model performance degradation between training and test datasets exceeds a predefined threshold....</td>\n",
-       "      <td id=\"T_36394_row3_col3\" class=\"data row3 col3\" >False</td>\n",
-       "      <td id=\"T_36394_row3_col4\" class=\"data row3 col4\" >True</td>\n",
-       "      <td id=\"T_36394_row3_col5\" class=\"data row3 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_36394_row3_col6\" class=\"data row3 col6\" >{'max_threshold': {'type': 'float', 'default': 0.1}}</td>\n",
-       "      <td id=\"T_36394_row3_col7\" class=\"data row3 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_36394_row3_col8\" class=\"data row3 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_36394_row4_col0\" class=\"data row4 col0\" >validmind.ongoing_monitoring.CalibrationCurveDrift</td>\n",
-       "      <td id=\"T_36394_row4_col1\" class=\"data row4 col1\" >Calibration Curve Drift</td>\n",
-       "      <td id=\"T_36394_row4_col2\" class=\"data row4 col2\" >Evaluates changes in probability calibration between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_36394_row4_col3\" class=\"data row4 col3\" >True</td>\n",
-       "      <td id=\"T_36394_row4_col4\" class=\"data row4 col4\" >True</td>\n",
-       "      <td id=\"T_36394_row4_col5\" class=\"data row4 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_36394_row4_col6\" class=\"data row4 col6\" >{'n_bins': {'type': 'int', 'default': 10}, 'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
-       "      <td id=\"T_36394_row4_col7\" class=\"data row4 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_36394_row4_col8\" class=\"data row4 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "    <tr>\n",
-       "      <td id=\"T_36394_row5_col0\" class=\"data row5 col0\" >validmind.ongoing_monitoring.ROCCurveDrift</td>\n",
-       "      <td id=\"T_36394_row5_col1\" class=\"data row5 col1\" >ROC Curve Drift</td>\n",
-       "      <td id=\"T_36394_row5_col2\" class=\"data row5 col2\" >Compares ROC curves between reference and monitoring datasets....</td>\n",
-       "      <td id=\"T_36394_row5_col3\" class=\"data row5 col3\" >True</td>\n",
-       "      <td id=\"T_36394_row5_col4\" class=\"data row5 col4\" >False</td>\n",
-       "      <td id=\"T_36394_row5_col5\" class=\"data row5 col5\" >['datasets', 'model']</td>\n",
-       "      <td id=\"T_36394_row5_col6\" class=\"data row5 col6\" >{}</td>\n",
-       "      <td id=\"T_36394_row5_col7\" class=\"data row5 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
-       "      <td id=\"T_36394_row5_col8\" class=\"data row5 col8\" >['classification', 'text_classification']</td>\n",
-       "    </tr>\n",
-       "  </tbody>\n",
-       "</table>\n"
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [
+        {
+          "data": {
+            "text/html": [
+              "<style type=\"text/css\">\n",
+              "#T_4d8bf th {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "#T_4d8bf_row0_col0, #T_4d8bf_row0_col1, #T_4d8bf_row0_col2, #T_4d8bf_row0_col3, #T_4d8bf_row0_col4, #T_4d8bf_row0_col5, #T_4d8bf_row0_col6, #T_4d8bf_row0_col7, #T_4d8bf_row0_col8, #T_4d8bf_row1_col0, #T_4d8bf_row1_col1, #T_4d8bf_row1_col2, #T_4d8bf_row1_col3, #T_4d8bf_row1_col4, #T_4d8bf_row1_col5, #T_4d8bf_row1_col6, #T_4d8bf_row1_col7, #T_4d8bf_row1_col8, #T_4d8bf_row2_col0, #T_4d8bf_row2_col1, #T_4d8bf_row2_col2, #T_4d8bf_row2_col3, #T_4d8bf_row2_col4, #T_4d8bf_row2_col5, #T_4d8bf_row2_col6, #T_4d8bf_row2_col7, #T_4d8bf_row2_col8, #T_4d8bf_row3_col0, #T_4d8bf_row3_col1, #T_4d8bf_row3_col2, #T_4d8bf_row3_col3, #T_4d8bf_row3_col4, #T_4d8bf_row3_col5, #T_4d8bf_row3_col6, #T_4d8bf_row3_col7, #T_4d8bf_row3_col8, #T_4d8bf_row4_col0, #T_4d8bf_row4_col1, #T_4d8bf_row4_col2, #T_4d8bf_row4_col3, #T_4d8bf_row4_col4, #T_4d8bf_row4_col5, #T_4d8bf_row4_col6, #T_4d8bf_row4_col7, #T_4d8bf_row4_col8, #T_4d8bf_row5_col0, #T_4d8bf_row5_col1, #T_4d8bf_row5_col2, #T_4d8bf_row5_col3, #T_4d8bf_row5_col4, #T_4d8bf_row5_col5, #T_4d8bf_row5_col6, #T_4d8bf_row5_col7, #T_4d8bf_row5_col8, #T_4d8bf_row6_col0, #T_4d8bf_row6_col1, #T_4d8bf_row6_col2, #T_4d8bf_row6_col3, #T_4d8bf_row6_col4, #T_4d8bf_row6_col5, #T_4d8bf_row6_col6, #T_4d8bf_row6_col7, #T_4d8bf_row6_col8 {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "</style>\n",
+              "<table id=\"T_4d8bf\">\n",
+              "  <thead>\n",
+              "    <tr>\n",
+              "      <th id=\"T_4d8bf_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
+              "      <th id=\"T_4d8bf_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
+              "      <th id=\"T_4d8bf_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
+              "      <th id=\"T_4d8bf_level0_col3\" class=\"col_heading level0 col3\" >Has Figure</th>\n",
+              "      <th id=\"T_4d8bf_level0_col4\" class=\"col_heading level0 col4\" >Has Table</th>\n",
+              "      <th id=\"T_4d8bf_level0_col5\" class=\"col_heading level0 col5\" >Required Inputs</th>\n",
+              "      <th id=\"T_4d8bf_level0_col6\" class=\"col_heading level0 col6\" >Params</th>\n",
+              "      <th id=\"T_4d8bf_level0_col7\" class=\"col_heading level0 col7\" >Tags</th>\n",
+              "      <th id=\"T_4d8bf_level0_col8\" class=\"col_heading level0 col8\" >Tasks</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <td id=\"T_4d8bf_row0_col0\" class=\"data row0 col0\" >validmind.model_validation.RegressionResidualsPlot</td>\n",
+              "      <td id=\"T_4d8bf_row0_col1\" class=\"data row0 col1\" >Regression Residuals Plot</td>\n",
+              "      <td id=\"T_4d8bf_row0_col2\" class=\"data row0 col2\" >Evaluates regression model performance using residual distribution and actual vs. predicted plots....</td>\n",
+              "      <td id=\"T_4d8bf_row0_col3\" class=\"data row0 col3\" >True</td>\n",
+              "      <td id=\"T_4d8bf_row0_col4\" class=\"data row0 col4\" >False</td>\n",
+              "      <td id=\"T_4d8bf_row0_col5\" class=\"data row0 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_4d8bf_row0_col6\" class=\"data row0 col6\" >{'bin_size': {'type': 'float', 'default': 0.1}}</td>\n",
+              "      <td id=\"T_4d8bf_row0_col7\" class=\"data row0 col7\" >['model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_4d8bf_row0_col8\" class=\"data row0 col8\" >['regression']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_4d8bf_row1_col0\" class=\"data row1 col0\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
+              "      <td id=\"T_4d8bf_row1_col1\" class=\"data row1 col1\" >Confusion Matrix</td>\n",
+              "      <td id=\"T_4d8bf_row1_col2\" class=\"data row1 col2\" >Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix...</td>\n",
+              "      <td id=\"T_4d8bf_row1_col3\" class=\"data row1 col3\" >True</td>\n",
+              "      <td id=\"T_4d8bf_row1_col4\" class=\"data row1 col4\" >False</td>\n",
+              "      <td id=\"T_4d8bf_row1_col5\" class=\"data row1 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_4d8bf_row1_col6\" class=\"data row1 col6\" >{'threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_4d8bf_row1_col7\" class=\"data row1 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_4d8bf_row1_col8\" class=\"data row1 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_4d8bf_row2_col0\" class=\"data row2 col0\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
+              "      <td id=\"T_4d8bf_row2_col1\" class=\"data row2 col1\" >Precision Recall Curve</td>\n",
+              "      <td id=\"T_4d8bf_row2_col2\" class=\"data row2 col2\" >Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve....</td>\n",
+              "      <td id=\"T_4d8bf_row2_col3\" class=\"data row2 col3\" >True</td>\n",
+              "      <td id=\"T_4d8bf_row2_col4\" class=\"data row2 col4\" >False</td>\n",
+              "      <td id=\"T_4d8bf_row2_col5\" class=\"data row2 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_4d8bf_row2_col6\" class=\"data row2 col6\" >{}</td>\n",
+              "      <td id=\"T_4d8bf_row2_col7\" class=\"data row2 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_4d8bf_row2_col8\" class=\"data row2 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_4d8bf_row3_col0\" class=\"data row3 col0\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
+              "      <td id=\"T_4d8bf_row3_col1\" class=\"data row3 col1\" >ROC Curve</td>\n",
+              "      <td id=\"T_4d8bf_row3_col2\" class=\"data row3 col2\" >Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic...</td>\n",
+              "      <td id=\"T_4d8bf_row3_col3\" class=\"data row3 col3\" >True</td>\n",
+              "      <td id=\"T_4d8bf_row3_col4\" class=\"data row3 col4\" >False</td>\n",
+              "      <td id=\"T_4d8bf_row3_col5\" class=\"data row3 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_4d8bf_row3_col6\" class=\"data row3 col6\" >{}</td>\n",
+              "      <td id=\"T_4d8bf_row3_col7\" class=\"data row3 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_4d8bf_row3_col8\" class=\"data row3 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_4d8bf_row4_col0\" class=\"data row4 col0\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
+              "      <td id=\"T_4d8bf_row4_col1\" class=\"data row4 col1\" >Training Test Degradation</td>\n",
+              "      <td id=\"T_4d8bf_row4_col2\" class=\"data row4 col2\" >Tests if model performance degradation between training and test datasets exceeds a predefined threshold....</td>\n",
+              "      <td id=\"T_4d8bf_row4_col3\" class=\"data row4 col3\" >False</td>\n",
+              "      <td id=\"T_4d8bf_row4_col4\" class=\"data row4 col4\" >True</td>\n",
+              "      <td id=\"T_4d8bf_row4_col5\" class=\"data row4 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_4d8bf_row4_col6\" class=\"data row4 col6\" >{'max_threshold': {'type': 'float', 'default': 0.1}}</td>\n",
+              "      <td id=\"T_4d8bf_row4_col7\" class=\"data row4 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_4d8bf_row4_col8\" class=\"data row4 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_4d8bf_row5_col0\" class=\"data row5 col0\" >validmind.ongoing_monitoring.CalibrationCurveDrift</td>\n",
+              "      <td id=\"T_4d8bf_row5_col1\" class=\"data row5 col1\" >Calibration Curve Drift</td>\n",
+              "      <td id=\"T_4d8bf_row5_col2\" class=\"data row5 col2\" >Evaluates changes in probability calibration between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_4d8bf_row5_col3\" class=\"data row5 col3\" >True</td>\n",
+              "      <td id=\"T_4d8bf_row5_col4\" class=\"data row5 col4\" >True</td>\n",
+              "      <td id=\"T_4d8bf_row5_col5\" class=\"data row5 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_4d8bf_row5_col6\" class=\"data row5 col6\" >{'n_bins': {'type': 'int', 'default': 10}, 'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
+              "      <td id=\"T_4d8bf_row5_col7\" class=\"data row5 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_4d8bf_row5_col8\" class=\"data row5 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_4d8bf_row6_col0\" class=\"data row6 col0\" >validmind.ongoing_monitoring.ROCCurveDrift</td>\n",
+              "      <td id=\"T_4d8bf_row6_col1\" class=\"data row6 col1\" >ROC Curve Drift</td>\n",
+              "      <td id=\"T_4d8bf_row6_col2\" class=\"data row6 col2\" >Compares ROC curves between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_4d8bf_row6_col3\" class=\"data row6 col3\" >True</td>\n",
+              "      <td id=\"T_4d8bf_row6_col4\" class=\"data row6 col4\" >False</td>\n",
+              "      <td id=\"T_4d8bf_row6_col5\" class=\"data row6 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_4d8bf_row6_col6\" class=\"data row6 col6\" >{}</td>\n",
+              "      <td id=\"T_4d8bf_row6_col7\" class=\"data row6 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_4d8bf_row6_col8\" class=\"data row6 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n"
+            ],
+            "text/plain": [
+              "<pandas.io.formats.style.Styler at 0x36a280f40>"
+            ]
+          },
+          "execution_count": null,
+          "metadata": {},
+          "output_type": "execute_result"
+        }
       ],
-      "text/plain": [
-       "<pandas.io.formats.style.Styler at 0x380009c40>"
+      "source": [
+        "list_tests(tags=[\"model_performance\", \"visualization\"])"
       ]
-     },
-     "execution_count": 9,
-     "metadata": {},
-     "output_type": "execute_result"
-    }
-   ],
-   "source": [
-    "list_tests(filter=\"sklearn\",\n",
-    "    tags=[\"model_performance\", \"visualization\"], task=\"classification\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Store test sets for use\n",
-    "\n",
-    "Once you've identified specific sets of tests you'd like to run, you can store the tests in variables, enabling you to easily reuse those tests in later steps.\n",
-    "\n",
-    "For example, if you're validating a summarization model, use [`list_tests()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to retrieve all tests tagged for text summarization and save them to `text_summarization_tests` for later use:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Use `filter`, `task`, and `tags` together to create more specific queries.\n",
+        "\n",
+        "For example, apply all three to find tests compatible with `sklearn` models, designed for `classification` tasks:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [
+        {
+          "data": {
+            "text/html": [
+              "<style type=\"text/css\">\n",
+              "#T_36394 th {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "#T_36394_row0_col0, #T_36394_row0_col1, #T_36394_row0_col2, #T_36394_row0_col3, #T_36394_row0_col4, #T_36394_row0_col5, #T_36394_row0_col6, #T_36394_row0_col7, #T_36394_row0_col8, #T_36394_row1_col0, #T_36394_row1_col1, #T_36394_row1_col2, #T_36394_row1_col3, #T_36394_row1_col4, #T_36394_row1_col5, #T_36394_row1_col6, #T_36394_row1_col7, #T_36394_row1_col8, #T_36394_row2_col0, #T_36394_row2_col1, #T_36394_row2_col2, #T_36394_row2_col3, #T_36394_row2_col4, #T_36394_row2_col5, #T_36394_row2_col6, #T_36394_row2_col7, #T_36394_row2_col8, #T_36394_row3_col0, #T_36394_row3_col1, #T_36394_row3_col2, #T_36394_row3_col3, #T_36394_row3_col4, #T_36394_row3_col5, #T_36394_row3_col6, #T_36394_row3_col7, #T_36394_row3_col8, #T_36394_row4_col0, #T_36394_row4_col1, #T_36394_row4_col2, #T_36394_row4_col3, #T_36394_row4_col4, #T_36394_row4_col5, #T_36394_row4_col6, #T_36394_row4_col7, #T_36394_row4_col8, #T_36394_row5_col0, #T_36394_row5_col1, #T_36394_row5_col2, #T_36394_row5_col3, #T_36394_row5_col4, #T_36394_row5_col5, #T_36394_row5_col6, #T_36394_row5_col7, #T_36394_row5_col8 {\n",
+              "  text-align: left;\n",
+              "}\n",
+              "</style>\n",
+              "<table id=\"T_36394\">\n",
+              "  <thead>\n",
+              "    <tr>\n",
+              "      <th id=\"T_36394_level0_col0\" class=\"col_heading level0 col0\" >ID</th>\n",
+              "      <th id=\"T_36394_level0_col1\" class=\"col_heading level0 col1\" >Name</th>\n",
+              "      <th id=\"T_36394_level0_col2\" class=\"col_heading level0 col2\" >Description</th>\n",
+              "      <th id=\"T_36394_level0_col3\" class=\"col_heading level0 col3\" >Has Figure</th>\n",
+              "      <th id=\"T_36394_level0_col4\" class=\"col_heading level0 col4\" >Has Table</th>\n",
+              "      <th id=\"T_36394_level0_col5\" class=\"col_heading level0 col5\" >Required Inputs</th>\n",
+              "      <th id=\"T_36394_level0_col6\" class=\"col_heading level0 col6\" >Params</th>\n",
+              "      <th id=\"T_36394_level0_col7\" class=\"col_heading level0 col7\" >Tags</th>\n",
+              "      <th id=\"T_36394_level0_col8\" class=\"col_heading level0 col8\" >Tasks</th>\n",
+              "    </tr>\n",
+              "  </thead>\n",
+              "  <tbody>\n",
+              "    <tr>\n",
+              "      <td id=\"T_36394_row0_col0\" class=\"data row0 col0\" >validmind.model_validation.sklearn.ConfusionMatrix</td>\n",
+              "      <td id=\"T_36394_row0_col1\" class=\"data row0 col1\" >Confusion Matrix</td>\n",
+              "      <td id=\"T_36394_row0_col2\" class=\"data row0 col2\" >Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix...</td>\n",
+              "      <td id=\"T_36394_row0_col3\" class=\"data row0 col3\" >True</td>\n",
+              "      <td id=\"T_36394_row0_col4\" class=\"data row0 col4\" >False</td>\n",
+              "      <td id=\"T_36394_row0_col5\" class=\"data row0 col5\" >['dataset', 'model']</td>\n",
+              "      <td id=\"T_36394_row0_col6\" class=\"data row0 col6\" >{'threshold': {'type': 'float', 'default': 0.5}}</td>\n",
+              "      <td id=\"T_36394_row0_col7\" class=\"data row0 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_36394_row0_col8\" class=\"data row0 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_36394_row1_col0\" class=\"data row1 col0\" >validmind.model_validation.sklearn.PrecisionRecallCurve</td>\n",
+              "      <td id=\"T_36394_row1_col1\" class=\"data row1 col1\" >Precision Recall Curve</td>\n",
+              "      <td id=\"T_36394_row1_col2\" class=\"data row1 col2\" >Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve....</td>\n",
+              "      <td id=\"T_36394_row1_col3\" class=\"data row1 col3\" >True</td>\n",
+              "      <td id=\"T_36394_row1_col4\" class=\"data row1 col4\" >False</td>\n",
+              "      <td id=\"T_36394_row1_col5\" class=\"data row1 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_36394_row1_col6\" class=\"data row1 col6\" >{}</td>\n",
+              "      <td id=\"T_36394_row1_col7\" class=\"data row1 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_36394_row1_col8\" class=\"data row1 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_36394_row2_col0\" class=\"data row2 col0\" >validmind.model_validation.sklearn.ROCCurve</td>\n",
+              "      <td id=\"T_36394_row2_col1\" class=\"data row2 col1\" >ROC Curve</td>\n",
+              "      <td id=\"T_36394_row2_col2\" class=\"data row2 col2\" >Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic...</td>\n",
+              "      <td id=\"T_36394_row2_col3\" class=\"data row2 col3\" >True</td>\n",
+              "      <td id=\"T_36394_row2_col4\" class=\"data row2 col4\" >False</td>\n",
+              "      <td id=\"T_36394_row2_col5\" class=\"data row2 col5\" >['model', 'dataset']</td>\n",
+              "      <td id=\"T_36394_row2_col6\" class=\"data row2 col6\" >{}</td>\n",
+              "      <td id=\"T_36394_row2_col7\" class=\"data row2 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_36394_row2_col8\" class=\"data row2 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_36394_row3_col0\" class=\"data row3 col0\" >validmind.model_validation.sklearn.TrainingTestDegradation</td>\n",
+              "      <td id=\"T_36394_row3_col1\" class=\"data row3 col1\" >Training Test Degradation</td>\n",
+              "      <td id=\"T_36394_row3_col2\" class=\"data row3 col2\" >Tests if model performance degradation between training and test datasets exceeds a predefined threshold....</td>\n",
+              "      <td id=\"T_36394_row3_col3\" class=\"data row3 col3\" >False</td>\n",
+              "      <td id=\"T_36394_row3_col4\" class=\"data row3 col4\" >True</td>\n",
+              "      <td id=\"T_36394_row3_col5\" class=\"data row3 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_36394_row3_col6\" class=\"data row3 col6\" >{'max_threshold': {'type': 'float', 'default': 0.1}}</td>\n",
+              "      <td id=\"T_36394_row3_col7\" class=\"data row3 col7\" >['sklearn', 'binary_classification', 'multiclass_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_36394_row3_col8\" class=\"data row3 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_36394_row4_col0\" class=\"data row4 col0\" >validmind.ongoing_monitoring.CalibrationCurveDrift</td>\n",
+              "      <td id=\"T_36394_row4_col1\" class=\"data row4 col1\" >Calibration Curve Drift</td>\n",
+              "      <td id=\"T_36394_row4_col2\" class=\"data row4 col2\" >Evaluates changes in probability calibration between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_36394_row4_col3\" class=\"data row4 col3\" >True</td>\n",
+              "      <td id=\"T_36394_row4_col4\" class=\"data row4 col4\" >True</td>\n",
+              "      <td id=\"T_36394_row4_col5\" class=\"data row4 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_36394_row4_col6\" class=\"data row4 col6\" >{'n_bins': {'type': 'int', 'default': 10}, 'drift_pct_threshold': {'type': 'float', 'default': 20}}</td>\n",
+              "      <td id=\"T_36394_row4_col7\" class=\"data row4 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_36394_row4_col8\" class=\"data row4 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "    <tr>\n",
+              "      <td id=\"T_36394_row5_col0\" class=\"data row5 col0\" >validmind.ongoing_monitoring.ROCCurveDrift</td>\n",
+              "      <td id=\"T_36394_row5_col1\" class=\"data row5 col1\" >ROC Curve Drift</td>\n",
+              "      <td id=\"T_36394_row5_col2\" class=\"data row5 col2\" >Compares ROC curves between reference and monitoring datasets....</td>\n",
+              "      <td id=\"T_36394_row5_col3\" class=\"data row5 col3\" >True</td>\n",
+              "      <td id=\"T_36394_row5_col4\" class=\"data row5 col4\" >False</td>\n",
+              "      <td id=\"T_36394_row5_col5\" class=\"data row5 col5\" >['datasets', 'model']</td>\n",
+              "      <td id=\"T_36394_row5_col6\" class=\"data row5 col6\" >{}</td>\n",
+              "      <td id=\"T_36394_row5_col7\" class=\"data row5 col7\" >['sklearn', 'binary_classification', 'model_performance', 'visualization']</td>\n",
+              "      <td id=\"T_36394_row5_col8\" class=\"data row5 col8\" >['classification', 'text_classification']</td>\n",
+              "    </tr>\n",
+              "  </tbody>\n",
+              "</table>\n"
+            ],
+            "text/plain": [
+              "<pandas.io.formats.style.Styler at 0x380009c40>"
+            ]
+          },
+          "execution_count": null,
+          "metadata": {},
+          "output_type": "execute_result"
+        }
+      ],
+      "source": [
+        "list_tests(filter=\"sklearn\",\n",
+        "    tags=[\"model_performance\", \"visualization\"], task=\"classification\"\n",
+        ")"
+      ]
+    },
     {
-     "data": {
-      "text/plain": [
-       "['validmind.data_validation.DatasetDescription',\n",
-       " 'validmind.data_validation.DatasetSplit',\n",
-       " 'validmind.data_validation.nlp.CommonWords',\n",
-       " 'validmind.data_validation.nlp.Hashtags',\n",
-       " 'validmind.data_validation.nlp.LanguageDetection',\n",
-       " 'validmind.data_validation.nlp.Mentions',\n",
-       " 'validmind.data_validation.nlp.Punctuations',\n",
-       " 'validmind.data_validation.nlp.StopWords',\n",
-       " 'validmind.data_validation.nlp.TextDescription',\n",
-       " 'validmind.model_validation.BertScore',\n",
-       " 'validmind.model_validation.BleuScore',\n",
-       " 'validmind.model_validation.ContextualRecall',\n",
-       " 'validmind.model_validation.MeteorScore',\n",
-       " 'validmind.model_validation.RegardScore',\n",
-       " 'validmind.model_validation.RougeScore',\n",
-       " 'validmind.model_validation.TokenDisparity',\n",
-       " 'validmind.model_validation.ToxicityScore',\n",
-       " 'validmind.model_validation.embeddings.CosineSimilarityComparison',\n",
-       " 'validmind.model_validation.embeddings.CosineSimilarityHeatmap',\n",
-       " 'validmind.model_validation.embeddings.EuclideanDistanceComparison',\n",
-       " 'validmind.model_validation.embeddings.EuclideanDistanceHeatmap',\n",
-       " 'validmind.model_validation.embeddings.PCAComponentsPairwisePlots',\n",
-       " 'validmind.model_validation.embeddings.TSNEComponentsPairwisePlots',\n",
-       " 'validmind.model_validation.ragas.AnswerCorrectness',\n",
-       " 'validmind.model_validation.ragas.AspectCritic',\n",
-       " 'validmind.model_validation.ragas.ContextEntityRecall',\n",
-       " 'validmind.model_validation.ragas.ContextPrecision',\n",
-       " 'validmind.model_validation.ragas.ContextPrecisionWithoutReference',\n",
-       " 'validmind.model_validation.ragas.ContextRecall',\n",
-       " 'validmind.model_validation.ragas.Faithfulness',\n",
-       " 'validmind.model_validation.ragas.NoiseSensitivity',\n",
-       " 'validmind.model_validation.ragas.ResponseRelevancy',\n",
-       " 'validmind.model_validation.ragas.SemanticSimilarity',\n",
-       " 'validmind.prompt_validation.Bias',\n",
-       " 'validmind.prompt_validation.Clarity',\n",
-       " 'validmind.prompt_validation.Conciseness',\n",
-       " 'validmind.prompt_validation.Delimitation',\n",
-       " 'validmind.prompt_validation.NegativeInstruction',\n",
-       " 'validmind.prompt_validation.Robustness',\n",
-       " 'validmind.prompt_validation.Specificity']"
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Store test sets for use\n",
+        "\n",
+        "Once you've identified specific sets of tests you'd like to run, you can store the tests in variables, enabling you to easily reuse those tests in later steps.\n",
+        "\n",
+        "For example, if you're validating a summarization model, use [`list_tests()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to retrieve all tests tagged for text summarization and save them to `text_summarization_tests` for later use:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [
+        {
+          "data": {
+            "text/plain": [
+              "['validmind.data_validation.DatasetDescription',\n",
+              " 'validmind.data_validation.DatasetSplit',\n",
+              " 'validmind.data_validation.nlp.CommonWords',\n",
+              " 'validmind.data_validation.nlp.Hashtags',\n",
+              " 'validmind.data_validation.nlp.LanguageDetection',\n",
+              " 'validmind.data_validation.nlp.Mentions',\n",
+              " 'validmind.data_validation.nlp.Punctuations',\n",
+              " 'validmind.data_validation.nlp.StopWords',\n",
+              " 'validmind.data_validation.nlp.TextDescription',\n",
+              " 'validmind.model_validation.BertScore',\n",
+              " 'validmind.model_validation.BleuScore',\n",
+              " 'validmind.model_validation.ContextualRecall',\n",
+              " 'validmind.model_validation.MeteorScore',\n",
+              " 'validmind.model_validation.RegardScore',\n",
+              " 'validmind.model_validation.RougeScore',\n",
+              " 'validmind.model_validation.TokenDisparity',\n",
+              " 'validmind.model_validation.ToxicityScore',\n",
+              " 'validmind.model_validation.embeddings.CosineSimilarityComparison',\n",
+              " 'validmind.model_validation.embeddings.CosineSimilarityHeatmap',\n",
+              " 'validmind.model_validation.embeddings.EuclideanDistanceComparison',\n",
+              " 'validmind.model_validation.embeddings.EuclideanDistanceHeatmap',\n",
+              " 'validmind.model_validation.embeddings.PCAComponentsPairwisePlots',\n",
+              " 'validmind.model_validation.embeddings.TSNEComponentsPairwisePlots',\n",
+              " 'validmind.model_validation.ragas.AnswerCorrectness',\n",
+              " 'validmind.model_validation.ragas.AspectCritic',\n",
+              " 'validmind.model_validation.ragas.ContextEntityRecall',\n",
+              " 'validmind.model_validation.ragas.ContextPrecision',\n",
+              " 'validmind.model_validation.ragas.ContextPrecisionWithoutReference',\n",
+              " 'validmind.model_validation.ragas.ContextRecall',\n",
+              " 'validmind.model_validation.ragas.Faithfulness',\n",
+              " 'validmind.model_validation.ragas.NoiseSensitivity',\n",
+              " 'validmind.model_validation.ragas.ResponseRelevancy',\n",
+              " 'validmind.model_validation.ragas.SemanticSimilarity',\n",
+              " 'validmind.prompt_validation.Bias',\n",
+              " 'validmind.prompt_validation.Clarity',\n",
+              " 'validmind.prompt_validation.Conciseness',\n",
+              " 'validmind.prompt_validation.Delimitation',\n",
+              " 'validmind.prompt_validation.NegativeInstruction',\n",
+              " 'validmind.prompt_validation.Robustness',\n",
+              " 'validmind.prompt_validation.Specificity']"
+            ]
+          },
+          "execution_count": null,
+          "metadata": {},
+          "output_type": "execute_result"
+        }
+      ],
+      "source": [
+        "text_summarization_tests = list_tests(task=\"text_summarization\", pretty=False)\n",
+        "text_summarization_tests"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "Now that you know how to browse and filter tests in the ValidMind Library, you’re ready to take the next step. Use the test IDs you’ve selected to either run individual tests or batch run them with custom test suites.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn about the test suites available in the ValidMind Library.</b></span>\n",
+        "<br></br>\n",
+        "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_test_suites.html\" style=\"color: #DE257E;\"><b>Explore test suites</b></a> notebook for more code examples and usage of key functions.</div>\n",
+        "\n",
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you'll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "%pip show validmind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-fb6994d364c54669b356f7a2278d6480",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
       ]
-     },
-     "execution_count": 10,
-     "metadata": {},
-     "output_type": "execute_result"
     }
-   ],
-   "source": [
-    "text_summarization_tests = list_tests(task=\"text_summarization\", pretty=False)\n",
-    "text_summarization_tests"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "Now that you know how to browse and filter tests in the ValidMind Library, you’re ready to take the next step. Use the test IDs you’ve selected to either run individual tests or batch run them with custom test suites.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn about the tests suites available in the ValidMind Library.</b></span>\n",
-    "<br></br>\n",
-    "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_test_suites.html\" style=\"color: #DE257E;\"><b>Explore test suites</b></a> notebook for more code examples and usage of key functions.</div>\n",
-    "\n",
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you'll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-fb6994d364c54669b356f7a2278d6480",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
+    }
   },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 4
+  "nbformat": 4,
+  "nbformat_minor": 4
 }
diff --git a/site/notebooks/how_to/tests/run_tests/1-run_dataset-based_tests.ipynb b/site/notebooks/how_to/tests/run_tests/1-run_dataset-based_tests.ipynb
new file mode 100644
index 0000000000..ae4b200aa6
--- /dev/null
+++ b/site/notebooks/how_to/tests/run_tests/1-run_dataset-based_tests.ipynb
@@ -0,0 +1,785 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Run dataset-based tests\n",
+        "\n",
+        "Learn how to use the ValidMind Library to run tests that take any dataset or record (model) as input. Identify specific tests to run, initialize ValidMind dataset objects in preparation for passing them to your tests, and then run the chosen tests — generating outputs that can be automatically logged to your documentation in the ValidMind Platform."
+      ],
+      "id": "976bb3d9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_3__)    \n",
+        "- [Explore a ValidMind test](#toc3__)    \n",
+        "- [Working with ValidMind datasets](#toc4__)    \n",
+        "  - [Create a sample dataset](#toc4_1__)    \n",
+        "  - [Initialize the ValidMind dataset](#toc4_2__)    \n",
+        "- [Running ValidMind tests](#toc5__)    \n",
+        "  - [Run test using ValidMind dataset](#toc5_1__)    \n",
+        "  - [Run and log test requiring parameters](#toc5_2__)    \n",
+        "    - [Log ClassImbalance test with default parameters](#toc5_2_1__)    \n",
+        "    - [Log ClassImbalance test with custom parameters](#toc5_2_2__)    \n",
+        "- [Work with test results](#toc6__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Discover more learning resources](#toc7_1__)    \n",
+        "- [Upgrade ValidMind](#toc8__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "8c4d9b9c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models. \n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators."
+      ],
+      "id": "f49237b3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ],
+      "id": "907737bd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ],
+      "id": "115cdfa7"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "c3051ca8"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "656db165"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ],
+      "id": "30fa24d7"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "524602cc"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ],
+      "id": "b38fc5f6"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook.\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ],
+      "id": "451c5a1b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "0e55ac40"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "3545620d"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0ed9e84d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ],
+      "id": "8fea9380"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e44a2345"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Explore a ValidMind test\n",
+        "\n",
+        "Before we run a test, use [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to return information on out-of-the-box tests available in the ValidMind Library.\n",
+        "\n",
+        "Let's assume you want to generate the *Pearson correlation matrix* for a dataset. A Pearson correlation matrix is a table that shows the [Pearson correlation coefficients](https://en.wikipedia.org/wiki/Pearson_correlation_coefficient) between several variables.\n",
+        "\n",
+        "We'll pass in a `filter` to the `list_tests` function to find the test ID for the Pearson correlation matrix:"
+      ],
+      "id": "43ee2f43"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests(filter=\"PearsonCorrelationMatrix\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "a63e7a43"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We've identified from the output that the test ID for the Pearson correlation matrix test is `validmind.data_validation.PearsonCorrelationMatrix`.\n",
+        "\n",
+        "Use this ID combined with [the `describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) to retrieve more information about the test, including its **Required Inputs**:"
+      ],
+      "id": "011de751"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test_id = \"validmind.data_validation.PearsonCorrelationMatrix\"\n",
+        "vm.tests.describe_test(test_id)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "9886cd27"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Since this test requires a dataset, you can expect it to throw an error when we run it without passing in a `dataset` as input:"
+      ],
+      "id": "f1f7a84a"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "try:\n",
+        "    vm.tests.run_test(test_id)\n",
+        "except Exception as e:\n",
+        "    print(e)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "ee38704a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn more about the individual tests available in the ValidMind Library</b></span>\n",
+        "<br></br>\n",
+        "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a> notebook for more code examples and usage of key functions.</div>"
+      ],
+      "id": "60ede8e0"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Working with ValidMind datasets"
+      ],
+      "id": "6bcd01d2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Create a sample dataset\n",
+        "\n",
+        "Since we need a dataset to run tests, let's use the [sklearn `make_classification` function](https://scikit-learn.org/stable/modules/generated/sklearn.datasets.make_classification.html) to generate a random sample dataset for testing.\n",
+        "\n",
+        "In the code example below, note that:\n",
+        "\n",
+        "- The `make_classification` function generates a synthetic binary classification dataset with `10,000` samples and `10` features, where the `weights=[0.1]` parameter creates a class imbalance (roughly 10% of samples in class `0`, with the remainder in the positive class `1`).\n",
+        "- The `random_state=42` parameter ensures reproducibility so you get the same dataset each time you run the code.\n",
+        "- The generated feature matrix `X` and target array `y` are combined into a single [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) with columns named `feature_0` through `feature_9`, plus a `target` column that has a value of `1` for the positive class and `0` otherwise."
+      ],
+      "id": "35331764"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import pandas as pd\n",
+        "from sklearn.datasets import make_classification\n",
+        "\n",
+        "X, y = make_classification(\n",
+        "    n_samples=10000,\n",
+        "    n_features=10,\n",
+        "    weights=[0.1],\n",
+        "    random_state=42,\n",
+        ")\n",
+        "X.shape\n",
+        "y.shape\n",
+        "\n",
+        "df = pd.DataFrame(X, columns=[f\"feature_{i}\" for i in range(X.shape[1])])\n",
+        "df[\"target\"] = y\n",
+        "df.head()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "25774f44"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind dataset\n",
+        "\n",
+        "The next step is to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
+        "\n",
+        "ValidMind dataset objects provide a wrapper to any type of dataset (NumPy, Pandas, Polars, etc.) so that tests can run transparently regardless of the underlying library.\n",
+        "\n",
+        "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
+        "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
+      ],
+      "id": "3b3032fc"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Initialize the ValidMind dataset for the previously created sample `df`\n",
+        "vm_dataset = vm.init_dataset(\n",
+        "    df,\n",
+        "    input_id=\"my_demo_dataset\",\n",
+        "    target_column=\"target\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "70c52c03"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Running ValidMind tests\n",
+        "\n",
+        "Now that we know how to initialize a ValidMind `dataset` object, we're ready to run some tests!\n",
+        "\n",
+        "You run individual tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module. For the examples below, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`test_id`** — The ID of the test to run, as seen in the `ID` column when you run `list_tests`.\n",
+        "- **`inputs`** — A dictionary of test inputs, such as `dataset`, `model`, `datasets`, or `models`. These are ValidMind objects initialized with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) or [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model)."
+      ],
+      "id": "ec65df1b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Run test using ValidMind dataset\n",
+        "\n",
+        "Given that our `test_id` is currently set to `validmind.data_validation.PearsonCorrelationMatrix`, we'll get the results of the Pearson Correlation Matrix test as output when we call `run_test()`:"
+      ],
+      "id": "c46789a4"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = vm.tests.run_test(\n",
+        "    test_id,\n",
+        "    inputs={\"dataset\": vm_dataset},\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0c636915"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Run and log test requiring parameters\n",
+        "\n",
+        "Our `vm_dataset` can also be used for any other test that requires a dataset input, including tests that take additional parameters.\n",
+        "\n",
+        "Let's find a *class imbalance* test to understand the distribution of the target column in the dataset to demonstrate. Class imbalance is a common problem in machine learning, particularly in classification tasks, where the number of instances (or data points) in each class isn't evenly distributed across the available categories.\n",
+        "\n",
+        "`Tags` describe what a test applies to and help you filter tests for your use case. Use [list_tags()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tags) to view all unique tags used to describe tests in the ValidMind Library:"
+      ],
+      "id": "12694f87"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Sort the tags in ABC order\n",
+        "sorted(vm.tests.list_tags())"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "99eaf2da"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Use `list_tests()`, this time filtering tests by tags for `binary_classification` relating to `tabular_data`:"
+      ],
+      "id": "561b225a"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests(tags=[\"binary_classification\", \"tabular_data\"])"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "97a45b6b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's use `describe_test()` again to retrieve more information about the test, including confirmation that it accepts some additional parameters, such as `min_percent_threshold` which allows you to configure the threshold for an acceptable class imbalance:"
+      ],
+      "id": "4ba2ec07"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.describe_test(\"validmind.data_validation.ClassImbalance\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "ec456cd2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2_1__'></a>\n",
+        "\n",
+        "#### Log ClassImbalance test with default parameters\n",
+        "\n",
+        "Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform.\n",
+        "\n",
+        "Let's first run the class imbalance test without any parameters to see its output using a default value for the threshold and log the results to the ValidMind Platform for later comparison:"
+      ],
+      "id": "e419dd51"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.ClassImbalance\",\n",
+        "    inputs={\"dataset\": vm_dataset},\n",
+        ")\n",
+        "\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "1c137483"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2_2__'></a>\n",
+        "\n",
+        "#### Log ClassImbalance test with custom parameters\n",
+        "\n",
+        "From the output, we've confirmed that the class imbalance test passes the pass-fail criteria with the default threshold of 10%. Let's try to run the test with a threshold of 20% to see if it fails.\n",
+        "\n",
+        "When running individual tests, **you can use a custom `result_id` to tag the individual result with a unique identifier**, allowing you to submit individual results for the same test to the ValidMind Platform:\n",
+        "\n",
+        "- This `result_id` can be appended to `test_id` with a `:` separator.\n",
+        "- The `custom_threshold` identifier will correspond with the results of our adjusted `min_percent_threshold` parameter."
+      ],
+      "id": "6cc499de"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.ClassImbalance:custom_threshold\",\n",
+        "    inputs={\"dataset\": vm_dataset},\n",
+        "    params={\"min_percent_threshold\": 20},\n",
+        ")\n",
+        "\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "2c6f19ad"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "When the threshold is set to 20%, the results show that the class imbalance test fails."
+      ],
+      "id": "30e82fc3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Work with test results\n",
+        "\n",
+        "You can look at the output of tests produced by the ValidMind Library right in this notebook where you ran the tests, as you would expect. But there is a better way — use the ValidMind Platform to attach the logged test results to your documentation (**Learn more:** [Work with test results](https://docs.validmind.ai/guide/documentation/work-with-test-results.html)):\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "3. Locate the Data Preparation section and click on **2.1. Data Description** to expand that section.\n",
+        "\n",
+        "4. Hover under the logged test block for the default Class Imbalance test until a horizontal dashed line with a **+** button appears, indicating that you can insert a new block.\n",
+        "\n",
+        "5. Click **+** and then select **Test-Driven Block** under FROM LIBRARY:\n",
+        "\n",
+        "    - Click on **VM Library** under TEST-DRIVEN in the left sidebar.\n",
+        "    - Select `ClassImbalance:custom_threshold` as the test.\n",
+        "\n",
+        "6. Finally, click **Insert 1 Test Result to Document** to add the test result to the documentation.\n",
+        "\n",
+        "    Confirm that the individual results for the adjusted threshold class imbalance test have been correctly inserted into section **2.1. Data Description** of the documentation.\n",
+        "\n",
+        "You just worked with a draft of your model's documentation, in an easily consumable format matching the structure of the template you previewed in the beginning of this notebook. When you connect to a model with the ValidMind Library, logged test results automatically populate for easy insertion into your documentation.\n",
+        "\n",
+        "In the ValidMind Platform, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))"
+      ],
+      "id": "faa09935"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "Now that you know the basics of how to run out-of-the-box tests in the ValidMind Library, you’re ready to take the next step. Use `run_test()` with any combination of datasets or records (models) as inputs to run comparison tests, and log your consolidated test results to the ValidMind Platform.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn how to run comparison tests with the ValidMind Library.</b></span>\n",
+        "<br></br>\n",
+        "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/run_tests/2-run_comparison_tests.html\" style=\"color: #DE257E;\"><b>Run comparison tests</b></a> notebook for code examples and usage of key functions.</div>"
+      ],
+      "id": "cbe20d76"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ],
+      "id": "ec08c9bc"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ],
+      "id": "bff625a1"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "b5f64e27"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ],
+      "id": "da29fb9d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the package upgrade for changes to be applied."
+      ],
+      "id": "82837a85"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-38501808b29c456ab97562eebdd497d4"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.12.12"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}
\ No newline at end of file
diff --git a/site/notebooks/how_to/tests/run_tests/1_run_dataset_based_tests.ipynb b/site/notebooks/how_to/tests/run_tests/1_run_dataset_based_tests.ipynb
deleted file mode 100644
index c4937af216..0000000000
--- a/site/notebooks/how_to/tests/run_tests/1_run_dataset_based_tests.ipynb
+++ /dev/null
@@ -1,775 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "976bb3d9",
-   "metadata": {},
-   "source": [
-    "# Run dataset-based tests\n",
-    "\n",
-    "Learn how to use the ValidMind Library to run tests that take any dataset or model as input. Identify specific tests to run, initialize ValidMind dataset objects in preparation for passing them to your tests, and then run the chosen tests — generating outputs that can be automatically logged to your model's documentation in the ValidMind Platform."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8c4d9b9c",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_3__)    \n",
-    "- [Explore a ValidMind test](#toc3__)    \n",
-    "- [Working with ValidMind datasets](#toc4__)    \n",
-    "  - [Create a sample dataset](#toc4_1__)    \n",
-    "  - [Initialize the ValidMind dataset](#toc4_2__)    \n",
-    "- [Running ValidMind tests](#toc5__)    \n",
-    "  - [Run test using ValidMind dataset](#toc5_1__)    \n",
-    "  - [Run and log test requiring parameters](#toc5_2__)    \n",
-    "    - [Log ClassImbalance test with default parameters](#toc5_2_1__)    \n",
-    "    - [Log ClassImbalance test with custom paramaters](#toc5_2_2__)    \n",
-    "- [Work with test results](#toc6__)    \n",
-    "- [Next steps](#toc7__)    \n",
-    "  - [Discover more learning resources](#toc7_1__)    \n",
-    "- [Upgrade ValidMind](#toc8__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f49237b3",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models. \n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "907737bd",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "115cdfa7",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c3051ca8",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "656db165",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "30fa24d7",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "524602cc",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b38fc5f6",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "451c5a1b",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook.\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0e55ac40",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3545620d",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0ed9e84d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8fea9380",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e44a2345",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "43ee2f43",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Explore a ValidMind test\n",
-    "\n",
-    "Before we run a test, use [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to return information on out-of-the-box tests available in the ValidMind Library.\n",
-    "\n",
-    "Let's assume you want to generate the *pearson correlation matrix* for a dataset. A Pearson correlation matrix is a table that shows the [Pearson correlation coefficients](https://en.wikipedia.org/wiki/Pearson_correlation_coefficient) between several variables.\n",
-    "\n",
-    "We'll pass in a `filter` to the `list_tests` function to find the test ID for the pearson correlation matrix:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "a63e7a43",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(filter=\"PearsonCorrelationMatrix\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "011de751",
-   "metadata": {},
-   "source": [
-    "We've identified from the output that the test ID for the pearson correlation matrix test is `validmind.data_validation.PearsonCorrelationMatrix`.\n",
-    "\n",
-    "Use this ID combined with [the `describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) to retrieve more information about the test, including its **Required Inputs**:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "9886cd27",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test_id = \"validmind.data_validation.PearsonCorrelationMatrix\"\n",
-    "vm.tests.describe_test(test_id)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f1f7a84a",
-   "metadata": {},
-   "source": [
-    "Since this test requires a dataset, you can expect it to throw an error when we run it without passing in a `dataset` as input:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "ee38704a",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "try:\n",
-    "    vm.tests.run_test(test_id)\n",
-    "except Exception as e:\n",
-    "    print(e)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "60ede8e0",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn more about the individual tests available in the ValidMind Library</b></span>\n",
-    "<br></br>\n",
-    "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a> notebook for more code examples and usage of key functions.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "6bcd01d2",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Working with ValidMind datasets"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "35331764",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Create a sample dataset\n",
-    "\n",
-    "Since we need a dataset to run tests, let's use the [sklearn `make_classification` function](https://scikit-learn.org/stable/modules/generated/sklearn.datasets.make_classification.html) to generate a random sample dataset for testing.\n",
-    "\n",
-    "In the code example below, note that:\n",
-    "\n",
-    "- The `make_classification` function generates a synthetic binary classification dataset with `10,000` samples and `10` features, where the `weights=[0.1]` parameter creates a class imbalance (roughly 10% positive class).\n",
-    "- The `random_state=42` parameter ensures reproducibility so you get the same dataset each time you run the code.\n",
-    "- The generated feature matrix `X` and target array `y` are combined into a single [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) with columns named `feature_0` through `feature_9`, plus a `target` column that has a value of `1` for the positive class and `0` otherwise."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "25774f44",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "from sklearn.datasets import make_classification\n",
-    "\n",
-    "X, y = make_classification(\n",
-    "    n_samples=10000,\n",
-    "    n_features=10,\n",
-    "    weights=[0.1],\n",
-    "    random_state=42,\n",
-    ")\n",
-    "X.shape\n",
-    "y.shape\n",
-    "\n",
-    "df = pd.DataFrame(X, columns=[f\"feature_{i}\" for i in range(X.shape[1])])\n",
-    "df[\"target\"] = y\n",
-    "df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3b3032fc",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind dataset\n",
-    "\n",
-    "The next step is to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
-    "\n",
-    "ValidMind dataset objects provide a wrapper to any type of dataset (NumPy, Pandas, Polars, etc.) so that tests can run transparently regardless of the underlying library.\n",
-    "\n",
-    "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
-    "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "70c52c03",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the ValidMind dataset for the previously created sample `df`\n",
-    "vm_dataset = vm.init_dataset(\n",
-    "    df,\n",
-    "    input_id=\"my_demo_dataset\",\n",
-    "    target_column=\"target\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ec65df1b",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Running ValidMind tests\n",
-    "\n",
-    "Now that we know how to initialize a ValidMind `dataset` object, we're ready to run some tests!\n",
-    "\n",
-    "You run individual tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module. For the examples below, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`test_id`** — The ID of the test to run, as seen in the `ID` column when you run `list_tests`.\n",
-    "- **`inputs`** — A dictionary of test inputs, such as `dataset`, `model`, `datasets`, or `models`. These are ValidMind objects initialized with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) or [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c46789a4",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Run test using ValidMind dataset\n",
-    "\n",
-    "Given that our `test_id` is currently set to `validmind.data_validation.PearsonCorrelationMatrix`, we'll get the results of the Pearson Correlation Matrix test as output when we call `run_test()`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0c636915",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.tests.run_test(\n",
-    "    test_id,\n",
-    "    inputs={\"dataset\": vm_dataset},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "12694f87",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Run and log test requiring parameters\n",
-    "\n",
-    "Our `vm_dataset` can also be used for any other test that requires a dataset input,  including tests that take additional parameters.\n",
-    "\n",
-    "Let's find a *class imbalance* test to understand the distribution of the target column in the dataset to demonstrate. Class imbalance is a common problem in machine learning, particularly in classification tasks, where the number of instances (or data points) in each class isn't evenly distributed across the available categories.\n",
-    "\n",
-    "`Tags` describe what a test applies to and help you filter tests for your use case. Use [list_tags()](https://docs.validmind.ai/validmind/validmind/tests.html#list_tags) to view all unique tags used to describe tests in the ValidMind Library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "99eaf2da",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Sort the tags in ABC order\n",
-    "sorted(vm.tests.list_tags())"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "561b225a",
-   "metadata": {},
-   "source": [
-    "Use `list_tests()`, this time filtering tests by tags for `binary_classification` relating to `tabular_data`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "97a45b6b",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(tags=[\"binary_classification\", \"tabular_data\"])"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4ba2ec07",
-   "metadata": {},
-   "source": [
-    "Let's use `describe_test()` again to retrieve more information about the test, including confirmation that it accepts some additional parameters, such as `min_percent_threshold` which allows you configure the threshold for an acceptable class imbalance:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "ec456cd2",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.describe_test(\"validmind.data_validation.ClassImbalance\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e419dd51",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2_1__'></a>\n",
-    "\n",
-    "#### Log ClassImbalance test with default parameters\n",
-    "\n",
-    "Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform.\n",
-    "\n",
-    "Let's first run the class imbalance test without any parameters to see its output using a default value for the threshold and log the results to the ValidMind Platform for later comparison:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "1c137483",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.ClassImbalance\",\n",
-    "    inputs={\"dataset\": vm_dataset},\n",
-    ")\n",
-    "\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "6cc499de",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2_2__'></a>\n",
-    "\n",
-    "#### Log ClassImbalance test with custom paramaters\n",
-    "\n",
-    "From the output, we've confirmed that the class imbalance test passes the pass-fail criteria with the default threshold of 10%. Let's try to run the test with a threshold of 20% to see if it fails.\n",
-    "\n",
-    "When running individual tests, **you can use a custom `result_id` to tag the individual result with a unique identifier**, allowing you to submit individual results for the same test to the ValidMind Platform:\n",
-    "\n",
-    "- This `result_id` can be appended to `test_id` with a `:` separator.\n",
-    "- The `custom_threshold` identifier will correspond with the results of our adjusted `min_percent_threshold` parameter."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "2c6f19ad",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.ClassImbalance:custom_threshold\",\n",
-    "    inputs={\"dataset\": vm_dataset},\n",
-    "    params={\"min_percent_threshold\": 20},\n",
-    ")\n",
-    "\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "30e82fc3",
-   "metadata": {},
-   "source": [
-    "When the threshold is set to 20%, the results show that the class imbalance test fails."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "faa09935",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Work with test results\n",
-    "\n",
-    "You can look at the output of tests produced by the ValidMind Library right in this notebook where you ran the tests, as you would expect. But there is a better way — use the ValidMind Platform to attach the logged test results your model's documentation ([Need more help?](https://docs.validmind.ai/developer/model-documentation/work-with-test-results.html)):\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "3. Locate the Data Preparation section and click on **2.1. Data Description** to expand that section.\n",
-    "\n",
-    "4. Hover under the logged test block for the default Class Imbalance test until a horizontal dashed line with a **+** button appears, indicating that you can insert a new block.\n",
-    "\n",
-    "5. Click **+** and then select **Test-Driven Block** under FROM LIBRARY:\n",
-    "\n",
-    "    - Click on **VM Library** under TEST-DRIVEN in the left sidebar.\n",
-    "    - Select `ClassImbalance:custom_threshold` as the test.\n",
-    "\n",
-    "6. Finally, click **Insert 1 Test Result to Document** to add the test result to the documentation.\n",
-    "\n",
-    "    Confirm that the individual results for the adjusted threshold class imbalance test has been correctly inserted into section **2.1. Data Description** of the documentation.\n",
-    "\n",
-    "You just worked with a draft of your model's documentation, in an easily consumable format matching the structure of the template you previewed in the beginning of this notebook. When you connect to a model with the ValidMind Library, logged test results automatically populate for easy insertion into your documentation.\n",
-    "\n",
-    "In the ValidMind Platform, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "cbe20d76",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "Now that you know the basics of how to run out-of-the-box tests in the ValidMind Library, you’re ready to take the next step. Use `run_test()` with any combination of datasets or models as inputs to run comparison tests, and log your consolidated test results to the ValidMind Platform.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn how to run comparison tests with the ValidMind Library.</b></span>\n",
-    "<br></br>\n",
-    "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/run_tests/2_run_comparison_tests.html\" style=\"color: #DE257E;\"><b>Run comparison tests</b></a> notebook for code examples and usage of key functions.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ec08c9bc",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "bff625a1",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b5f64e27",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "da29fb9d",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "82837a85",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-38501808b29c456ab97562eebdd497d4",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/site/notebooks/how_to/tests/run_tests/2-run_comparison_tests.ipynb b/site/notebooks/how_to/tests/run_tests/2-run_comparison_tests.ipynb
new file mode 100644
index 0000000000..1766a413fe
--- /dev/null
+++ b/site/notebooks/how_to/tests/run_tests/2-run_comparison_tests.ipynb
@@ -0,0 +1,1119 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Run comparison tests\n",
+        "\n",
+        "Learn how to use the ValidMind Library to run comparison tests that take any datasets or records (models) as inputs. Identify comparison tests to run, initialize ValidMind dataset and model objects in preparation for passing them to tests, and then run tests — generating outputs automatically logged to your documentation in the ValidMind Platform.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>We recommend that you first complete our introductory notebook on running tests.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/notebooks/how_to/tests/run_tests/1-run_dataset-based_tests.html\" style=\"color: #DE257E;\"><b>Run dataset-based tests</b></a></div>"
+      ],
+      "id": "ed8282aa"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_4__)    \n",
+        "- [Explore a ValidMind test](#toc3__)    \n",
+        "- [Working with ValidMind datasets](#toc4__)    \n",
+        "  - [Prepare the sample dataset](#toc4_1__)    \n",
+        "    - [Import the sample dataset](#toc4_1_1__)    \n",
+        "    - [Split the dataset](#toc4_1_2__)    \n",
+        "  - [Initialize the ValidMind dataset](#toc4_2__)    \n",
+        "- [Working with ValidMind models](#toc5__)    \n",
+        "  - [Train a sample model](#toc5_1__)    \n",
+        "  - [Initialize the ValidMind model](#toc5_2__)    \n",
+        "  - [Assign predictions](#toc5_3__)    \n",
+        "- [Running ValidMind tests](#toc6__)    \n",
+        "  - [Run classifier performance test with one model](#toc6_1__)    \n",
+        "  - [Run comparison tests](#toc6_2__)    \n",
+        "    - [Run classifier performance test with multiple models](#toc6_2_1__)    \n",
+        "    - [Run classifier performance test with multiple parameter values](#toc6_2_2__)    \n",
+        "    - [Run comparison test with multiple datasets](#toc6_2_3__)    \n",
+        "- [Work with test results](#toc7__)    \n",
+        "- [Next steps](#toc8__)    \n",
+        "  - [Discover more learning resources](#toc8_1__)    \n",
+        "- [Upgrade ValidMind](#toc9__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "90ab1b8a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models. \n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators."
+      ],
+      "id": "60aa37b6"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ],
+      "id": "6dfa3d15"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ],
+      "id": "8e87dd4d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "64971d85"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "69a40ac3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ],
+      "id": "ec35c724"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "fc97888f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ],
+      "id": "b3c0c2f5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook.\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ],
+      "id": "d3e3302f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "679d46b2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "2b6e1fb1"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "c51ae01c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ],
+      "id": "52b68564"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "fd332a9d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ],
+      "id": "184b8c97"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import xgboost as xgb\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "8e2127cd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Explore a ValidMind test\n",
+        "\n",
+        "Before we run a test, use [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to return information on out-of-the-box tests available in the ValidMind Library.\n",
+        "\n",
+        "Let's assume you want to evaluate *classifier performance* for a model. Classifier performance measures how well a classification model correctly predicts outcomes, using metrics like [precision, recall, and F1 score](https://en.wikipedia.org/wiki/Precision_and_recall).\n",
+        "\n",
+        "We'll pass in a `filter` to the `list_tests` function to find the test ID for classifier performance:"
+      ],
+      "id": "c3098355"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests(filter=\"ClassifierPerformance\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "a6a6f715"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We've identified from the output that the test ID for the classifier performance test is `validmind.model_validation.sklearn.ClassifierPerformance`.\n",
+        "\n",
+        "Use this ID combined with [the `describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) to retrieve more information about the test, including its **Required Inputs**:"
+      ],
+      "id": "d1f08b64"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test_id = \"validmind.model_validation.sklearn.ClassifierPerformance\"\n",
+        "vm.tests.describe_test(test_id)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "f8a46c7d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Since this test requires both a dataset object and a model object, you can expect it to throw an error when we run it without passing in either as input:"
+      ],
+      "id": "10a49439"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "try:\n",
+        "    vm.tests.run_test(test_id)\n",
+        "except Exception as e:\n",
+        "    print(e)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "f853c272"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn more about the individual tests available in the ValidMind Library</b></span>\n",
+        "<br></br>\n",
+        "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a> notebook for more code examples and usage of key functions.</div>"
+      ],
+      "id": "da36ba6b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Working with ValidMind datasets"
+      ],
+      "id": "40324c13"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Prepare the sample dataset"
+      ],
+      "id": "3f28ffe2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1_1__'></a>\n",
+        "\n",
+        "#### Import the sample dataset\n",
+        "\n",
+        "Since we need a dataset to run tests, let's import the public [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset from Kaggle so that we have something to work with.\n",
+        "\n",
+        "In our below example, note that:\n",
+        "\n",
+        "- The target column, `Exited`, has a value of `1` when a customer has churned and `0` otherwise.\n",
+        "- The ValidMind Library provides a wrapper to automatically load the dataset as a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) object. A Pandas DataFrame is a two-dimensional tabular data structure that makes use of rows and columns."
+      ],
+      "id": "4c45a55c"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Import the sample dataset from the library\n",
+        "\n",
+        "from validmind.datasets.classification import customer_churn\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{customer_churn.target_column}' \\n\\t• Class labels: {customer_churn.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = customer_churn.load_data()\n",
+        "raw_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "3ef2dfbb"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1_2__'></a>\n",
+        "\n",
+        "#### Split the dataset\n",
+        "\n",
+        "Let's first split our dataset to help assess how well the model generalizes to unseen data.\n",
+        "\n",
+        "Use [`preprocess()`](https://docs.validmind.ai/validmind/validmind/datasets/classification/customer_churn.html#preprocess) to split our dataset into three subsets:\n",
+        "\n",
+        "1. **train_df** — Used to train the model.\n",
+        "2. **validation_df** — Used to evaluate the model's performance during training.\n",
+        "3. **test_df** — Used later on to assess the model's performance on new, unseen data."
+      ],
+      "id": "2fc43d28"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "88c87d4a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind dataset\n",
+        "\n",
+        "The next step is to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
+        "\n",
+        "ValidMind dataset objects provide a wrapper to any type of dataset (NumPy, Pandas, Polars, etc.) so that tests can run transparently regardless of the underlying library.\n",
+        "\n",
+        "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
+        "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
+      ],
+      "id": "a5d77885"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    input_id=\"test_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "bf0ec747"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Working with ValidMind models"
+      ],
+      "id": "cbb1a68f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Train a sample model\n",
+        "\n",
+        "To train the model, we need to provide it with:\n",
+        "\n",
+        "1. **Inputs** — Features such as customer age, usage, etc.\n",
+        "2. **Outputs (Expected answers/labels)** — in our case, we would like to know whether the customer churned or not.\n",
+        "\n",
+        "Here, we'll use `x_train` and `x_val` to hold the input data (features), and `y_train` and `y_val` to hold the answers (the target we want to predict):"
+      ],
+      "id": "68089f0a"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_train = train_df[customer_churn.target_column]\n",
+        "x_val = validation_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_val = validation_df[customer_churn.target_column]"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "39e8c7ea"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Next, let's create an *XGBoost classifier model* that will automatically stop training if it doesn't improve after 10 tries. XGBoost is a gradient-boosted tree ensemble that builds trees sequentially, with each tree correcting the errors of the previous ones — typically known for strong predictive performance and built-in regularization to reduce overfitting.\n",
+        "\n",
+        "Setting an explicit threshold avoids wasting time and helps prevent further overfitting by stopping training when further improvement isn't happening. We'll also set three evaluation metrics to get a more complete picture of model performance:\n",
+        "\n",
+        "1. **error** — Measures how often the model makes incorrect predictions.\n",
+        "2. **logloss** — Indicates how confident the predictions are.\n",
+        "3. **auc** — Evaluates how well the model distinguishes between churn and not churn."
+      ],
+      "id": "6d93642b"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
+        "model.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "255e3583"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Finally, our actual training step — where the model learns patterns from the data, so it can make predictions later:\n",
+        "\n",
+        "- The model is trained on `x_train` and `y_train`, and evaluates its performance using `x_val` and `y_val` to check if it’s learning well.\n",
+        "- To turn off printed output while training, we'll set `verbose` to `False`."
+      ],
+      "id": "a021582a"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "model.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        "    eval_set=[(x_val, y_val)],\n",
+        "    verbose=False,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e3aa3657"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind model\n",
+        "\n",
+        "You'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for our model.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ],
+      "id": "ed11ea0b"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_model_xgb = vm.init_model(\n",
+        "    model,\n",
+        "    input_id=\"xgboost\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "4b2be11f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_3__'></a>\n",
+        "\n",
+        "### Assign predictions\n",
+        "\n",
+        "Once the model has been registered, you can assign model predictions to the training and testing datasets.\n",
+        "\n",
+        "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
+        "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
+        "\n",
+        "If no prediction values are passed, the method will compute predictions automatically:"
+      ],
+      "id": "53f12da6"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(model=vm_model_xgb)\n",
+        "vm_test_ds.assign_predictions(model=vm_model_xgb)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "229185fd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Running ValidMind tests\n",
+        "\n",
+        "Now that we know how to initialize ValidMind `dataset` and `model` objects, we're ready to run some tests!\n",
+        "\n",
+        "You run individual tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module. For the examples below, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`test_id`** — The ID of the test to run, as seen in the `ID` column when you run `list_tests`.\n",
+        "- **`inputs`** — A dictionary of test inputs, such as `dataset`, `model`, `datasets`, or `models`. These are ValidMind objects initialized with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) or [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model)."
+      ],
+      "id": "18c1cb2e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Run classifier performance test with one model\n",
+        "\n",
+        "Run the `validmind.model_validation.sklearn.ClassifierPerformance` test with the testing dataset (`vm_test_ds`) and model (`vm_model_xgb`) as inputs:"
+      ],
+      "id": "6f7e7779"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "        \"model\": vm_model_xgb,\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "85189af9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Run comparison tests\n",
+        "\n",
+        "To evaluate which models might be a better fit for a use case based on their performance on selected criteria, we can run the same test with multiple models. We'll train three additional models and run the classifier performance test for all four models using a single `run_test()` call.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>ValidMind helps streamline your documentation and testing.</b></span>\n",
+        "<br></br>\n",
+        "You could call <code>run_test()</code> multiple times passing in different inputs, but you can also pass an <code>input_grid</code> object — a dictionary of test input keys and values that allow you to run a single test for a combination of models and datasets.\n",
+        "<br></br>\n",
+        "With <code>input_grid</code>, run comparison tests for multiple datasets, or even multiple datasets and models simultaneously — <code>input_grid</code> can be used with <code>run_test()</code> for all possible combinations of inputs, generating a cohesive and comprehensive single output.\n",
+        "</div>"
+      ],
+      "id": "5e8be8d5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "*Random forest classifier* models use an ensemble method that builds multiple decision trees and averages their predictions. Random forest is robust to overfitting and handles non-linear relations well, but is typically less interpretable than simpler models:"
+      ],
+      "id": "e33c7a82"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from sklearn.ensemble import RandomForestClassifier\n",
+        "\n",
+        "# Train the random forest classifier model\n",
+        "model_rf = RandomForestClassifier()\n",
+        "model_rf.fit(x_train, y_train)\n",
+        "\n",
+        "# Initialize the ValidMind model object for the random forest classifier model\n",
+        "vm_model_rf = vm.init_model(\n",
+        "    model_rf,\n",
+        "    input_id=\"random_forest\",\n",
+        ")\n",
+        "\n",
+        "# Assign predictions to the test dataset for the random forest classifier model\n",
+        "vm_test_ds.assign_predictions(model=vm_model_rf)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "1976b7e8"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "*Logistic regression* models are linear models that estimate class probabilities via a logistic (sigmoid) function. Logistic regression is highly interpretable with fast training, establishing a strong baseline — however, these models struggle when relationships are non-linear, as real-world relationships often are:"
+      ],
+      "id": "f8e167cf"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from sklearn.linear_model import LogisticRegression\n",
+        "from sklearn.preprocessing import StandardScaler\n",
+        "from sklearn.pipeline import Pipeline\n",
+        "\n",
+        "# Scaling features ensures the lbfgs solver converges reliably\n",
+        "model_lr = Pipeline([\n",
+        "    (\"scaler\", StandardScaler()),\n",
+        "    (\"lr\", LogisticRegression()),\n",
+        "])\n",
+        "model_lr.fit(x_train, y_train)\n",
+        "\n",
+        "# Initialize the ValidMind model object for the logistic regression model\n",
+        "vm_model_lr = vm.init_model(\n",
+        "    model_lr,\n",
+        "    input_id=\"logistic_regression\",\n",
+        ")\n",
+        "\n",
+        "# Assign predictions to the test dataset for the logistic regression model\n",
+        "vm_test_ds.assign_predictions(model=vm_model_lr)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "90bbf148"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "*Decision tree classifier* models are a single tree with data split on feature thresholds. Useful as an explainability benchmark, decision trees are easy to visualize and interpret — but are prone to overfitting without pruning or ensemble techniques:"
+      ],
+      "id": "d3478f86"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from sklearn.tree import DecisionTreeClassifier\n",
+        "\n",
+        "# Train the decision tree classifier model\n",
+        "model_dt = DecisionTreeClassifier()\n",
+        "model_dt.fit(x_train, y_train)\n",
+        "\n",
+        "# Initialize the ValidMind model object for the decision tree classifier model\n",
+        "vm_model_dt = vm.init_model(\n",
+        "    model_dt,\n",
+        "    input_id=\"decision_tree\",\n",
+        ")\n",
+        "\n",
+        "# Assign predictions to the test dataset for the decision tree classifier model\n",
+        "vm_test_ds.assign_predictions(model=vm_model_dt)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "bfa1e17d"
+    },
+    {
+      "cell_type": "markdown",
+      "id": "59428da9",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2_1__'></a>\n",
+        "\n",
+        "#### Run classifier performance test with multiple models\n",
+        "\n",
+        "Now, we'll use the `input_grid` to run the `model_validation.sklearn.ClassifierPerformance` test on all four models using the testing dataset (`vm_test_ds`).\n",
+        "\n",
+        "When running individual tests, you can use a custom `result_id` to tag the individual result with a unique identifier by appending this `result_id` to the `test_id` with a `:` separator. We'll append an identifier to signify that this test was run on `all_models` to differentiate this test run from other runs:\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "perf_comparison_result = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:all_models\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\": [vm_model_xgb, vm_model_rf, vm_model_lr, vm_model_dt],\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "2e48ce1e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Our output indicates that the XGBoost and random forest classification models provide the strongest overall classification performance, so we'll continue our testing with those two models as input only."
+      ],
+      "id": "1b76eae0"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2_2__'></a>\n",
+        "\n",
+        "#### Run classifier performance test with multiple parameter values\n",
+        "\n",
+        "Next, let's run the classifier performance test with the `param_grid` object, which runs the same test multiple times with different parameter values. We'll append an identifier to signify that this test was run with our `parameter_grid` configuration:"
+      ],
+      "id": "9fcc67b9"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "parameter_comparison_result = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:parameter_grid\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\": [vm_model_xgb,vm_model_rf]\n",
+        "    },\n",
+        "    param_grid={\n",
+        "        \"average\": [\"macro\", \"micro\"]\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "d0ad94c9"
+    },
+    {
+      "cell_type": "markdown",
+      "id": "19e8251b",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2_3__'></a>\n",
+        "\n",
+        "#### Run comparison test with multiple datasets\n",
+        "\n",
+        "Let's also run the `model_validation.sklearn.ROCCurve` test using `input_grid` to iterate through multiple datasets, which plots the ROC curves for the training (`vm_train_ds`) and test (`vm_test_ds`) datasets side by side — a common scenario when you want to compare the performance of a model on the training and test datasets and visually assess how much performance is lost in the test dataset.\n",
+        "\n",
+        "We'll also need to assign predictions to the training dataset for the random forest classifier model, since we didn't do that in our earlier setup:\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(model=vm_model_rf)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "96c3b426"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We'll append an identifier to signify that this test was run with our `train_vs_test` dataset comparison configuration:"
+      ],
+      "id": "7e07db9d"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "roc_curve_result = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve:train_vs_test\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_model_xgb,vm_model_rf],\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "4056aa1e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Work with test results\n",
+        "\n",
+        "Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform. When logging individual test results to the platform, you'll need to manually add those results to the desired section of the documentation.\n",
+        "\n",
+        "You can do this through the ValidMind Platform interface after logging your test results (**Learn more:** [Work with test results](https://docs.validmind.ai/guide/documentation/work-with-test-results.html)), or directly via the ValidMind Library when calling `.log()` by providing an optional `section_id`. The `section_id` should be a string that matches the title of a section in the documentation template in `snake_case`.\n",
+        "\n",
+        "Let's log the results of the classifier performance test (`perf_comparison_result`) and the ROCCurve (`roc_curve_result`) test in the `model_evaluation` section of the documentation — present in the template we previewed in the beginning of this notebook:"
+      ],
+      "id": "a899fb84"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "perf_comparison_result.log(section_id=\"model_evaluation\")\n",
+        "roc_curve_result.log(section_id=\"model_evaluation\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e119bf1e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Finally, let's head to the model we connected to at the beginning of this notebook and view our inserted test results in the updated documentation (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html)):\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "3. Expand the **3.2. Model Evaluation** section.\n",
+        "\n",
+        "4. Confirm that `perf_comparison_result` and `roc_curve_result` display in this section as expected."
+      ],
+      "id": "098dba6c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "Now that you know how to run comparison tests with the ValidMind Library, you’re ready to take the next step. Extend the functionality of `run_test()` with your own custom test functions that can be incorporated into documentation templates just like any default out-of-the-box ValidMind test.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn how to implement custom tests with the ValidMind Library.</b></span>\n",
+        "<br></br>\n",
+        "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/implement_custom_tests.html\" style=\"color: #DE257E;\"><b>Implement custom tests</b></a> notebook for code examples and usage of key functions.</div>"
+      ],
+      "id": "a658f908"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8_1__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ],
+      "id": "407b6c2b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ],
+      "id": "82b51b49"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "vscode": {
+          "languageId": "plaintext"
+        }
+      },
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0d35972c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ],
+      "id": "86478a30"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade package for changes to be applied."
+      ],
+      "id": "10073159"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-5fe1b67f8fdc4d26bb090f5e655857bf"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "Python 3",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}
diff --git a/site/notebooks/how_to/tests/run_tests/2_run_comparison_tests.ipynb b/site/notebooks/how_to/tests/run_tests/2_run_comparison_tests.ipynb
deleted file mode 100644
index ffcd999fc2..0000000000
--- a/site/notebooks/how_to/tests/run_tests/2_run_comparison_tests.ipynb
+++ /dev/null
@@ -1,1095 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "1d29276f",
-   "metadata": {},
-   "source": [
-    "# Run comparison tests\n",
-    "\n",
-    "Learn how to use the ValidMind Library to run comparison tests that take any datasets or models as inputs. Identify comparison tests to run, initialize ValidMind dataset and model objects in preparation for passing them to tests, and then run tests — generating outputs automatically logged to your model's documentation in the ValidMind Platform.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>We recommend that you first complete our introductory notebook on running tests.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/notebooks/how_to/tests/run_tests/1_run_dataset_based_tests.html\" style=\"color: #DE257E;\"><b>Run dataset-based tests</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "61065444",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_4__)    \n",
-    "- [Explore a ValidMind test](#toc3__)    \n",
-    "- [Working with ValidMind datasets](#toc4__)    \n",
-    "  - [Import the sample dataset](#toc4_1__)    \n",
-    "  - [Split the dataset](#toc4_2__)    \n",
-    "  - [Initialize the ValidMind dataset](#toc4_3__)    \n",
-    "- [Working with ValidMind models](#toc5__)    \n",
-    "  - [Train a sample model](#toc5_1__)    \n",
-    "  - [Initialize the ValidMind model](#toc5_2__)    \n",
-    "  - [Assign predictions](#toc5_3__)    \n",
-    "- [Running ValidMind tests](#toc6__)    \n",
-    "  - [Run classifier performance test with one model](#toc6_1__)    \n",
-    "  - [Run comparison tests](#toc6_2__)    \n",
-    "    - [Run classifier performance test with multiple models](#toc6_2_1__)    \n",
-    "    - [Run classifier performance test with multiple parameter values](#toc6_2_2__)    \n",
-    "    - [Run comparison test with multiple datasets](#toc6_2_3__)    \n",
-    "- [Work with test results](#toc7__)    \n",
-    "- [Next steps](#toc8__)    \n",
-    "  - [Discover more learning resources](#toc8_1__)    \n",
-    "- [Upgrade ValidMind](#toc9__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "67a4d9dc",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models. \n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "eeb30df8",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "293c3f98",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4fc836d0",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8d52b6e0",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e0d2daaf",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "fc97888f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1ff56571",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c4d9f164",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook.\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "852392e5",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "6490e991",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "c51ae01c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "99e9d14f",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "fd332a9d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f805ec38",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "8e2127cd",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost as xgb\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1783e13c",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Explore a ValidMind test\n",
-    "\n",
-    "Before we run a test, use [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to return information on out-of-the-box tests available in the ValidMind Library.\n",
-    "\n",
-    "Let's assume you want to evaluate *classifier performance* for a model. Classifier performance measures how well a classification model correctly predicts outcomes, using metrics like [precision, recall, and F1 score](https://en.wikipedia.org/wiki/Precision_and_recall).\n",
-    "\n",
-    "We'll pass in a `filter` to the `list_tests` function to find the test ID for classifier performance:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "a6a6f715",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(filter=\"ClassifierPerformance\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "96a56e4b",
-   "metadata": {},
-   "source": [
-    "We've identified from the output that the test ID for the classifier performance test is `validmind.model_validation.sklearn.ClassifierPerformance`.\n",
-    "\n",
-    "Use this ID combined with [the `describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) to retrieve more information about the test, including its **Required Inputs**:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "f8a46c7d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test_id = \"validmind.model_validation.sklearn.ClassifierPerformance\"\n",
-    "vm.tests.describe_test(test_id)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "97053f50",
-   "metadata": {},
-   "source": [
-    "Since this test requires a dataset and a model, you can expect it to throw an error when we run it without passing in either as input:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "f853c272",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "try:\n",
-    "    vm.tests.run_test(test_id)\n",
-    "except Exception as e:\n",
-    "    print(e)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1a3115ed",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn more about the individual tests available in the ValidMind Library</b></span>\n",
-    "<br></br>\n",
-    "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a> notebook for more code examples and usage of key functions.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "89da851b",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Working with ValidMind datasets"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "50bfdb1b",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Import the sample dataset\n",
-    "\n",
-    "Since we need a dataset to run tests, let's import the public [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset from Kaggle so that we have something to work with.\n",
-    "\n",
-    "In our below example, note that:\n",
-    "\n",
-    "- The target column, `Exited` has a value of `1` when a customer has churned and `0` otherwise.\n",
-    "- The ValidMind Library provides a wrapper to automatically load the dataset as a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) object. A Pandas DataFrame is a two-dimensional tabular data structure that makes use of rows and columns."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "3ef2dfbb",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the sample dataset from the library\n",
-    "\n",
-    "from validmind.datasets.classification import customer_churn\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{customer_churn.target_column}' \\n\\t• Class labels: {customer_churn.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = customer_churn.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a5a8212f",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Split the dataset\n",
-    "\n",
-    "Let's first split our dataset to help assess how well the model generalizes to unseen data.\n",
-    "\n",
-    "Use [`preprocess()`](https://docs.validmind.ai/validmind/validmind/datasets/classification/customer_churn.html#preprocess) to split our dataset into three subsets:\n",
-    "\n",
-    "1. **train_df** — Used to train the model.\n",
-    "2. **validation_df** — Used to evaluate the model's performance during training.\n",
-    "3. **test_df** — Used later on to assess the model's performance on new, unseen data."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "88c87d4a",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2ae225d7",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind dataset\n",
-    "\n",
-    "The next step is to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
-    "\n",
-    "ValidMind dataset objects provide a wrapper to any type of dataset (NumPy, Pandas, Polars, etc.) so that tests can run transparently regardless of the underlying library.\n",
-    "\n",
-    "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
-    "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "bf0ec747",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    input_id=\"test_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "6d26f65b",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Working with ValidMind models"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "6d1677f6",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Train a sample model\n",
-    "\n",
-    "To train the model, we need to provide it with:\n",
-    "\n",
-    "1. **Inputs** — Features such as customer age, usage, etc.\n",
-    "2. **Outputs (Expected answers/labels)** — in our case, we would like to know whether the customer churned or not.\n",
-    "\n",
-    "Here, we'll use `x_train` and `x_val` to hold the input data (features), and `y_train` and `y_val` to hold the answers (the target we want to predict):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "39e8c7ea",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_train = train_df[customer_churn.target_column]\n",
-    "x_val = validation_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_val = validation_df[customer_churn.target_column]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4ac628eb",
-   "metadata": {},
-   "source": [
-    "Next, let's create an *XGBoost classifier model* that will automatically stop training if it doesn't improve after 10 tries. XGBoost is a gradient-boosted tree ensemble that builds trees sequentially, with each tree correcting the errors of the previous ones — typically known for strong predictive performance and built-in regularization to reduce overfitting.\n",
-    "\n",
-    "Setting an explicit threshold avoids wasting time and helps prevent further overfitting by stopping training when further improvement isn't happening. We'll also set three evaluation metrics to get a more complete picture of model performance:\n",
-    "\n",
-    "1. **error** — Measures how often the model makes incorrect predictions.\n",
-    "2. **logloss** — Indicates how confident the predictions are.\n",
-    "3. **auc** — Evaluates how well the model distinguishes between churn and not churn."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "255e3583",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
-    "model.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f6430312",
-   "metadata": {},
-   "source": [
-    "Finally, our actual training step — where the model learns patterns from the data, so it can make predictions later:\n",
-    "\n",
-    "- The model is trained on `x_train` and `y_train`, and evaluates its performance using `x_val` and `y_val` to check if it’s learning well.\n",
-    "- To turn off printed output while training, we'll set `verbose` to `False`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e3aa3657",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "model.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    "    eval_set=[(x_val, y_val)],\n",
-    "    verbose=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c303a046",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind model\n",
-    "\n",
-    "You'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for our model.\n",
-    "\n",
-    "You simply initialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "4b2be11f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_model_xgb = vm.init_model(\n",
-    "    model,\n",
-    "    input_id=\"xgboost\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2fa83857",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_3__'></a>\n",
-    "\n",
-    "### Assign predictions\n",
-    "\n",
-    "Once the model has been registered, you can assign model predictions to the training and testing datasets.\n",
-    "\n",
-    "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
-    "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
-    "\n",
-    "If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "229185fd",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(model=vm_model_xgb)\n",
-    "vm_test_ds.assign_predictions(model=vm_model_xgb)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d0b3312e",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Running ValidMind tests\n",
-    "\n",
-    "Now that we know how to initialize ValidMind `dataset` and `model` objects, we're ready to run some tests!\n",
-    "\n",
-    "You run individual tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module. For the examples below, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`test_id`** — The ID of the test to run, as seen in the `ID` column when you run `list_tests`.\n",
-    "- **`inputs`** — A dictionary of test inputs, such as `dataset`, `model`, `datasets`, or `models`. These are ValidMind objects initialized with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) or [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "96c89f32",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Run classifier performance test with one model\n",
-    "\n",
-    "Run the `validmind.model_validation.sklearn.ClassifierPerformance` test with the testing dataset (`vm_test_ds`) and model (`vm_model_xgb`) as inputs:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "85189af9",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "        \"model\": vm_model_xgb,\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "676dff89",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Run comparison tests\n",
-    "\n",
-    "To evaluate which models might be a better fit for a use case based on their performance on selected criteria, we can run the same test with multiple models. We'll train three additional models and run the classifier performance test for all four models using a single `run_test()` call.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>ValidMind helps streamline your documentation and testing.</b></span>\n",
-    "<br></br>\n",
-    "You could call <code>run_test()</code> multiple times passing in different inputs, but you can also pass an <code>input_grid</code> object — a dictionary of test input keys and values that allow you to run a single test for a combination of models and datasets.\n",
-    "<br></br>\n",
-    "With <code>input_grid</code>, run comparison tests for multiple datasets, or even multiple datasets and models simultaneously — <code>input_grid</code> can be used with <code>run_test()</code> for all possible combinations of inputs, generating a cohesive and comprehensive single output.\n",
-    "</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3d9912dc",
-   "metadata": {},
-   "source": [
-    "*Random forest classifier* models use an ensemble method that builds multiple decision trees and averages their predictions. Random forest is robust to overfitting and handles non-linear relations well, but is typically less interpretable than simpler models:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "1976b7e8",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.ensemble import RandomForestClassifier\n",
-    "\n",
-    "# Train the random forest classifier model\n",
-    "model_rf = RandomForestClassifier()\n",
-    "model_rf.fit(x_train, y_train)\n",
-    "\n",
-    "# Initialize the ValidMind model object for the random forest classifier model\n",
-    "vm_model_rf = vm.init_model(\n",
-    "    model_rf,\n",
-    "    input_id=\"random_forest\",\n",
-    ")\n",
-    "\n",
-    "# Assign predictions to the test dataset for the random forest classifier model\n",
-    "vm_test_ds.assign_predictions(model=vm_model_rf)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a259927c",
-   "metadata": {},
-   "source": [
-    "*Logistic regression* models are linear models that estimate class probabilities via a logistic (sigmoid) function. Logistic regression is highly interpretable with fast training, establishing a strong baseline — however, they struggle when relationships are non-linear as real-world relationships often are:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "90bbf148",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.linear_model import LogisticRegression\n",
-    "from sklearn.preprocessing import StandardScaler\n",
-    "from sklearn.pipeline import Pipeline\n",
-    "\n",
-    "# Scaling features ensures the lbfgs solver converges reliably\n",
-    "model_lr = Pipeline([\n",
-    "    (\"scaler\", StandardScaler()),\n",
-    "    (\"lr\", LogisticRegression()),\n",
-    "])\n",
-    "model_lr.fit(x_train, y_train)\n",
-    "\n",
-    "# Initialize the ValidMind model object for the logistic regression model\n",
-    "vm_model_lr = vm.init_model(\n",
-    "    model_lr,\n",
-    "    input_id=\"logistic_regression\",\n",
-    ")\n",
-    "\n",
-    "# Assign predictions to the test dataset for the logistic regression model\n",
-    "vm_test_ds.assign_predictions(model=vm_model_lr)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "9a666b41",
-   "metadata": {},
-   "source": [
-    "*Decision tree classifier* models are a single tree with data split on feature thresholds. Useful as an explanability benchmark, decision trees are easy to visualize and interpret — but are prone to overfitting without pruning or ensemble techniques:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "bfa1e17d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.tree import DecisionTreeClassifier\n",
-    "\n",
-    "# Train the decision tree classifer model\n",
-    "model_dt = DecisionTreeClassifier()\n",
-    "model_dt.fit(x_train, y_train)\n",
-    "\n",
-    "# Initialize the ValidMind model object for the decision tree classifier model\n",
-    "vm_model_dt = vm.init_model(\n",
-    "    model_dt,\n",
-    "    input_id=\"decision_tree\",\n",
-    ")\n",
-    "\n",
-    "# Assign predictions to the test dataset for the decision tree classifiermodel\n",
-    "vm_test_ds.assign_predictions(model=vm_model_dt)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2c8f3268",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_1__'></a>\n",
-    "\n",
-    "#### Run classifier performance test with multiple models\n",
-    "\n",
-    "Now, we'll use the `input_grid` to run the [`ClassifierPerformance` test](https://docs.validmind.ai/tests/model_validation/sklearn/ClassifierPerformance.html) on all four models using the testing dataset (`vm_test_ds`).\n",
-    "\n",
-    "When running individual tests, you can use a custom `result_id` to tag the individual result with a unique identifier by appending this `result_id` to the `test_id` with a `:` separator. We'll append an identifier to signify that this test was run on `all_models` to differentiate this test run from other runs:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "2e48ce1e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "perf_comparison_result = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:all_models\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\": [vm_model_xgb, vm_model_rf, vm_model_lr, vm_model_dt],\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "81cbf144",
-   "metadata": {},
-   "source": [
-    "Our output indicates that the XGBoost and random forest classification models provide the strongest overall classification performance, so we'll continue our testing with those two models as input only."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3d3fb6ec",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_2__'></a>\n",
-    "\n",
-    "#### Run classifier performance test with multiple parameter values\n",
-    "\n",
-    "Next, let's run the classifier performance test with the `param_grid` object, which runs the same test multiple times with different parameter values. We'll append an identifier to signify that this test was run with our `parameter_grid` configuration:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d0ad94c9",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "parameter_comparison_result = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:parameter_grid\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\": [vm_model_xgb,vm_model_rf]\n",
-    "    },\n",
-    "    param_grid={\n",
-    "        \"average\": [\"macro\", \"micro\"]\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "508c7546",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_3__'></a>\n",
-    "\n",
-    "#### Run comparison test with multiple datasets\n",
-    "\n",
-    "Let's also run the [ROCCurve test](https://docs.validmind.ai/tests/model_validation/sklearn/ROCCurve.html) using `input_grid` to iterate through multiple datasets, which plots the ROC curves for the training (`vm_train_ds`) and test  (`vm_test_ds`) datasets side by side — a common scenario when you want to compare the performance of a model on the training and test datasets and visually assess how much performance is lost in the test dataset.\n",
-    "\n",
-    "We'll also need to assign predictions to the training dataset for the random forest classifier model, since we didn't do that in our earlier setup:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "96c3b426",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(model=vm_model_rf)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2be82bae",
-   "metadata": {},
-   "source": [
-    "We'll append an identifier to signify that this test was run with our `train_vs_test` dataset comparison configuration:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "4056aa1e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "roc_curve_result = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve:train_vs_test\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_model_xgb,vm_model_rf],\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a05570d5",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Work with test results\n",
-    "\n",
-    "Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform. When logging individual test results to the platform, you'll need to manually add those results to the desired section of the model documentation.\n",
-    "\n",
-    "You can do this through the ValidMind Platform interface after logging your test results ([Learn more ...](https://docs.validmind.ai/developer/model-documentation/work-with-test-results.html)), or directly via the ValidMind Library when calling `.log()` by providing an optional `section_id`. The `section_id` should be a string that matches the title of a section in the documentation template in `snake_case`.\n",
-    "\n",
-    "Let's log the results of the classifier performance test (`perf_comparison_result`) and the ROCCurve (`roc_curve_result`) test in the `model_evaluation` section of the documentation — present in the template we previewed in the beginning of this notebook:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e119bf1e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "perf_comparison_result.log(section_id=\"model_evaluation\")\n",
-    "roc_curve_result.log(section_id=\"model_evaluation\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ab5205ee",
-   "metadata": {},
-   "source": [
-    "Finally, let's head to the model we connected to at the beginning of this notebook and view our inserted test results in the updated documentation ([Need more help?](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html)):\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "3. Expand the **3.2. Model Evaluation** section.\n",
-    "\n",
-    "4. Confirm that `perf_comparison_result` and `roc_curve_result` display in this section as expected."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "eb196aac",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "Now that you know how to run comparison tests with the ValidMind Library, you’re ready to take the next step. Extend the functionality of `run_test()` with your own custom test functions that can be incorporated into documentation templates just like any default out-of-the-box ValidMind test.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn how to implement custom tests with the ValidMind Library.</b></span>\n",
-    "<br></br>\n",
-    "Check out our <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/implement_custom_tests.html\" style=\"color: #DE257E;\"><b>Implement comparison tests</b></a> notebook for code examples and usage of key functions.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "083c1d8d",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_1__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "efba0f57",
-   "metadata": {},
-   "source": [
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0d35972c",
-   "metadata": {
-    "vscode": {
-     "languageId": "plaintext"
-    }
-   },
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "abcd07ef",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5fe70b90",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-54faffd51a5a4717a02b6be426d6b441",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "Python 3",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/site/notebooks/how_to/tests/run_tests/configure_tests/configure_judge_llms.ipynb b/site/notebooks/how_to/tests/run_tests/configure_tests/configure_judge_llms.ipynb
new file mode 100644
index 0000000000..3e8d27bcd1
--- /dev/null
+++ b/site/notebooks/how_to/tests/run_tests/configure_tests/configure_judge_llms.ipynb
@@ -0,0 +1,827 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "id": "0935afb5",
+      "metadata": {},
+      "source": [
+        "# Configure judge LLM and judge embeddings\n",
+        "\n",
+        "This notebook shows how to configure and validate the default judge LLM and judge embeddings used by the ValidMind Library for LLM-focused tests.\n",
+        "\n",
+        "It exercises three important paths:\n",
+        "1. Prompt-validation tests, which depend on the default judge LLM.\n",
+        "2. RAGAS-based tests, which depend on both the default judge LLM and the default judge embeddings model.\n",
+        "3. DeepEval scorers, which depend on the default local scorer model path.\n",
+        "\n",
+        "The notebook automatically selects the available provider from your environment, with OpenAI taking precedence when both OpenAI and Gemini keys are set, to match the library's default-provider logic."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "1f2befa6",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents\n",
+        "- [Introduction](#toc1__)\n",
+        "- [About ValidMind](#toc2__)\n",
+        "  - [Before you begin](#toc2_1__)\n",
+        "  - [New to ValidMind?](#toc2_2__)\n",
+        "  - [Key concepts](#toc2_3__)\n",
+        "- [Setting up](#toc3__)\n",
+        "  - [Install the ValidMind Library](#toc3_1__)\n",
+        "  - [Connect to the ValidMind Platform](#toc3_2__)\n",
+        "    - [Register or select a model](#toc3_2_1__)\n",
+        "    - [Choose a documentation template](#toc3_2_2__)\n",
+        "    - [Get your code snippet](#toc3_2_3__)\n",
+        "  - [Initialize the notebook environment](#toc3_3__)\n",
+        "- [Getting to know ValidMind](#toc4__)\n",
+        "  - [Preview the documentation template](#toc4_1__)\n",
+        "  - [View model documentation in the ValidMind Platform](#toc4_2__)\n",
+        "- [Configure the judge provider](#toc5__)\n",
+        "- [Prompt-validation tests](#toc6__)\n",
+        "- [RAGAS tests](#toc7__)\n",
+        "- [DeepEval scorers](#toc8__)\n",
+        "- [In summary](#toc9__)\n",
+        "- [Next steps](#toc10__)\n",
+        "  - [Discover more learning resources](#toc10_1__)\n",
+        "- [Upgrade ValidMind](#toc11__)\n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "b77005b8",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Introduction\n",
+        "\n",
+        "This notebook shows how to configure and validate the default judge LLM and judge embeddings used by the ValidMind Library for LLM-focused tests.\n",
+        "\n",
+        "It walks through the provider configuration used by three important evaluation paths:\n",
+        "- prompt-validation tests\n",
+        "- RAGAS-based tests\n",
+        "- DeepEval scorers\n",
+        "\n",
+        "Along the way, you will initialize ValidMind model and dataset objects, inspect the resolved judge configuration, run representative tests, and optionally log the results to the ValidMind Platform. By the end of the notebook, you will have a practical reference for configuring judge models and understanding how those settings affect different LLM evaluation workflows."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "56ecff8d",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "e8743d30",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "Before running this notebook, make sure you have:\n",
+        "- a Python environment with the ValidMind Library and its LLM dependencies installed\n",
+        "- access to a ValidMind account if you want to log results to the ValidMind Platform\n",
+        "- credentials for one supported judge provider in your environment\n",
+        "\n",
+        "This notebook supports:\n",
+        "- OpenAI via `OPENAI_API_KEY`, with optional `OPENAI_MODEL` and `OPENAI_EMBEDDINGS_MODEL` overrides. The current default judge model is `gpt-4.1` and the default embeddings model is `text-embedding-3-small`.\n",
+        "- Gemini via `GOOGLE_API_KEY` or `GEMINI_API_KEY`, with optional `GEMINI_MODEL` and `GEMINI_EMBEDDINGS_MODEL` overrides. The current defaults are `gemini-2.5-pro` and `models/text-embedding-004`.\n",
+        "- Azure OpenAI via `AZURE_OPENAI_KEY`, `AZURE_OPENAI_ENDPOINT`, and `AZURE_OPENAI_MODEL`. The current default embeddings model is `text-embedding-3-small`.\n",
+        "\n",
+        "You can still run the notebook locally without connecting to the ValidMind Platform, but connecting a model document makes it easier to review and share results after the tests complete."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "ee479eb5",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you are new to the ValidMind Library, start with the [ValidMind Library overview](https://docs.validmind.ai/developer/validmind-library.html). It introduces the core workflow for initializing models and datasets, running tests, and logging outputs back to the ValidMind Platform.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>You only need a ValidMind account if you want to log results to the ValidMind Platform.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "689e55db",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**Judge LLM**: The language model used by ValidMind to evaluate prompts, answers, contexts, and other LLM outputs.\n",
+        "\n",
+        "**Judge embeddings**: The embeddings model used when a test requires semantic similarity or retrieval-based comparison.\n",
+        "\n",
+        "**Provider credentials**: Environment variables that tell ValidMind which provider to use for judge evaluation. In this notebook, the provider is resolved automatically from the credentials available in your environment.\n",
+        "\n",
+        "**ValidMind dataset**: A dataset initialized with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset). Wrapping a pandas DataFrame this way lets you pass the dataset into ValidMind tests with the metadata those tests expect.\n",
+        "\n",
+        "**ValidMind model**: A model initialized with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). In this notebook, we use a lightweight model object to run prompt-validation tests against a prompt template.\n",
+        "\n",
+        "**Prompt-validation tests**: Tests that evaluate prompt quality and instructions, such as clarity or bias, using a judge LLM.\n",
+        "\n",
+        "**RAGAS tests**: Retrieval-augmented generation tests that can rely on both a judge LLM and judge embeddings.\n",
+        "\n",
+        "**DeepEval scorers**: LLM-based scorers used for tasks such as answer relevancy and hallucination detection. These use the evaluation model path but do not require judge embeddings."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "8d6a8300",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "Install the ValidMind Library with the optional LLM dependencies so the notebook can run prompt-validation tests, RAGAS tests, and DeepEval scorers:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "da644666",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "%pip install -q \"validmind[llm]\""
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "17c1c7d2",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Connect to the ValidMind Platform\n",
+        "\n",
+        "If you want to log notebook outputs to the ValidMind Platform, start by selecting an existing model in your inventory or registering a new one. This notebook can run without platform connectivity, but linking it to a model document gives you a place to review the results after the examples finish.\n",
+        "\n",
+        "<a id='toc3_2_1__'></a>\n",
+        "\n",
+        "#### Register or select a model\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+        "2. Open **Inventory** and either select an existing model or click **+ Register Model**.\n",
+        "3. Complete the model details and stakeholder assignments if you are registering a new model.\n",
+        "4. Open the document where you want notebook results to be logged.\n",
+        "\n",
+        "Using a real model document is especially helpful in this notebook because it lets you compare the locally executed tests with the sections available in your template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "dc628c6c",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_2__'></a>\n",
+        "\n",
+        "#### Choose a documentation template\n",
+        "\n",
+        "If you plan to log results from this notebook, make sure your model document uses a template that includes sections for the LLM evaluation results you want to capture.\n",
+        "\n",
+        "This is important because tests that are not included in the selected template will not appear automatically in the Platform document, even if you run and log them successfully from the notebook. If you want to document those results as well, you can add the relevant sections or tests manually in the Platform.\n",
+        "\n",
+        "Before running the notebook, preview the template structure and confirm that the document has the sections you expect for your workflow."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "702f5196",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the code snippet associated with your model document so that test results are uploaded to the correct destination in the ValidMind Platform.\n",
+        "\n",
+        "1. In the model sidebar, open **Getting Started**.\n",
+        "2. Select the document you want to update.\n",
+        "3. Copy the generated code snippet.\n",
+        "4. Load the values from an `.env` file or replace the placeholders in the example below with your own values.\n",
+        "\n",
+        "Using environment variables is usually the easiest way to keep the notebook portable across environments and avoid hard-coding connection details in the notebook itself."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "c52a42d0",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    api_host=\"http://localhost:5000/api/v1/tracking\",\n",
+        "    api_key=\"..\",\n",
+        "    api_secret=\"..\",\n",
+        "    document=\"documentation\", # requires library >=2.12.0\n",
+        "    model=\"..\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "3657a7a4",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3__'></a>\n",
+        "\n",
+        "### Initialize the notebook environment\n",
+        "\n",
+        "Load environment variables and prepare the notebook session. In the execution cells that follow, you will import the libraries needed for this walkthrough, inspect the configured judge provider, and create the ValidMind objects used by the example tests.\n",
+        "\n",
+        "This section is also where the notebook becomes reproducible: once your credentials and dependencies are in place, the remaining sections can be run top to bottom."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "979988a9",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import os\n",
+        "\n",
+        "import pandas as pd\n",
+        "\n",
+        "from validmind.ai import utils as ai_utils\n",
+        "from validmind.models import Prompt\n",
+        "from validmind.tests import run_test"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "3db58d74",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Getting to know ValidMind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "45450d55",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "If you have already connected this notebook to a model document, you can preview the active template structure directly from the library.\n",
+        "\n",
+        "This is useful for confirming where logged results will appear before you run the prompt-validation, RAGAS, and DeepEval examples below. It also helps you spot gaps early if a test you plan to run is not represented in the current template:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "98f0b602",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.preview_template()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "58e1d75f",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### View model documentation in the ValidMind Platform\n",
+        "\n",
+        "After you run the notebook and log results, open your model document in the ValidMind Platform to review how the test outputs were added.\n",
+        "\n",
+        "Comparing the template preview with the rendered document is a good way to confirm that your notebook is writing results to the expected sections. If a result does not appear automatically, check whether the corresponding test is part of the selected template before troubleshooting the notebook run itself."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "86038351",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Configure the judge provider\n",
+        "\n",
+        "The next cells load your environment variables, resolve the judge provider from the credentials available in your session, and initialize the ValidMind Library for result logging.\n",
+        "\n",
+        "This notebook uses the same provider resolution logic as the library itself:\n",
+        "- OpenAI is selected when `OPENAI_API_KEY` is available, with optional `OPENAI_MODEL` and `OPENAI_EMBEDDINGS_MODEL` overrides. The current defaults are `gpt-4.1` and `text-embedding-3-small`.\n",
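+        "- Azure OpenAI is selected when the Azure credentials (`AZURE_OPENAI_KEY` and `AZURE_OPENAI_ENDPOINT`) are available, using `AZURE_OPENAI_MODEL` for the judge model. The current default embeddings model is `text-embedding-3-small`.\n",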
+        "- Gemini is selected when `GOOGLE_API_KEY` or `GEMINI_API_KEY` is available, with optional `GEMINI_MODEL` and `GEMINI_EMBEDDINGS_MODEL` overrides. The current defaults are `gemini-2.5-pro` and `models/text-embedding-004`.\n",
+        "\n",
+        "If more than one provider is configured, OpenAI takes precedence to match the library default.\n",
+        "\n",
+        "This matters because the same default judge configuration is reused across multiple evaluation paths, so checking it once here makes the later test results easier to interpret."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "a3efda1f",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Optional: override the default judge models for this notebook session.\n",
+        "# os.environ[\"OPENAI_MODEL\"] = \"gpt-4.1\"\n",
+        "# os.environ[\"GEMINI_MODEL\"] = \"gemini-2.5-pro\"\n",
+        "# os.environ[\"GEMINI_EMBEDDINGS_MODEL\"] = \"models/text-embedding-004\""
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "f0438cf0",
+      "metadata": {},
+      "source": [
+        "The next cells import the required libraries, inspect the resolved provider configuration, and connect the notebook to the ValidMind Platform. Reading the printed provider and class names is a quick sanity check that your environment is using the judge setup you expect before any tests are executed."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "089f10fa",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Load credentials and resolve the provider\n",
+        "\n",
+        "Run the next cells to:\n",
+        "- import the libraries used in this notebook\n",
+        "- inspect the provider selected from your environment\n",
+        "- inspect the resolved judge LLM and judge embeddings classes\n",
+        "- initialize the ValidMind Library with your platform credentials\n",
+        "\n",
+        "If both OpenAI and Gemini credentials are available, OpenAI will be selected to match the default provider precedence used by the library.\n",
+        "\n",
+        "This section gives you a concrete view of the effective configuration that the later prompt-validation, RAGAS, and DeepEval examples will use."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "f1479922",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from validmind.ai.utils import get_client_and_model, get_judge_config\n",
+        "\n",
+        "client, model = get_client_and_model()\n",
+        "judge_llm, judge_embeddings = get_judge_config()\n",
+        "\n",
+        "print(\"resolved_model:\", model)\n",
+        "print(\"judge_llm_type:\", type(judge_llm).__name__)\n",
+        "print(\"judge_embeddings_type:\", type(judge_embeddings).__name__)\n",
+        "\n",
+        "# Useful for Gemini/OpenAI/Azure debugging\n",
+        "print(\"judge_llm:\", judge_llm)\n",
+        "print(\"judge_embeddings:\", judge_embeddings)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "e7868c71",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Prompt-validation tests\n",
+        "\n",
+        "This section validates the default judge LLM path with two representative prompt-validation tests. For this smoke test, we use a simple prompt-only model because these tests evaluate the prompt template itself and do not require model predictions.\n",
+        "\n",
+        "The example below creates a ValidMind model with `vm.init_model()` and attaches a prompt template to it. That gives the tests a standard object to inspect, even though there is no real predictive model behind the example.\n",
+        "\n",
+        "- `Clarity` checks whether the prompt instructions are clear and well-scoped.\n",
+        "- `Bias` checks whether the prompt structure or examples could induce biased behavior."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "7cc07ba8",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "system_prompt = \"\"\"\n",
+        "You are an AI assistant specialized in sentiment analysis for financial news.\n",
+        "You will classify each sentence as positive, negative, or neutral.\n",
+        "Respond only with the sentiment label.\n",
+        "\"\"\".strip()\n",
+        "\n",
+        "\n",
+        "def noop_predict(_):\n",
+        "    return \"dummy\"\n",
+        "\n",
+        "\n",
+        "vm_prompt_model = vm.init_model(\n",
+        "    input_id=\"judge_prompt_model\",\n",
+        "    predict_fn=noop_predict,\n",
+        "    prompt=Prompt(template=system_prompt, variables=[]),\n",
+        ")\n",
+        "\n",
+        "vm_prompt_model.prompt.template"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "40298f6b",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "run_test(\n",
+        "    test_id=\"validmind.prompt_validation.Clarity\",\n",
+        "    inputs={\"model\": vm_prompt_model},\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "4180b0f1",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "run_test(\n",
+        "    test_id=\"validmind.prompt_validation.Bias\",\n",
+        "    inputs={\"model\": vm_prompt_model},\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "9935d075",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## RAGAS tests\n",
+        "\n",
+        "This section validates the default judge LLM plus default judge embeddings path. The selected tests are useful because they exercise the RAGAS integration that historically depended on the default OpenAI setup.\n",
+        "\n",
+        "The example data is wrapped with `vm.init_dataset()`, which turns the pandas DataFrame into a ValidMind dataset object that can be passed directly into these tests.\n",
+        "\n",
+        "- `ResponseRelevancy` exercises the judge LLM and embeddings path.\n",
+        "- `AnswerCorrectness` exercises semantic and factual comparison with judge embeddings.\n",
+        "- `Faithfulness` is a companion smoke test for the judge LLM path on RAG data.\n",
+        "\n",
+        "These tests produce Plotly figures, so this notebook focuses on running and logging the results rather than comparing visual output in detail."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "17cbf0e3",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "rag_df = pd.DataFrame(\n",
+        "    {\n",
+        "        \"user_input\": [\n",
+        "            \"What happened to the company's revenue guidance?\",\n",
+        "            \"Why did the bank's stock decline?\",\n",
+        "            \"What was the announced dividend decision?\",\n",
+        "        ],\n",
+        "        \"retrieved_contexts\": [\n",
+        "            [\n",
+        "                \"The company raised its full-year revenue guidance after reporting strong demand in the enterprise segment.\",\n",
+        "                \"Management said the improved forecast was driven by larger-than-expected renewals.\",\n",
+        "            ],\n",
+        "            [\n",
+        "                \"The bank's stock declined after it reported higher-than-expected credit losses in its consumer portfolio.\",\n",
+        "                \"Executives also warned that provisions may remain elevated next quarter.\",\n",
+        "            ],\n",
+        "            [\n",
+        "                \"The board announced that it would keep the quarterly dividend unchanged.\",\n",
+        "                \"Management said capital return policy remains the same for now.\",\n",
+        "            ],\n",
+        "        ],\n",
+        "        \"response\": [\n",
+        "            \"The company increased its full-year revenue guidance after stronger enterprise demand.\",\n",
+        "            \"The bank's stock fell because it disclosed higher-than-expected credit losses.\",\n",
+        "            \"The company kept its dividend unchanged.\",\n",
+        "        ],\n",
+        "        \"reference\": [\n",
+        "            \"The company raised its full-year revenue guidance because demand in the enterprise segment was strong.\",\n",
+        "            \"The bank's shares dropped after it reported higher-than-expected credit losses.\",\n",
+        "            \"The board decided to leave the quarterly dividend unchanged.\",\n",
+        "        ],\n",
+        "    }\n",
+        ")\n",
+        "\n",
+        "vm_rag_ds = vm.init_dataset(\n",
+        "    dataset=rag_df,\n",
+        "    input_id=\"judge_rag_dataset\",\n",
+        "    text_column=\"user_input\",\n",
+        "    target_column=\"reference\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "fcdb6232",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "run_test(\n",
+        "    test_id=\"validmind.model_validation.ragas.ResponseRelevancy\",\n",
+        "    inputs={\"dataset\": vm_rag_ds},\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "25124a2f",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "run_test(\n",
+        "    test_id=\"validmind.model_validation.ragas.AnswerCorrectness\",\n",
+        "    inputs={\"dataset\": vm_rag_ds},\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "3a58bd42",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "run_test(\n",
+        "    test_id=\"validmind.model_validation.ragas.Faithfulness\",\n",
+        "    inputs={\"dataset\": vm_rag_ds},\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "8b65420f",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## DeepEval scorers\n",
+        "\n",
+        "This section validates the default local scorer model path used by DeepEval-based scorers in `validmind.scorers.llm.deepeval`.\n",
+        "\n",
+        "As in the RAGAS example, we create a ValidMind dataset with `vm.init_dataset()` so the scorer workflow runs against the same kind of object you would use in your own notebooks.\n",
+        "\n",
+        "These scorers do not use the judge embeddings object. For this notebook, we use two representative examples:\n",
+        "- `AnswerRelevancy`\n",
+        "- `Hallucination`\n",
+        "\n",
+        "They are included here so the notebook covers all three LLM evaluation surfaces:\n",
+        "- prompt-validation\n",
+        "- RAGAS\n",
+        "- DeepEval scorers"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "c34f2484",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "deepeval_df = pd.DataFrame(\n",
+        "    {\n",
+        "        \"input\": [\n",
+        "            \"What is the capital of France?\",\n",
+        "            \"Why did the company raise its full-year guidance?\",\n",
+        "            \"What did the board decide about the quarterly dividend?\",\n",
+        "        ],\n",
+        "        \"actual_output\": [\n",
+        "            \"The capital of France is Paris.\",\n",
+        "            \"The company raised guidance because enterprise demand was stronger than expected.\",\n",
+        "            \"The board kept the quarterly dividend unchanged.\",\n",
+        "        ],\n",
+        "        \"context\": [\n",
+        "            [\"France's capital city is Paris.\"],\n",
+        "            [\n",
+        "                \"Management raised its full-year guidance after reporting stronger-than-expected demand in the enterprise segment.\"\n",
+        "            ],\n",
+        "            [\n",
+        "                \"The board announced that the quarterly dividend would remain unchanged.\"\n",
+        "            ],\n",
+        "        ],\n",
+        "    }\n",
+        ")\n",
+        "\n",
+        "vm_deepeval_ds = vm.init_dataset(\n",
+        "    dataset=deepeval_df,\n",
+        "    input_id=\"judge_deepeval_dataset\",\n",
+        "    text_column=\"input\",\n",
+        "    target_column=\"actual_output\",\n",
+        ")\n",
+        "\n",
+        "deepeval_df"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "9a3cdae0",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm_deepeval_ds.assign_scores(metrics=[\n",
+        "    \"validmind.scorers.llm.deepeval.Hallucination\",\n",
+        "    \"validmind.scorers.llm.deepeval.AnswerRelevancy\"\n",
+        "])"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "d86a90ab",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this notebook, you learned how to:\n",
+        "- [x] configure the judge provider from environment credentials\n",
+        "- [x] override the default judge LLM and judge embeddings models\n",
+        "- [x] initialize ValidMind model and dataset objects for LLM evaluation workflows\n",
+        "- [x] run prompt-validation tests that use the judge LLM\n",
+        "- [x] run RAGAS tests that use the judge LLM and judge embeddings\n",
+        "- [x] run DeepEval scorers that use the local scorer model path"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "c7b72b3e",
+      "metadata": {},
+      "source": [
+        "<a id='toc10__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can use this notebook as a starting point for your own LLM evaluation workflows. A few practical follow-ups are:\n",
+        "- replace the sample prompt and datasets with your own evaluation inputs\n",
+        "- set `OPENAI_MODEL` / `OPENAI_EMBEDDINGS_MODEL` when you want to override the OpenAI judge pair, or `GEMINI_MODEL` / `GEMINI_EMBEDDINGS_MODEL` when you want to standardize the Gemini judge pair used across notebooks or environments\n",
+        "- expand the set of tests and scorers based on your use case"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "e5eb12d8",
+      "metadata": {},
+      "source": [
+        "<a id='toc10_1__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "To continue learning about testing and evaluation with the ValidMind Library, explore:\n",
+        "\n",
+        "- [Run tests and test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [ValidMind Library overview](https://docs.validmind.ai/developer/validmind-library.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "You can also visit the [ValidMind documentation](https://docs.validmind.ai/) for broader guidance on configuration, testing workflows, and model documentation."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "99a11a0e",
+      "metadata": {},
+      "source": [
+        "<a id='toc11__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, periodically check that you are using a recent version so you can access the latest provider integrations, tests, and product improvements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "cfed92f5",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "%pip show validmind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "58cc2437",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "aa5c4672",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-fe0b013da3464949b043e9dbdd34b608",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": ".venv-py31111",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.11.11"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}
diff --git a/site/notebooks/how_to/tests/run_tests/configure_tests/customize_test_result_descriptions.ipynb b/site/notebooks/how_to/tests/run_tests/configure_tests/customize_test_result_descriptions.ipynb
index 68c659a45d..9a0ae2e2dc 100644
--- a/site/notebooks/how_to/tests/run_tests/configure_tests/customize_test_result_descriptions.ipynb
+++ b/site/notebooks/how_to/tests/run_tests/configure_tests/customize_test_result_descriptions.ipynb
@@ -10,11 +10,11 @@
     "\n",
     "In this notebook, you'll learn how to take complete control over the context that drives test description generation. ValidMind provides a `context` parameter in `run_test` that accepts a dictionary with three complementary keys for comprehensive context management:\n",
     "\n",
-    "- `instructions`: Overwrites ValidMind’s default result description structure. If you provide custom instructions, they take full priority over the built-in ones. This parameter controls how the final description is structured and presented. Use this to specify formatting requirements, target different audiences (executives vs. technical teams), or ensure consistent report styles across your organization.  \n",
+    "- `instructions`: Overwrites ValidMind’s default result description structure. If you provide custom instructions, they take full priority over the built-in ones. This parameter controls how the final description is structured and presented. Use this to specify formatting requirements, target different audiences (executives vs. technical teams), or ensure consistent report styles across your organization.\n",
     "\n",
-    "- `test_description`: Overwrites the test’s built-in docstring if provided. This parameter contains the technical mechanics of how the test works. However, for generic tests where the methodology isn't the focus, you may use this to describe what's actually being analyzed—the specific variables, features, or metrics being plotted and their business meaning rather than the statistical mechanics. You can also override ValidMind's built-in test documentation if you prefer different structure or language. \n",
+    "- `test_description`: Overwrites the test’s built-in docstring if provided. This parameter contains the technical mechanics of how the test works. However, for generic tests where the methodology isn't the focus, you may use this to describe what's actually being analyzed—the specific variables, features, or metrics being plotted and their business meaning rather than the statistical mechanics. You can also override ValidMind's built-in test documentation if you prefer different structure or language.\n",
     "\n",
-    "- `additional_context`: Does not overwrite the instructions or test descriptions, but instead adds to them. This parameter provides any background information you want the LLM to consider when analyzing results. It could include business priorities, acceptance thresholds, regulatory requirements, domain expertise, use case details, model purpose, or stakeholder concerns—any information that helps the LLM better understand and interpret your specific situation.\n",
+    "- `additional_context`: Does not overwrite the instructions or test descriptions, but instead adds to them. This parameter provides any background information you want the LLM to consider when analyzing results. It could include business priorities, acceptance thresholds, regulatory requirements, domain expertise, use case details, record (model) purpose, or stakeholder concerns—any information that helps the LLM better understand and interpret your specific situation.\n",
     "\n",
     "Together, these context parameters allow you to manage every aspect of how the LLM interprets and presents your test results. Whether you need to align descriptions with regulatory requirements, target specific audiences, incorporate organizational policies, or ensure consistent reporting standards, this context management approach gives you the flexibility to generate descriptions that perfectly match your needs while still leveraging the analytical power of AI-generated insights."
    ]
@@ -113,17 +113,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+    "\n",
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -134,10 +136,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
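+    "    If you cannot locate your Development document, make sure Development-type documents are enabled for model records, then create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",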
     "2. Under **TEMPLATE**, select `Binary classification`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -151,11 +155,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -190,7 +196,7 @@
     "\n",
     "### Initialize the Python environment\n",
     "\n",
-    "After you've connected to your model register in the ValidMind Platform, let's import the necessary libraries and set up your Python environment for data analysis:"
+    "After you've connected to your model registered in the ValidMind Platform, let's import the necessary libraries and set up your Python environment for data analysis:"
    ]
   },
   {
@@ -329,9 +335,12 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Additionally, you'll need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data. \n",
+    "You'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for our model.\n",
+    "\n",
+    "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+    "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
     "\n",
-    "Simply intialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+    "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
    ]
   },
   {
@@ -695,7 +704,7 @@
     "\n",
     "### Understanding the additional context parameter\n",
     "\n",
-    "The `additional_context` parameter can be used to add any background information that helps put the test results into context. For example, you might include business priorities and constraints that shape how results are interpreted, risk tolerance levels or acceptance criteria specific to your organization, regulatory requirements that influence what counts as acceptable performance, or details about the intended use case of the model in production. These are just examples—the parameter is flexible and can capture whatever context is most relevant to your needs.\n",
+    "The `additional_context` parameter can be used to add any background information that helps put the test results into context. For example, you might include business priorities and constraints that shape how results are interpreted, risk tolerance levels or acceptance criteria specific to your organization, regulatory requirements that influence what counts as acceptable performance, or details about the intended use case of the record (model) in production. These are just examples—the parameter is flexible and can capture whatever context is most relevant to your needs.\n",
     "\n",
     "**Key difference:**\n",
     "- `instructions`: \"Write a 3-paragraph executive summary\"\n",
@@ -843,7 +852,7 @@
     "A short description of what the test does and what kind of output it generates.\n",
     "\n",
     "- **Purpose:**\n",
-    "Explains why the test exists and what it is designed to evaluate. This section provides the context for the test’s role in model documentation, often describing the intended use cases or the kind of insights it supports.\n",
+    "Explains why the test exists and what it is designed to evaluate. This section provides the context for the test’s role in documentation, often describing the intended use cases or the kind of insights it supports.\n",
     "\n",
     "- **Test mechanism**:\n",
     "Describes how the test works internally. This includes the approach or methodology, what inputs are used, how results are calculated or visualized, and the logic behind the test’s implementation.\n",
diff --git a/site/notebooks/how_to/tests/run_tests/configure_tests/enable_pii_detection.ipynb b/site/notebooks/how_to/tests/run_tests/configure_tests/enable_pii_detection.ipynb
index ddbd734e9d..bc07a3cffe 100644
--- a/site/notebooks/how_to/tests/run_tests/configure_tests/enable_pii_detection.ipynb
+++ b/site/notebooks/how_to/tests/run_tests/configure_tests/enable_pii_detection.ipynb
@@ -1,674 +1,669 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "fafe2741",
-   "metadata": {},
-   "source": [
-    "# Enable PII detection in tests"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "75cb4b61",
-   "metadata": {},
-   "source": [
-    "Learn how to enable and configure Personally Identifiable Information (PII) detection when running tests with the ValidMind Library. Choose whether or not to include PII in test descriptions generated, or whether or not to include PII in test results logged to the ValidMind Platform."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e4ebad56",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library with PII detection](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_1__)    \n",
-    "- [Using PII detection](#toc3__)    \n",
-    "  - [Create a custom test that outputs PII](#toc3_1__)    \n",
-    "  - [Run test under different PII detection modes](#toc3_2__)    \n",
-    "    - [disabled](#toc3_2_1__)    \n",
-    "    - [test_results](#toc3_2_2__)    \n",
-    "    - [test_descriptions](#toc3_2_3__)    \n",
-    "    - [all](#toc3_2_4__)    \n",
-    "  - [Override detection](#toc3_3__)    \n",
-    "    - [Override test result logging](#toc3_3_1__)    \n",
-    "    - [Override test descriptions and test result logging](#toc3_3_2__)    \n",
-    "  - [Review logged test results](#toc3_4__)    \n",
-    "- [Troubleshooting](#toc4__)    \n",
-    "- [Learn more](#toc5__)    \n",
-    "- [Upgrade ValidMind](#toc6__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a2f801a9",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models. \n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e920bce6",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3a3fb4fc",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "9a49b776",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "41aee68d",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ba30e377",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library with PII detection\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To use PII detection powered by [Microsoft Presidio](https://microsoft.github.io/presidio/), install the library with the explicit `[pii-detection]` extra specifier:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b830ae91",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q \"validmind[pii-detection]\""
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4b44677b",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library\n",
-    "\n",
-    "ValidMind generates a unique _code snippet_ for each registered model to connect with your developer environment. You initialize the ValidMind Library with this code snippet, which ensures that your documentation and tests are uploaded to the correct model when you run the notebook."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "84464a2b",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "eeda4c8c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "62f24552",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Using PII detection"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "fd9b6e44",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Create a custom test that outputs PII\n",
-    "\n",
-    "To demonstrate the feature, we'll need a test that outputs PII. First we'll create a custom test that returns:\n",
-    "\n",
-    "- A description string containing PII (name, email, phone)\n",
-    "- A small table containing PII in columns\n",
-    "\n",
-    "This output mirrors the structure used in other custom test notebooks and will exercise both table and description PII detection paths. However, if structured detection is unavailable, the library falls back to token-level text scans when possible."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "04d8c802",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "from validmind import test\n",
-    "\n",
-    "@test(\"pii_demo.PIIDetection\")\n",
-    "def pii_custom_test():\n",
-    "    \"\"\"A custom test that returns demo PII.\n",
-    "    This default test description will display when PII is not sent to the LLM to generate test descriptions based on test result data.\"\"\"\n",
-    "    return pd.DataFrame(\n",
-    "        {\n",
-    "            \"name\": [\"Jane Smith\", \"John Doe\", \"Alice Johnson\"],\n",
-    "            \"email\": [\n",
-    "                \"jane.smith@bank.example\",\n",
-    "                \"john.doe@company.example\",\n",
-    "                \"alice.johnson@service.example\",\n",
-    "            ],\n",
-    "            \"phone\": [\"(212) 555-9876\", \"(415) 555-1234\", \"(646) 555-5678\"],\n",
-    "        }\n",
-    "    )"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "53e02410",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about custom tests?</b></span>\n",
-    "<br></br>\n",
-    "Check out our extended introduction to custom tests — <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/implement_custom_tests.html\" style=\"color: #DE257E;\"><b>Implement custom tests</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c4065f2a",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Run test under different PII detection modes\n",
-    "\n",
-    "Next, let's import [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module to run our custom test via a function called `run_pii_test()` that catches exceptions to observe blocking behavior when PII is present:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b42288e5",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import os\n",
-    "from validmind.tests import run_test\n",
-    "\n",
-    "# Run test and tag result with unique `result_id`\n",
-    "def run_pii_test(result_id=\"\"):\n",
-    "    try:\n",
-    "        test_name = f\"pii_demo.PIIDetection:{result_id}\"\n",
-    "        result = run_test(test_name)\n",
-    "\n",
-    "        # Check if the test description was generated by LLM\n",
-    "        if not result._was_description_generated:\n",
-    "            print(\"PII detected: LLM-generated test description skipped\")\n",
-    "        else:\n",
-    "            print(\"No PII detected or detection disabled: Test description generated by LLM\")\n",
-    "\n",
-    "        # Try logging test results to the ValidMind Platform\n",
-    "        result.log()\n",
-    "        print(\"No PII detected or detection disabled: Test results logged to the ValidMind Platform\")\n",
-    "    except Exception as e:\n",
-    "        print(\"PII detected: Test results not logged to the ValidMind Platform\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "867dbd94",
-   "metadata": {},
-   "source": [
-    "We'll then switch the `VALIDMIND_PII_DETECTION` environment variable across modes in the below examples.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note that since we are running a custom test that does not exist in your model's default documentation template, we'll receive output indicating that a test-driven block doesn't currently exist in your model's documentation for that particular test ID.</b></span>\n",
-    "<br></br>\n",
-    "That's expected, as when we run custom tests the results logged need to be manually added to your documentation within the ValidMind Platform or added to your documentation template.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0e151763",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_1__'></a>\n",
-    "\n",
-    "#### disabled\n",
-    "\n",
-    "When detection is set to `disabled`, tests run and generate test descriptions. Logging tests with [`.log()`](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) will also send test descriptions and test results to the ValidMind Platform as usual:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "3078af64",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(\"\\n=== Mode: disabled ===\")\n",
-    "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"disabled\"\n",
-    "\n",
-    "# Run test and tag result with unique ID `disabled`\n",
-    "run_pii_test(\"disabled\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c797d2e3",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_2__'></a>\n",
-    "\n",
-    "#### test_results\n",
-    "\n",
-    "When detection is set for `test_results`, tests run and generate test descriptions for review in your environment, but logging tests will not send descriptions or test results to the ValidMind Platform:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "12e61a80",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(\"\\n=== Mode: test_results ===\")\n",
-    "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"test_results\"\n",
-    "\n",
-    "# Run test and tag result with unique ID `results_blocked`\n",
-    "run_pii_test(\"results_blocked\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "9d5cb41c",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_3__'></a>\n",
-    "\n",
-    "#### test_descriptions\n",
-    "\n",
-    "When detection is set for `test_descriptions`, tests run but will not generate test descriptions, and logging tests will not send descriptions but will send test results to the ValidMind Platform:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "feba6207",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(\"\\n=== Mode: test_descriptions ===\")\n",
-    "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"test_descriptions\"\n",
-    "\n",
-    "# Run test and tag result with unique ID `desc_blocked`\n",
-    "run_pii_test(\"desc_blocked\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1d3d7256",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_4__'></a>\n",
-    "\n",
-    "#### all\n",
-    "\n",
-    "When detection is set to `all`, tests run will not generate test descriptions or log test results to the ValidMind Platform."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "af5040b5",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(\"\\n=== Mode: all ===\")\n",
-    "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"all\"\n",
-    "\n",
-    "# Run test and tag result with unique ID `all_blocked`\n",
-    "run_pii_test(\"all_blocked\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b1a5fd8e",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3__'></a>\n",
-    "\n",
-    "### Override detection\n",
-    "\n",
-    "You can override blocking by passing `unsafe=True` to `result.log(unsafe=True)`, but this is not recommended outside controlled workflows.\n",
-    "\n",
-    "To demonstrate, let's rerun our custom test with some override scenarios."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8a378b22",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3_1__'></a>\n",
-    "\n",
-    "#### Override test result logging\n",
-    "\n",
-    "First, let's rerun our custom test with detection set to `all`, which will send the test results but not the test descriptions to the ValidMind Platform:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0387be21",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(\"\\n=== Mode: all & unsafe=True ===\")\n",
-    "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"all\"\n",
-    "\n",
-    "# Run test and tag result with unique ID `override_results`\n",
-    "try:\n",
-    "    result = run_test(\"pii_demo.PIIDetection:override_results\")\n",
-    "\n",
-    "    # Check if the test description was generated by LLM\n",
-    "    if not result._was_description_generated:\n",
-    "        print(\"PII detected: LLM-generated test description skipped\")\n",
-    "    else:\n",
-    "        print(\"No PII detected or detection disabled: Test description generated by LLM\")\n",
-    "\n",
-    "    # Try logging test results to the ValidMind Platform\n",
-    "    result.log(unsafe=True)\n",
-    "    print(\"No PII detected, detection disabled, or override set: Test results logged to the ValidMind Platform\")\n",
-    "except Exception as e:\n",
-    "    print(\"PII detected: Test results not logged to the ValidMind Platform\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8197c39c",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3_2__'></a>\n",
-    "\n",
-    "#### Override test descriptions and test result logging\n",
-    "\n",
-    "To send both the test descriptions and test results via override, set the `VALIDMIND_PII_DETECTION` environment variable to `test_results` while including the override flag:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b40a2670",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(\"\\n=== Mode: test_results & unsafe=True ===\")\n",
-    "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"test_results\"\n",
-    "\n",
-    "# Run test and tag result with unique ID `override_both`\n",
-    "try:\n",
-    "    result = run_test(\"pii_demo.PIIDetection:override_both\")\n",
-    "\n",
-    "    # Check if the test description was generated by LLM\n",
-    "    if not result._was_description_generated:\n",
-    "        print(\"PII detected: LLM-generated test description skipped\")\n",
-    "    else:\n",
-    "        print(\"No PII detected, detection disabled, or override set: Test description generated by LLM\")\n",
-    "\n",
-    "    # Try logging test results to the ValidMind Platform\n",
-    "    result.log(unsafe=True)\n",
-    "    print(\"No PII detected, detection disabled, or override set: Test results logged to the ValidMind Platform\")\n",
-    "except Exception as e:\n",
-    "    print(\"PII detected: Test results not logged to the ValidMind Platform\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f2ce4348",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_4__'></a>\n",
-    "\n",
-    "### Review logged test results\n",
-    "\n",
-    "Now let's take a look at the results that were logged to the ValidMind Platform:\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier.\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "3. Click on any section heading to expand that section to add a new test-driven block ([Need more help?](https://docs.validmind.ai/developer/model-documentation/work-with-test-results.html)).\n",
-    "\n",
-    "4. Under TEST-DRIVEN in the sidebar, click **Custom**.\n",
-    "\n",
-    "5. Confirm that you're able to insert the following logged results:\n",
-    "\n",
-    "    - `pii_demo.PIIDetection:disabled`\n",
-    "    - `pii_demo.PIIDetection:desc_blocked`\n",
-    "    - `pii_demo.PIIDetection:override_results`\n",
-    "    - `pii_demo.PIIDetection:override_both`"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d034b04c",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Troubleshooting\n",
-    "\n",
-    "- [x] If you see warnings that Presidio or Presidio analyzer is unavailable, ensure you installed extras: `validmind[pii-detection]`.\n",
-    "- [x] Ensure your environment is restarted after installing new packages if imports fail."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1da184e0",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Learn more\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "bcaf7fd4",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you'll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "dffb39a5",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "9e9f387d",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "faf6cb0d",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-096666bfeef04fd7802d45e5dc221ca2",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "Python 3",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Enable PII detection in tests"
+      ],
+      "id": "adbd775e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Learn how to enable and configure Personally Identifiable Information (PII) detection when running tests with the ValidMind Library. Choose whether or not to include PII in test descriptions generated, or whether or not to include PII in test results logged to the ValidMind Platform."
+      ],
+      "id": "6014f87e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library with PII detection](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_1__)    \n",
+        "- [Create a custom test that outputs PII](#toc3__)    \n",
+        "- [Running tests under different PII detection modes](#toc4__)    \n",
+        "  - [disabled](#toc4_1__)    \n",
+        "  - [test_results](#toc4_2__)    \n",
+        "  - [test_descriptions](#toc4_3__)    \n",
+        "  - [all](#toc4_4__)    \n",
+        "- [Overriding detection](#toc5__)    \n",
+        "  - [Override test result logging](#toc5_1__)    \n",
+        "  - [Override test descriptions and test result logging](#toc5_2__)    \n",
+        "- [Review logged test results](#toc6__)    \n",
+        "- [Troubleshooting](#toc7__)    \n",
+        "- [Learn more](#toc8__)    \n",
+        "- [Upgrade ValidMind](#toc9__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "b92af62b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models. \n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators."
+      ],
+      "id": "570a178e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ],
+      "id": "df929220"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records (such as models) and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ],
+      "id": "f626d8bd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "deb8fd73"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "32293a17"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library with PII detection\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To use PII detection powered by [Microsoft Presidio](https://microsoft.github.io/presidio/), install the library with the explicit `[pii-detection]` extra specifier:"
+      ],
+      "id": "6e23f9b2"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q \"validmind[pii-detection]\""
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "b830ae91"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library\n",
+        "\n",
+        "ValidMind generates a unique _code snippet_ for each registered model to connect with your developer environment. You initialize the ValidMind Library with this code snippet, which ensures that your documentation and tests are uploaded to the correct model when you run the notebook."
+      ],
+      "id": "fa8a1a7d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "3a467dc2"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "eeda4c8c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Create a custom test that outputs PII\n",
+        "\n",
+        "To demonstrate the feature, we'll need a test that outputs PII. First we'll create a custom test that returns:\n",
+        "\n",
+        "- A description string containing PII (name, email, phone)\n",
+        "- A small table containing PII in columns\n",
+        "\n",
+        "This output mirrors the structure used in other custom test notebooks and will exercise both table and description PII detection paths. If structured detection is unavailable, the library falls back to token-level text scans when possible."
+      ],
+      "id": "82638dab"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "from validmind import test\n",
+        "\n",
+        "@test(\"pii_demo.PIIDetection\")\n",
+        "def pii_custom_test():\n",
+        "    \"\"\"A custom test that returns demo PII.\n",
+        "    This default test description will display when PII is not sent to the LLM to generate test descriptions based on test result data.\"\"\"\n",
+        "    return pd.DataFrame(\n",
+        "        {\n",
+        "            \"name\": [\"Jane Smith\", \"John Doe\", \"Alice Johnson\"],\n",
+        "            \"email\": [\n",
+        "                \"jane.smith@bank.example\",\n",
+        "                \"john.doe@company.example\",\n",
+        "                \"alice.johnson@service.example\",\n",
+        "            ],\n",
+        "            \"phone\": [\"(212) 555-9876\", \"(415) 555-1234\", \"(646) 555-5678\"],\n",
+        "        }\n",
+        "    )"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "04d8c802"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about custom tests?</b></span>\n",
+        "<br></br>\n",
+        "Check out our extended introduction to custom tests — <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/implement_custom_tests.html\" style=\"color: #DE257E;\"><b>Implement custom tests</b></a></div>"
+      ],
+      "id": "96878fab"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Running tests under different PII detection modes\n",
+        "\n",
+        "Next, let's import [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module to run our custom test via a function called `run_pii_test()` that catches exceptions to observe blocking behavior when PII is present:"
+      ],
+      "id": "0faaceb5"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import os\n",
+        "from validmind.tests import run_test\n",
+        "\n",
+        "# Run test and tag result with unique `result_id`\n",
+        "def run_pii_test(result_id=\"\"):\n",
+        "    try:\n",
+        "        test_name = f\"pii_demo.PIIDetection:{result_id}\"\n",
+        "        result = run_test(test_name)\n",
+        "\n",
+        "        # Check if the test description was generated by LLM\n",
+        "        if not result._was_description_generated:\n",
+        "            print(\"PII detected: LLM-generated test description skipped\")\n",
+        "        else:\n",
+        "            print(\"No PII detected or detection disabled: Test description generated by LLM\")\n",
+        "\n",
+        "        # Try logging test results to the ValidMind Platform\n",
+        "        result.log()\n",
+        "        print(\"No PII detected or detection disabled: Test results logged to the ValidMind Platform\")\n",
+        "    except Exception as e:\n",
+        "        print(\"PII detected: Test results not logged to the ValidMind Platform\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "b42288e5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We'll then switch the `VALIDMIND_PII_DETECTION` environment variable across modes in the examples below.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note that since we are running a custom test that does not exist in your model's default documentation template, we'll receive output indicating that a test-driven block doesn't currently exist in your model's documentation for that particular test ID.</b></span>\n",
+        "<br></br>\n",
+        "That's expected, as when we run custom tests the results logged need to be manually added to your documentation within the ValidMind Platform or added to your documentation template.</div>"
+      ],
+      "id": "9a6e3398"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### disabled\n",
+        "\n",
+        "When detection is set to `disabled`, tests run and generate test descriptions. Logging tests with [`.log()`](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) will also send test descriptions and test results to the ValidMind Platform as usual:"
+      ],
+      "id": "9801463d"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "print(\"\\n=== Mode: disabled ===\")\n",
+        "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"disabled\"\n",
+        "\n",
+        "# Run test and tag result with unique ID `disabled`\n",
+        "run_pii_test(\"disabled\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "3078af64"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### test_results\n",
+        "\n",
+        "When detection is set to `test_results`, tests run and generate test descriptions for review in your environment, but logging tests will not send descriptions or test results to the ValidMind Platform:"
+      ],
+      "id": "89de78cc"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "print(\"\\n=== Mode: test_results ===\")\n",
+        "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"test_results\"\n",
+        "\n",
+        "# Run test and tag result with unique ID `results_blocked`\n",
+        "run_pii_test(\"results_blocked\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "12e61a80"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### test_descriptions\n",
+        "\n",
+        "When detection is set to `test_descriptions`, tests run but will not generate test descriptions, and logging tests will not send descriptions but will send test results to the ValidMind Platform:"
+      ],
+      "id": "8fbe427e"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "print(\"\\n=== Mode: test_descriptions ===\")\n",
+        "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"test_descriptions\"\n",
+        "\n",
+        "# Run test and tag result with unique ID `desc_blocked`\n",
+        "run_pii_test(\"desc_blocked\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "feba6207"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4__'></a>\n",
+        "\n",
+        "### all\n",
+        "\n",
+        "When detection is set to `all`, tests run but will not generate test descriptions, and logging tests will not send test results to the ValidMind Platform:"
+      ],
+      "id": "0e8950d1"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "print(\"\\n=== Mode: all ===\")\n",
+        "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"all\"\n",
+        "\n",
+        "# Run test and tag result with unique ID `all_blocked`\n",
+        "run_pii_test(\"all_blocked\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "af5040b5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Overriding detection\n",
+        "\n",
+        "You can override blocking by passing `unsafe=True` to `result.log()`, but this is not recommended outside controlled workflows.\n",
+        "\n",
+        "To demonstrate, let's rerun our custom test with some override scenarios."
+      ],
+      "id": "67240344"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Override test result logging\n",
+        "\n",
+        "First, let's rerun our custom test with detection set to `all` while including the `unsafe=True` override flag, which will send the test results but not the test descriptions to the ValidMind Platform:"
+      ],
+      "id": "be0510b9"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "print(\"\\n=== Mode: all & unsafe=True ===\")\n",
+        "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"all\"\n",
+        "\n",
+        "# Run test and tag result with unique ID `override_results`\n",
+        "try:\n",
+        "    result = run_test(\"pii_demo.PIIDetection:override_results\")\n",
+        "\n",
+        "    # Check if the test description was generated by LLM\n",
+        "    if not result._was_description_generated:\n",
+        "        print(\"PII detected: LLM-generated test description skipped\")\n",
+        "    else:\n",
+        "        print(\"No PII detected or detection disabled: Test description generated by LLM\")\n",
+        "\n",
+        "    # Try logging test results to the ValidMind Platform\n",
+        "    result.log(unsafe=True)\n",
+        "    print(\"No PII detected, detection disabled, or override set: Test results logged to the ValidMind Platform\")\n",
+        "except Exception as e:\n",
+        "    print(\"PII detected: Test results not logged to the ValidMind Platform\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0387be21"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Override test descriptions and test result logging\n",
+        "\n",
+        "To send both the test descriptions and test results via override, set the `VALIDMIND_PII_DETECTION` environment variable to `test_results` while including the override flag:"
+      ],
+      "id": "4e65af32"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "print(\"\\n=== Mode: test_results & unsafe=True ===\")\n",
+        "os.environ[\"VALIDMIND_PII_DETECTION\"] = \"test_results\"\n",
+        "\n",
+        "# Run test and tag result with unique ID `override_both`\n",
+        "try:\n",
+        "    result = run_test(\"pii_demo.PIIDetection:override_both\")\n",
+        "\n",
+        "    # Check if the test description was generated by LLM\n",
+        "    if not result._was_description_generated:\n",
+        "        print(\"PII detected: LLM-generated test description skipped\")\n",
+        "    else:\n",
+        "        print(\"No PII detected, detection disabled, or override set: Test description generated by LLM\")\n",
+        "\n",
+        "    # Try logging test results to the ValidMind Platform\n",
+        "    result.log(unsafe=True)\n",
+        "    print(\"No PII detected, detection disabled, or override set: Test results logged to the ValidMind Platform\")\n",
+        "except Exception as e:\n",
+        "    print(\"PII detected: Test results not logged to the ValidMind Platform\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "b40a2670"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Review logged test results\n",
+        "\n",
+        "Now let's take a look at the results that were logged to the ValidMind Platform:\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier.\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "3. Click on any section heading to expand that section to add a new test-driven block. (**Learn more:** [Work with test results](https://docs.validmind.ai/guide/documentation/work-with-test-results.html))\n",
+        "\n",
+        "4. Under TEST-DRIVEN in the sidebar, click **Custom**.\n",
+        "\n",
+        "5. Confirm that you're able to insert the following logged results:\n",
+        "\n",
+        "    - `pii_demo.PIIDetection:disabled`\n",
+        "    - `pii_demo.PIIDetection:desc_blocked`\n",
+        "    - `pii_demo.PIIDetection:override_results`\n",
+        "    - `pii_demo.PIIDetection:override_both`"
+      ],
+      "id": "84d6ed78"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Troubleshooting\n",
+        "\n",
+        "- [x] If you see warnings that Presidio or Presidio analyzer is unavailable, ensure you installed extras: `validmind[pii-detection]`.\n",
+        "- [x] Ensure your environment is restarted after installing new packages if imports fail."
+      ],
+      "id": "faaa950f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Learn more\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ],
+      "id": "59c93159"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you'll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ],
+      "id": "8eba96a6"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "dffb39a5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ],
+      "id": "dbce28c3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade command for changes to be applied."
+      ],
+      "id": "6225eab3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-0bc871eca4814e78b16e692e1f2b3209"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "Python 3",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}
\ No newline at end of file
diff --git a/site/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.ipynb b/site/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.ipynb
index 472d7e59d1..6a4b81ba2d 100644
--- a/site/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.ipynb
+++ b/site/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.ipynb
@@ -1,576 +1,586 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Run tests with multiple datasets\n",
-    "\n",
-    "To support running tests that require more than one dataset, ValidMind provides a mechanim that allows you to pass multiple datasets as inputs.\n",
-    "\n",
-    "<!--- TO DO Check that this explanation is accurate --->\n",
-    "To ensure a model generalizes well to new, unseen data, it's common to use separate datasets for training, validation, and testing, with each set serving to check the model's performance at different stages of development. Additionally, since models often encounter data from various sources that might differ in distribution, quality, or type, using multiple datasets in testing can simulate this diversity and better prepare the model for deployment.\n",
-    "\n",
-    "This interactive notebook includes the code required to load the demo dataset, preprocess the raw dataset and train a model for testing, initialize ValidMind objects, and run a test that requires multiple datasets."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_3__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "- [Prepocess the raw dataset](#toc4__)    \n",
-    "- [Train models for testing](#toc5__)    \n",
-    "- [Initialize ValidMind objects](#toc6__)    \n",
-    "  - [Initialize the ValidMind model](#toc6_1__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc6_2__)    \n",
-    "- [Run a test that requires multiple datasets](#toc7__)    \n",
-    "  - [Run predictions and link with the model](#toc7_1__)    \n",
-    "  - [Run test](#toc7_2__)    \n",
-    "- [Next steps](#toc8__)    \n",
-    "  - [Work with your model documentation](#toc8_1__)    \n",
-    "  - [Discover more learning resources](#toc8_2__)    \n",
-    "- [Upgrade ValidMind](#toc9__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library. To be able to use it, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the sample dataset from the library\n",
-    "\n",
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = demo_dataset.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Prepocess the raw dataset\n",
-    "\n",
-    "Preprocessing performs a number of operations to get ready for the subsequent steps:\n",
-    "\n",
-    "- Preprocess the data: Splits the DataFrame (`df`) into multiple datasets (`train_df`, `validation_df`, and `test_df`) using `demo_dataset.preprocess` to simplify preprocessing.\n",
-    "- Separate features and targets: Drops the target column to create feature sets (`x_train`, `x_val`) and target sets (`y_train`, `y_val`)."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df, validation_df, test_df = demo_dataset.preprocess(raw_df)\n",
-    "x_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_train = train_df[demo_dataset.target_column]\n",
-    "x_val = validation_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_val = validation_df[demo_dataset.target_column]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Train models for testing\n",
-    "\n",
-    "Initialize XGBoost and Logistic Regression Classifiers"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.linear_model import LogisticRegression\n",
-    "import xgboost\n",
-    "\n",
-    "%matplotlib inline\n",
-    "\n",
-    "xgb = xgboost.XGBClassifier(early_stopping_rounds=10)\n",
-    "xgb.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "xgb.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    "    eval_set=[(x_val, y_val)],\n",
-    "    verbose=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Initialize ValidMind objects\n",
-    "\n",
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind model"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_model_xgb = vm.init_model(\n",
-    "    xgb,\n",
-    "    input_id=\"xgb\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset` — the raw dataset that you want to provide as input to tests\n",
-    "- `input_id` - a unique identifier that allows tracking what inputs are used when running each individual test\n",
-    "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
-    "- `class_labels` — an optional value to map predicted classes to class labels\n",
-    "\n",
-    "With all datasets ready, you can now initialize the raw, training and test datasets (`raw_df`, `train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=demo_dataset.target_column,\n",
-    ")\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset\", dataset=test_df, target_column=demo_dataset.target_column\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Run a test that requires multiple datasets\n",
-    "\n",
-    "We are going to show the following in next two blocks:\n",
-    "\n",
-    "- Assign predictions for `vm_train_ds` and `vm_test_ds`\n",
-    "- Run `RobustnessDiagnosis` which is one example test that takes two input datasets"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Run predictions and link with the model"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(model=vm_model_xgb)\n",
-    "vm_test_ds.assign_predictions(model=vm_model_xgb)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_2__'></a>\n",
-    "\n",
-    "### Run test"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.RobustnessDiagnosis\",\n",
-    "    inputs={\"datasets\": (vm_train_ds, vm_test_ds), \"model\": vm_model_xgb},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc8_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc8_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-72af338f140e4a4bad5cb3954201d23e",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "colab": {
-   "provenance": []
-  },
-  "gpuClass": "standard",
-  "kernelspec": {
-   "display_name": ".venv",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.8.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 0
-}
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Run tests with multiple datasets\n",
+        "\n",
+        "To support running tests that require more than one dataset, ValidMind provides a mechanism that allows you to pass multiple datasets as inputs.\n",
+        "\n",
+        "<!--- TO DO Check that this explanation is accurate --->\n",
+        "To ensure a model generalizes well to new, unseen data, it's common to use separate datasets for training, validation, and testing, with each set serving to check the model's performance at different stages of development. Additionally, since models often encounter data from various sources that might differ in distribution, quality, or type, using multiple datasets in testing can simulate this diversity and better prepare the model for deployment.\n",
+        "\n",
+        "This interactive notebook includes the code required to load the demo dataset, preprocess the raw dataset and train a model for testing, initialize ValidMind objects, and run a test that requires multiple datasets."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_3__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "- [Prepocess the raw dataset](#toc4__)    \n",
+        "- [Train models for testing](#toc5__)    \n",
+        "- [Initialize ValidMind objects](#toc6__)    \n",
+        "  - [Initialize the ValidMind model](#toc6_1__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc6_2__)    \n",
+        "- [Run a test that requires multiple datasets](#toc7__)    \n",
+        "  - [Run predictions and link with the model](#toc7_1__)    \n",
+        "  - [Run test](#toc7_2__)    \n",
+        "- [Next steps](#toc8__)    \n",
+        "  - [Work with your model documentation](#toc8_1__)    \n",
+        "  - [Discover more learning resources](#toc8_2__)    \n",
+        "- [Upgrade ValidMind](#toc9__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind Library. To be able to use it, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Import the sample dataset from the library\n",
+        "\n",
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = demo_dataset.load_data()\n",
+        "raw_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Preprocess the raw dataset\n",
+        "\n",
+        "Preprocessing performs a number of operations to get ready for the subsequent steps:\n",
+        "\n",
+        "- Preprocess the data: Splits the DataFrame (`raw_df`) into multiple datasets (`train_df`, `validation_df`, and `test_df`) using `demo_dataset.preprocess` to simplify preprocessing.\n",
+        "- Separate features and targets: Drops the target column to create feature sets (`x_train`, `x_val`) and target sets (`y_train`, `y_val`)."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df, validation_df, test_df = demo_dataset.preprocess(raw_df)\n",
+        "x_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_train = train_df[demo_dataset.target_column]\n",
+        "x_val = validation_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_val = validation_df[demo_dataset.target_column]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Train models for testing\n",
+        "\n",
+        "Initialize and train an XGBoost classifier, using the validation set for early stopping:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from sklearn.linear_model import LogisticRegression\n",
+        "import xgboost\n",
+        "\n",
+        "%matplotlib inline\n",
+        "\n",
+        "xgb = xgboost.XGBClassifier(early_stopping_rounds=10)\n",
+        "xgb.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "xgb.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        "    eval_set=[(x_val, y_val)],\n",
+        "    verbose=False,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Initialize ValidMind objects\n",
+        "\n",
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind model"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_model_xgb = vm.init_model(\n",
+        "    xgb,\n",
+        "    input_id=\"xgb\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset` — the raw dataset that you want to provide as input to tests\n",
+        "- `input_id` — a unique identifier that allows tracking what inputs are used when running each individual test\n",
+        "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
+        "- `class_labels` — an optional value to map predicted classes to class labels\n",
+        "\n",
+        "With all datasets ready, you can now initialize the training and test datasets (`train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=demo_dataset.target_column,\n",
+        ")\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset\", dataset=test_df, target_column=demo_dataset.target_column\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Run a test that requires multiple datasets\n",
+        "\n",
+        "We are going to show the following in the next two blocks:\n",
+        "\n",
+        "- Assign predictions for `vm_train_ds` and `vm_test_ds`\n",
+        "- Run `RobustnessDiagnosis` which is one example test that takes two input datasets"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Run predictions and link with the model"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(model=vm_model_xgb)\n",
+        "vm_test_ds.assign_predictions(model=vm_model_xgb)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_2__'></a>\n",
+        "\n",
+        "### Run test"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.RobustnessDiagnosis\",\n",
+        "    inputs={\"datasets\": (vm_train_ds, vm_test_ds), \"model\": vm_model_xgb},\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc8_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc8_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-72af338f140e4a4bad5cb3954201d23e"
+    }
+  ],
+  "metadata": {
+    "colab": {
+      "provenance": []
+    },
+    "gpuClass": "standard",
+    "kernelspec": {
+      "display_name": ".venv",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.8.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 0
+}
\ No newline at end of file
diff --git a/site/notebooks/how_to/tests/run_tests/configure_tests/understand_utilize_rawdata.ipynb b/site/notebooks/how_to/tests/run_tests/configure_tests/understand_utilize_rawdata.ipynb
index 5fe3c360de..e5fb3ead8e 100644
--- a/site/notebooks/how_to/tests/run_tests/configure_tests/understand_utilize_rawdata.ipynb
+++ b/site/notebooks/how_to/tests/run_tests/configure_tests/understand_utilize_rawdata.ipynb
@@ -1,741 +1,742 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "c18ba8a2",
-   "metadata": {},
-   "source": [
-    "# Understand and utilize `RawData` in ValidMind tests\n",
-    "\n",
-    "Test functions in ValidMind can return a special object called *`RawData`*, which holds intermediate or unprocessed data produced somewhere in the test logic but not returned as part of the test's visible output, such as in tables or figures.\n",
-    "\n",
-    "- The `RawData` feature allows you to customize the output of tests, making it a powerful tool for creating custom tests and post-processing functions.\n",
-    "- `RawData` is useful when running post-processing functions with tests to recompute tabular outputs, redraw figures, or even create new outputs entirely.\n",
-    "\n",
-    "In this notebook, you'll learn how to access, inspect, and utilize `RawData` from ValidMind tests."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5b5b248c",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Setup](#toc1_)    \n",
-    "  - [Installation and intialization](#toc1_1_)    \n",
-    "  - [Load the sample dataset](#toc1_2_)    \n",
-    "  - [Initialize the ValidMind objects](#toc1_3_)    \n",
-    "- [`RawData` usage examples](#toc2_)    \n",
-    "  - [Using `RawData` from the ROC Curve Test](#toc2_1_)    \n",
-    "  - [Pearson Correlation Matrix](#toc2_2_)    \n",
-    "  - [Precision-Recall Curve](#toc2_3_)    \n",
-    "  - [Using `RawData` in custom tests](#toc2_4_)    \n",
-    "  - [Using `RawData` in comparison tests](#toc2_5_)    \n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "6dd79a98",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_'></a>\n",
-    "\n",
-    "## Setup\n",
-    "\n",
-    "Before we can run our examples, we'll need to set the stage to enable running tests with the ValidMind Library. Since the focus of this notebook is on the `RawData` object, this section will merely summarize the steps instead of going into greater detail. \n",
-    "\n",
-    "\n",
-    "**To learn more about running tests with ValidMind:** [Run tests and test suites](https://docs.validmind.ai/developer/model-testing/testing-overview.html)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5b6d8d15",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_1_'></a>\n",
-    "\n",
-    "### Installation and intialization\n",
-    "\n",
-    "First, let's make sure that the ValidMind Library is installed and ready to go, and our Python environment set up for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "04eb084e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Install the ValidMind Library\n",
-    "%pip install -q validmind\n",
-    "\n",
-    "# Initialize the ValidMind Library\n",
-    "import validmind as vm\n",
-    "\n",
-    "# Import the `xgboost` library with an alias\n",
-    "import xgboost as xgb\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5e6aa2cb",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_2_'></a>\n",
-    "\n",
-    "### Load the sample dataset\n",
-    "\n",
-    "Then, we'll import a sample ValidMind dataset and preprocess it:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "50d72eba",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the `customer_churn` sample dataset\n",
-    "from validmind.datasets.classification import customer_churn\n",
-    "raw_df = customer_churn.load_data()\n",
-    "\n",
-    "# Preprocess the raw dataset\n",
-    "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)\n",
-    "\n",
-    "# Separate features and targets\n",
-    "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_train = train_df[customer_churn.target_column]\n",
-    "x_val = validation_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_val = validation_df[customer_churn.target_column]\n",
-    "\n",
-    "# Create an `XGBClassifier` object\n",
-    "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
-    "model.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "\n",
-    "# Train the model using the validation set\n",
-    "model.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    "    eval_set=[(x_val, y_val)],\n",
-    "    verbose=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e3895d35",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3_'></a>\n",
-    "\n",
-    "### Initialize the ValidMind objects"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c0e441f4",
-   "metadata": {},
-   "source": [
-    "Before you can run tests, you'll need to initialize a ValidMind dataset object, as well as a ValidMind model object that can be passed to other functions for analysis and tests on the data:\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b2310bc4",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the dataset object\n",
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=raw_df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    "    class_labels=customer_churn.class_labels,\n",
-    "    __log=False,\n",
-    ")\n",
-    "\n",
-    "# Initialize the datasets into their own dataset objects\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    "    __log=False,\n",
-    ")\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    input_id=\"test_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    "    __log=False,\n",
-    ")\n",
-    "\n",
-    "# Initialize a model object\n",
-    "vm_model = vm.init_model(\n",
-    "    model,\n",
-    "    input_id=\"model\",\n",
-    "    __log=False,\n",
-    ")\n",
-    "\n",
-    "# Assign predictions to the datasets\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "25ec99fc",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_'></a>\n",
-    "\n",
-    "## `RawData` usage examples\n",
-    "\n",
-    "Once you're set up to run tests, you can then try out the following examples:\n",
-    "\n",
-    "  - [Using `RawData` from the ROC Curve Test](#toc2_1_)    \n",
-    "  - [Pearson Correlation Matrix](#toc2_2_)    \n",
-    "  - [Precision-Recall Curve](#toc2_3_)    \n",
-    "  - [Using `RawData` in custom tests](#toc2_4_)  \n",
-    "  - [Using `RawData` in comparison tests](#toc2_5_)  "
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "33d79841",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1_'></a>\n",
-    "\n",
-    "### Using `RawData` from the ROC Curve Test\n",
-    "\n",
-    "In this introductory example, we run the [ROC Curve](https://docs.validmind.ai/tests/model_validation/sklearn/ROCCurve.html) test, inspect its `RawData` output, and then create a custom ROC curve using the raw data values.\n",
-    "\n",
-    "First, let's run the default ROC Curve test for comparsion with later iterations:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "58a3a779",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.tests import run_test\n",
-    "\n",
-    "# Run the ROC Curve test normally\n",
-    "result_roc = run_test(\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve\",\n",
-    "    inputs={\"dataset\": vm_test_ds, \"model\": vm_model},\n",
-    "    generate_description=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "66c44fe0",
-   "metadata": {},
-   "source": [
-    "Now let's assume we want to create a custom version of the above figure. First, let's inspect the raw data that this test produces so we can see what we have to work with.\n",
-    "\n",
-    "`RawData` objects have a `inspect()` method that will pretty print the attributes of the object to be able to quickly see the data and its types:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "513ce01e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Inspect the RawData output from the ROC test\n",
-    "print(\"RawData from ROC Curve Test:\")\n",
-    "result_roc.raw_data.inspect()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "586f3a12",
-   "metadata": {},
-   "source": [
-    "As we can see, the ROC Curve returns a `RawData` object with the following attributes:\n",
-    "- **`fpr`:** A list of false positive rates\n",
-    "- **`tpr`:** A list of true positive rates\n",
-    "- **`auc`:** The area under the curve\n",
-    "\n",
-    "This should be enough to create our own custom ROC curve via a post-processing function without having to create a whole new test from scratch and without having to recompute any of the data:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "613778d2",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import matplotlib.pyplot as plt\n",
-    "\n",
-    "from validmind.vm_models.result import TestResult\n",
-    "\n",
-    "\n",
-    "def custom_roc_curve(result: TestResult):\n",
-    "    # Extract raw data from the test result\n",
-    "    fpr = result.raw_data.fpr\n",
-    "    tpr = result.raw_data.tpr\n",
-    "    auc = result.raw_data.auc\n",
-    "\n",
-    "    # Create a custom ROC curve plot\n",
-    "    fig = plt.figure()\n",
-    "    plt.plot(fpr, tpr, label=f\"Custom ROC (AUC = {auc:.2f})\", color=\"blue\")\n",
-    "    plt.plot([0, 1], [0, 1], linestyle=\"--\", color=\"gray\", label=\"Random Guess\")\n",
-    "    plt.xlabel(\"False Positive Rate\")\n",
-    "    plt.ylabel(\"True Positive Rate\")\n",
-    "    plt.title(\"Custom ROC Curve from RawData\")\n",
-    "    plt.legend()\n",
-    "\n",
-    "    # close the plot to avoid it automatically being shown in the notebook\n",
-    "    plt.close()\n",
-    "\n",
-    "    # remove existing figure\n",
-    "    result.remove_figure(0)\n",
-    "\n",
-    "    # add new figure\n",
-    "    result.add_figure(fig)\n",
-    "\n",
-    "    return result\n",
-    "\n",
-    "# test it on the existing result\n",
-    "modified_result = custom_roc_curve(result_roc)\n",
-    "\n",
-    "# show the modified result\n",
-    "modified_result.show()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "794d026c",
-   "metadata": {},
-   "source": [
-    "Now that we have created a post-processing function and verified that it works on our existing test result, we can use it directly in `run_test()` from now on:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "7c7566f3",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve\",\n",
-    "    inputs={\"dataset\": vm_test_ds, \"model\": vm_model},\n",
-    "    post_process_fn=custom_roc_curve,\n",
-    "    generate_description=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1d0b94aa",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_'></a>\n",
-    "\n",
-    "### Pearson Correlation Matrix\n",
-    "\n",
-    "In this next example, try commenting out the `post_process_fn` argument in the following cell and see what happens between different runs:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "c57fb01b",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import plotly.graph_objects as go\n",
-    "\n",
-    "\n",
-    "def custom_heatmap(result: TestResult):\n",
-    "    corr_matrix = result.raw_data.correlation_matrix\n",
-    "\n",
-    "    heatmap = go.Heatmap(\n",
-    "        z=corr_matrix.values,\n",
-    "        x=list(corr_matrix.columns),\n",
-    "        y=list(corr_matrix.index),\n",
-    "        colorscale=\"Viridis\",\n",
-    "    )\n",
-    "    fig = go.Figure(data=[heatmap])\n",
-    "    fig.update_layout(title=\"Custom Heatmap from RawData\")\n",
-    "\n",
-    "    plt.close()\n",
-    "\n",
-    "    result.remove_figure(0)\n",
-    "    result.add_figure(fig)\n",
-    "\n",
-    "    return result\n",
-    "\n",
-    "\n",
-    "result_corr = run_test(\n",
-    "    \"validmind.data_validation.PearsonCorrelationMatrix\",\n",
-    "    inputs={\"dataset\": vm_test_ds},\n",
-    "    generate_description=False,\n",
-    "    # COMMENT OUT `post_process_fn`\n",
-    "    post_process_fn=custom_heatmap,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0a7cbbc6",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3_'></a>\n",
-    "\n",
-    "### Precision-Recall Curve\n",
-    "\n",
-    "Then, let's try the same thing with the [Precision-Recall Curve](https://docs.validmind.ai/tests/model_validation/sklearn/PrecisionRecallCurve.html) test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d16c5209",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def custom_pr_curve(result: TestResult):\n",
-    "    precision = result.raw_data.precision\n",
-    "    recall = result.raw_data.recall\n",
-    "\n",
-    "    fig = plt.figure()\n",
-    "    plt.plot(recall, precision, label=\"Precision-Recall Curve\")\n",
-    "    plt.xlabel(\"Recall\")\n",
-    "    plt.ylabel(\"Precision\")\n",
-    "    plt.title(\"Custom Precision-Recall Curve from RawData\")\n",
-    "    plt.legend()\n",
-    "\n",
-    "    plt.close()\n",
-    "    result.remove_figure(0)\n",
-    "    result.add_figure(fig)\n",
-    "\n",
-    "    return result\n",
-    "\n",
-    "result_pr = run_test(\n",
-    "    \"validmind.model_validation.sklearn.PrecisionRecallCurve\",\n",
-    "    inputs={\"dataset\": vm_test_ds, \"model\": vm_model},\n",
-    "    generate_description=False,\n",
-    "    # COMMENT OUT `post_process_fn`\n",
-    "    post_process_fn=custom_pr_curve,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e25391a4",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4_'></a>\n",
-    "\n",
-    "### Using `RawData` in custom tests\n",
-    "\n",
-    "These examples demonstrate some very simple ways to use the `RawData` feature of ValidMind tests. The majority of ValidMind-developed tests return some form of raw data that can be used to customize the output of the test, but you can also create your own tests that return `RawData` objects and use them in the same way.\n",
-    "\n",
-    "Let's take a look at how this can be done in custom tests. To start, define and run your custom test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "dc6a389f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "from validmind import test, RawData\n",
-    "from validmind.vm_models import VMDataset, VMModel\n",
-    "\n",
-    "\n",
-    "@test(\"custom.MyCustomTest\")\n",
-    "def MyCustomTest(dataset: VMDataset, model: VMModel) -> tuple[go.Figure, RawData]:\n",
-    "    \"\"\"Custom test that produces a figure and a RawData object\"\"\"\n",
-    "    # pretend we are using the dataset and model to compute some data\n",
-    "    # ...\n",
-    "\n",
-    "    # create some fake data that will be used to generate a figure\n",
-    "    data = pd.DataFrame({\"x\": [10, 20, 30, 40, 50], \"y\": [10, 20, 30, 40, 50]})\n",
-    "\n",
-    "    # create the figure (scatter plot)\n",
-    "    fig = go.Figure(data=go.Scatter(x=data[\"x\"], y=data[\"y\"]))\n",
-    "\n",
-    "    # now let's create a RawData object that holds the \"computed\" data\n",
-    "    raw_data = RawData(scatter_data_df=data)\n",
-    "\n",
-    "    # finally, return both the figure and the raw data\n",
-    "    return fig, raw_data\n",
-    "\n",
-    "\n",
-    "my_result = run_test(\n",
-    "    \"custom.MyCustomTest\",\n",
-    "    inputs={\"dataset\": vm_test_ds, \"model\": vm_model},\n",
-    "    generate_description=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "854c219c",
-   "metadata": {},
-   "source": [
-    "We can see that the test result shows the figure. But since we returned a `RawData` object, we can also inspect the contents and see how we could use it to customize or regenerate the figure in the post-processing function:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "1cb661d1",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "my_result.raw_data.inspect()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "55ad4acd",
-   "metadata": {},
-   "source": [
-    "We can see that we get a nicely-formatted preview of the dataframe we stored in the raw data object. Let's go ahead and use it to re-plot our data:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "c1242083",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def custom_plot(result: TestResult):\n",
-    "    data = result.raw_data.scatter_data_df\n",
-    "\n",
-    "    # use something other than a scatter plot\n",
-    "    fig = go.Figure(data=go.Bar(x=data[\"x\"], y=data[\"y\"]))\n",
-    "    fig.update_layout(title=\"Custom Bar Chart from RawData\")\n",
-    "    fig.update_xaxes(title=\"X Axis\")\n",
-    "    fig.update_yaxes(title=\"Y Axis\")\n",
-    "\n",
-    "    result.remove_figure(0)\n",
-    "    result.add_figure(fig)\n",
-    "\n",
-    "    return result\n",
-    "\n",
-    "result = run_test(\n",
-    "    \"custom.MyCustomTest\",\n",
-    "    inputs={\"dataset\": vm_test_ds, \"model\": vm_model},\n",
-    "    post_process_fn=custom_plot,\n",
-    "    generate_description=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "53084493",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_5_'></a>\n",
-    "\n",
-    "### Using `RawData` in comparison tests\n",
-    "\n",
-    "When running comparison tests, the `RawData` object will contain the raw data for each individual test result as well as the comparison results between the test results. To support this, the RawData object contains the model and dataset input_ids for each of the datasets and models in the test, so that the post-processing function can use them to customize the output. The example below shows how to use the `RawData` object to customize the output of a comparison test and add a table to the test result that shows the confusion matrix for each individual test result as well as the comparison results between the test results.\n",
-    "\n",
-    "When designing post-processing functions that need to handle both individual and comparison test results, you can check the structure of the raw data to determine which case you're dealing with. In the example below, we check if `confusion_matrix` is a list (comparison test with multiple matrices) or a single matrix (individual test). For comparison tests, the function creates two tables: one showing the confusion matrices for each test case, and another showing the percentage drift between them. For individual tests, it creates a single table with the confusion matrix values. This pattern of checking the raw data structure can be applied to other tests to create versatile post-processing functions that work in both scenarios.\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 13,
-   "id": "bcbbe9f4",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def cm_table(result: TestResult):\n",
-    "    # For individual results\n",
-    "    if not isinstance(result.raw_data.confusion_matrix, list):\n",
-    "        # Extract values from single confusion matrix\n",
-    "        cm = result.raw_data.confusion_matrix\n",
-    "        tn, fp = cm[0, 0], cm[0, 1]\n",
-    "        fn, tp = cm[1, 0], cm[1, 1]\n",
-    "        \n",
-    "        # Create DataFrame for individual matrix\n",
-    "        cm_df = pd.DataFrame({\n",
-    "            'TN': [tn],\n",
-    "            'FP': [fp],\n",
-    "            'FN': [fn],\n",
-    "            'TP': [tp]\n",
-    "        })\n",
-    "        \n",
-    "        # Add individual table\n",
-    "        result.add_table(cm_df, title=\"Confusion Matrix\")\n",
-    "        \n",
-    "    # For comparison results\n",
-    "    else:\n",
-    "        cms = result.raw_data.confusion_matrix\n",
-    "        cm1, cm2 = cms[0], cms[1]\n",
-    "        \n",
-    "        # Create individual results table\n",
-    "        rows = []\n",
-    "        for i, cm in enumerate(cms):\n",
-    "            rows.append({\n",
-    "                'dataset': result.raw_data.dataset[i],\n",
-    "                'model': result.raw_data.model[i],\n",
-    "                'TN': cm[0, 0],\n",
-    "                'FP': cm[0, 1],\n",
-    "                'FN': cm[1, 0],\n",
-    "                'TP': cm[1, 1]\n",
-    "            })\n",
-    "        individual_df = pd.DataFrame(rows)\n",
-    "        \n",
-    "        # Calculate percentage differences\n",
-    "        diff_df = pd.DataFrame({\n",
-    "            'TN_drift (%)': [(cm2[0, 0] - cm1[0, 0]) / cm1[0, 0] * 100],\n",
-    "            'FP_drift (%)': [(cm2[0, 1] - cm1[0, 1]) / cm1[0, 1] * 100],\n",
-    "            'FN_drift (%)': [(cm2[1, 0] - cm1[1, 0]) / cm1[1, 0] * 100],\n",
-    "            'TP_drift (%)': [(cm2[1, 1] - cm1[1, 1]) / cm1[1, 1] * 100]\n",
-    "        }).round(2)\n",
-    "        \n",
-    "        # Add both tables\n",
-    "        result.add_table(individual_df, title=\"Individual Confusion Matrices\")\n",
-    "        result.add_table(diff_df, title=\"Confusion Matrix Drift\")\n",
-    "        \n",
-    "    return result"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "41edd959",
-   "metadata": {},
-   "source": [
-    "Let's first run the confusion matrix test on a single dataset-model pair to see how our post-processing function handles individual results:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "cf3c47fe",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.tests import run_test\n",
-    "\n",
-    "result_cm = run_test(\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "        \"model\": vm_model,\n",
-    "    },\n",
-    "    post_process_fn=cm_table,\n",
-    "    generate_description=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a2482c54",
-   "metadata": {},
-   "source": [
-    "Now let's run a comparison test between test and train datasets to see how the function handles multiple results:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "6a1b4388",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result_cm = run_test(\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds, vm_train_ds],\n",
-    "        \"model\": [vm_model]\n",
-    "    },\n",
-    "    post_process_fn=cm_table,\n",
-    "    generate_description=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "9f7d361a",
-   "metadata": {},
-   "source": [
-    "Let's inspect the raw data to see how comparison tests structure their data - notice how the `RawData` object contains not just the confusion matrices for both datasets, but also tracks which dataset and model each result came from:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "012ec495",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result_cm.raw_data.inspect()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-d9a502e868ba4fc1a70056873609b472",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.15"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "id": "c18ba8a2",
+      "metadata": {},
+      "source": [
+        "# Understand and utilize `RawData` in ValidMind tests\n",
+        "\n",
+        "Test functions in ValidMind can return a special object called *`RawData`*, which holds intermediate or unprocessed data produced somewhere in the test logic but not returned as part of the test's visible output, such as in tables or figures.\n",
+        "\n",
+        "- The `RawData` feature allows you to customize the output of tests, making it a powerful tool for creating custom tests and post-processing functions.\n",
+        "- `RawData` is useful when running post-processing functions with tests to recompute tabular outputs, redraw figures, or even create new outputs entirely.\n",
+        "\n",
+        "In this notebook, you'll learn how to access, inspect, and utilize `RawData` from ValidMind tests."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "5b5b248c",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Setup](#toc1_)    \n",
+        "  - [Installation and initialization](#toc1_1_)    \n",
+        "  - [Load the sample dataset](#toc1_2_)    \n",
+        "  - [Initialize the ValidMind objects](#toc1_3_)    \n",
+        "- [`RawData` usage examples](#toc2_)    \n",
+        "  - [Using `RawData` from the ROC Curve Test](#toc2_1_)    \n",
+        "  - [Pearson Correlation Matrix](#toc2_2_)    \n",
+        "  - [Precision-Recall Curve](#toc2_3_)    \n",
+        "  - [Using `RawData` in custom tests](#toc2_4_)    \n",
+        "  - [Using `RawData` in comparison tests](#toc2_5_)    \n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "6dd79a98",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_'></a>\n",
+        "\n",
+        "## Setup\n",
+        "\n",
+        "Before we can run our examples, we'll need to set the stage to enable running tests with the ValidMind Library. Since the focus of this notebook is on the `RawData` object, this section will merely summarize the steps instead of going into greater detail. \n",
+        "\n",
+        "\n",
+        "**To learn more about running tests with ValidMind:** [Run tests and test suites](https://docs.validmind.ai/developer/model-testing/testing-overview.html)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "5b6d8d15",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_1_'></a>\n",
+        "\n",
+        "### Installation and initialization\n",
+        "\n",
+        "First, let's make sure that the ValidMind Library is installed and ready to go, and that our Python environment is set up for data analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "04eb084e",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Install the ValidMind Library\n",
+        "%pip install -q validmind\n",
+        "\n",
+        "# Initialize the ValidMind Library\n",
+        "import validmind as vm\n",
+        "\n",
+        "# Import the `xgboost` library with an alias\n",
+        "import xgboost as xgb\n"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "5e6aa2cb",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_2_'></a>\n",
+        "\n",
+        "### Load the sample dataset\n",
+        "\n",
+        "Then, we'll import a sample ValidMind dataset and preprocess it:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "50d72eba",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Import the `customer_churn` sample dataset\n",
+        "from validmind.datasets.classification import customer_churn\n",
+        "raw_df = customer_churn.load_data()\n",
+        "\n",
+        "# Preprocess the raw dataset\n",
+        "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)\n",
+        "\n",
+        "# Separate features and targets\n",
+        "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_train = train_df[customer_churn.target_column]\n",
+        "x_val = validation_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_val = validation_df[customer_churn.target_column]\n",
+        "\n",
+        "# Create an `XGBClassifier` object\n",
+        "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
+        "model.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "\n",
+        "# Train the model on the training set, using the validation set for evaluation\n",
+        "model.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        "    eval_set=[(x_val, y_val)],\n",
+        "    verbose=False,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "e3895d35",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3_'></a>\n",
+        "\n",
+        "### Initialize the ValidMind objects"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "c0e441f4",
+      "metadata": {},
+      "source": [
+        "Before you can run tests, you'll need to initialize a ValidMind dataset object, as well as a ValidMind model object that can be passed to other functions for analysis and tests on the data:\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "b2310bc4",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the dataset object\n",
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=raw_df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        "    class_labels=customer_churn.class_labels,\n",
+        "    __log=False,\n",
+        ")\n",
+        "\n",
+        "# Initialize the datasets into their own ValidMind dataset objects\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        "    __log=False,\n",
+        ")\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    input_id=\"test_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        "    __log=False,\n",
+        ")\n",
+        "\n",
+        "# Initialize the ValidMind model object wrapper so that it can be passed as input to tests or test suites\n",
+        "# ValidMind model objects can be any type of record you want to test, document, validate, or monitor\n",
+        "vm_model = vm.init_model(\n",
+        "    model,\n",
+        "    input_id=\"model\",\n",
+        "    __log=False,\n",
+        ")\n",
+        "\n",
+        "# Assign predictions to the datasets\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "25ec99fc",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_'></a>\n",
+        "\n",
+        "## `RawData` usage examples\n",
+        "\n",
+        "Once you're set up to run tests, you can then try out the following examples:\n",
+        "\n",
+        "  - [Using `RawData` from the ROC Curve Test](#toc2_1_)    \n",
+        "  - [Pearson Correlation Matrix](#toc2_2_)    \n",
+        "  - [Precision-Recall Curve](#toc2_3_)    \n",
+        "  - [Using `RawData` in custom tests](#toc2_4_)  \n",
+        "  - [Using `RawData` in comparison tests](#toc2_5_)  "
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "33d79841",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1_'></a>\n",
+        "\n",
+        "### Using `RawData` from the ROC Curve Test\n",
+        "\n",
+        "In this introductory example, we run the `model_validation.sklearn.ROCCurve` test, inspect its `RawData` output, and then create a custom ROC curve using the raw data values.\n",
+        "\n",
+        "First, let's run the default ROC Curve test for comparison with later iterations:\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "58a3a779",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from validmind.tests import run_test\n",
+        "\n",
+        "# Run the ROC Curve test normally\n",
+        "result_roc = run_test(\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve\",\n",
+        "    inputs={\"dataset\": vm_test_ds, \"model\": vm_model},\n",
+        "    generate_description=False,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "66c44fe0",
+      "metadata": {},
+      "source": [
+        "Now let's assume we want to create a custom version of the above figure. First, let's inspect the raw data that this test produces so we can see what we have to work with.\n",
+        "\n",
+        "`RawData` objects have an `inspect()` method that pretty-prints the attributes of the object so you can quickly see the data and its types:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "513ce01e",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Inspect the RawData output from the ROC test\n",
+        "print(\"RawData from ROC Curve Test:\")\n",
+        "result_roc.raw_data.inspect()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "586f3a12",
+      "metadata": {},
+      "source": [
+        "As we can see, the ROC Curve test returns a `RawData` object with the following attributes:\n",
+        "- **`fpr`:** A list of false positive rates\n",
+        "- **`tpr`:** A list of true positive rates\n",
+        "- **`auc`:** The area under the curve\n",
+        "\n",
+        "This should be enough to create our own custom ROC curve via a post-processing function without having to create a whole new test from scratch and without having to recompute any of the data:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "613778d2",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import matplotlib.pyplot as plt\n",
+        "\n",
+        "from validmind.vm_models.result import TestResult\n",
+        "\n",
+        "\n",
+        "def custom_roc_curve(result: TestResult):\n",
+        "    # Extract raw data from the test result\n",
+        "    fpr = result.raw_data.fpr\n",
+        "    tpr = result.raw_data.tpr\n",
+        "    auc = result.raw_data.auc\n",
+        "\n",
+        "    # Create a custom ROC curve plot\n",
+        "    fig = plt.figure()\n",
+        "    plt.plot(fpr, tpr, label=f\"Custom ROC (AUC = {auc:.2f})\", color=\"blue\")\n",
+        "    plt.plot([0, 1], [0, 1], linestyle=\"--\", color=\"gray\", label=\"Random Guess\")\n",
+        "    plt.xlabel(\"False Positive Rate\")\n",
+        "    plt.ylabel(\"True Positive Rate\")\n",
+        "    plt.title(\"Custom ROC Curve from RawData\")\n",
+        "    plt.legend()\n",
+        "\n",
+        "    # close the plot to avoid it automatically being shown in the notebook\n",
+        "    plt.close()\n",
+        "\n",
+        "    # remove existing figure\n",
+        "    result.remove_figure(0)\n",
+        "\n",
+        "    # add new figure\n",
+        "    result.add_figure(fig)\n",
+        "\n",
+        "    return result\n",
+        "\n",
+        "# test it on the existing result\n",
+        "modified_result = custom_roc_curve(result_roc)\n",
+        "\n",
+        "# show the modified result\n",
+        "modified_result.show()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "794d026c",
+      "metadata": {},
+      "source": [
+        "Now that we have created a post-processing function and verified that it works on our existing test result, we can use it directly in `run_test()` from now on:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "7c7566f3",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "result = run_test(\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve\",\n",
+        "    inputs={\"dataset\": vm_test_ds, \"model\": vm_model},\n",
+        "    post_process_fn=custom_roc_curve,\n",
+        "    generate_description=False,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "1d0b94aa",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_'></a>\n",
+        "\n",
+        "### Pearson Correlation Matrix\n",
+        "\n",
+        "In this next example, try commenting out the `post_process_fn` argument in the following cell and see what happens between different runs:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "c57fb01b",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import plotly.graph_objects as go\n",
+        "\n",
+        "\n",
+        "def custom_heatmap(result: TestResult):\n",
+        "    corr_matrix = result.raw_data.correlation_matrix\n",
+        "\n",
+        "    heatmap = go.Heatmap(\n",
+        "        z=corr_matrix.values,\n",
+        "        x=list(corr_matrix.columns),\n",
+        "        y=list(corr_matrix.index),\n",
+        "        colorscale=\"Viridis\",\n",
+        "    )\n",
+        "    fig = go.Figure(data=[heatmap])\n",
+        "    fig.update_layout(title=\"Custom Heatmap from RawData\")\n",
+        "\n",
+        "    plt.close()\n",
+        "\n",
+        "    result.remove_figure(0)\n",
+        "    result.add_figure(fig)\n",
+        "\n",
+        "    return result\n",
+        "\n",
+        "\n",
+        "result_corr = run_test(\n",
+        "    \"validmind.data_validation.PearsonCorrelationMatrix\",\n",
+        "    inputs={\"dataset\": vm_test_ds},\n",
+        "    generate_description=False,\n",
+        "    # COMMENT OUT `post_process_fn`\n",
+        "    post_process_fn=custom_heatmap,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "0a7cbbc6",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3_'></a>\n",
+        "\n",
+        "### Precision-Recall Curve\n",
+        "\n",
+        "Then, let's try the same thing with the `model_validation.sklearn.PrecisionRecallCurve` test:\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "d16c5209",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "def custom_pr_curve(result: TestResult):\n",
+        "    precision = result.raw_data.precision\n",
+        "    recall = result.raw_data.recall\n",
+        "\n",
+        "    fig = plt.figure()\n",
+        "    plt.plot(recall, precision, label=\"Precision-Recall Curve\")\n",
+        "    plt.xlabel(\"Recall\")\n",
+        "    plt.ylabel(\"Precision\")\n",
+        "    plt.title(\"Custom Precision-Recall Curve from RawData\")\n",
+        "    plt.legend()\n",
+        "\n",
+        "    plt.close()\n",
+        "    result.remove_figure(0)\n",
+        "    result.add_figure(fig)\n",
+        "\n",
+        "    return result\n",
+        "\n",
+        "result_pr = run_test(\n",
+        "    \"validmind.model_validation.sklearn.PrecisionRecallCurve\",\n",
+        "    inputs={\"dataset\": vm_test_ds, \"model\": vm_model},\n",
+        "    generate_description=False,\n",
+        "    # COMMENT OUT `post_process_fn`\n",
+        "    post_process_fn=custom_pr_curve,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "e25391a4",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4_'></a>\n",
+        "\n",
+        "### Using `RawData` in custom tests\n",
+        "\n",
+        "These examples demonstrate some very simple ways to use the `RawData` feature of ValidMind tests. The majority of ValidMind-developed tests return some form of raw data that can be used to customize the output of the test, but you can also create your own tests that return `RawData` objects and use them in the same way.\n",
+        "\n",
+        "Let's take a look at how this can be done in custom tests. To start, define and run your custom test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "dc6a389f",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "from validmind import test, RawData\n",
+        "from validmind.vm_models import VMDataset, VMModel\n",
+        "\n",
+        "\n",
+        "@test(\"custom.MyCustomTest\")\n",
+        "def MyCustomTest(dataset: VMDataset, model: VMModel) -> tuple[go.Figure, RawData]:\n",
+        "    \"\"\"Custom test that produces a figure and a RawData object\"\"\"\n",
+        "    # pretend we are using the dataset and model to compute some data\n",
+        "    # ...\n",
+        "\n",
+        "    # create some fake data that will be used to generate a figure\n",
+        "    data = pd.DataFrame({\"x\": [10, 20, 30, 40, 50], \"y\": [10, 20, 30, 40, 50]})\n",
+        "\n",
+        "    # create the figure (scatter plot)\n",
+        "    fig = go.Figure(data=go.Scatter(x=data[\"x\"], y=data[\"y\"]))\n",
+        "\n",
+        "    # now let's create a RawData object that holds the \"computed\" data\n",
+        "    raw_data = RawData(scatter_data_df=data)\n",
+        "\n",
+        "    # finally, return both the figure and the raw data\n",
+        "    return fig, raw_data\n",
+        "\n",
+        "\n",
+        "my_result = run_test(\n",
+        "    \"custom.MyCustomTest\",\n",
+        "    inputs={\"dataset\": vm_test_ds, \"model\": vm_model},\n",
+        "    generate_description=False,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "854c219c",
+      "metadata": {},
+      "source": [
+        "We can see that the test result shows the figure. But since we returned a `RawData` object, we can also inspect the contents and see how we could use it to customize or regenerate the figure in the post-processing function:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "1cb661d1",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "my_result.raw_data.inspect()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "55ad4acd",
+      "metadata": {},
+      "source": [
+        "We can see that we get a nicely formatted preview of the dataframe we stored in the raw data object. Let's go ahead and use it to re-plot our data:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "c1242083",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "def custom_plot(result: TestResult):\n",
+        "    data = result.raw_data.scatter_data_df\n",
+        "\n",
+        "    # use something other than a scatter plot\n",
+        "    fig = go.Figure(data=go.Bar(x=data[\"x\"], y=data[\"y\"]))\n",
+        "    fig.update_layout(title=\"Custom Bar Chart from RawData\")\n",
+        "    fig.update_xaxes(title=\"X Axis\")\n",
+        "    fig.update_yaxes(title=\"Y Axis\")\n",
+        "\n",
+        "    result.remove_figure(0)\n",
+        "    result.add_figure(fig)\n",
+        "\n",
+        "    return result\n",
+        "\n",
+        "result = run_test(\n",
+        "    \"custom.MyCustomTest\",\n",
+        "    inputs={\"dataset\": vm_test_ds, \"model\": vm_model},\n",
+        "    post_process_fn=custom_plot,\n",
+        "    generate_description=False,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "53084493",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_5_'></a>\n",
+        "\n",
+        "### Using `RawData` in comparison tests\n",
+        "\n",
+        "When running comparison tests, the `RawData` object will contain the raw data for each individual test result as well as the comparison results between the test results. To support this, the `RawData` object contains the model and dataset `input_id` values for each of the datasets and models in the test, so that the post-processing function can use them to customize the output. The example below shows how to use the `RawData` object to customize the output of a comparison test and add a table to the test result that shows the confusion matrix for each individual test result as well as the comparison results between the test results.\n",
+        "\n",
+        "When designing post-processing functions that need to handle both individual and comparison test results, you can check the structure of the raw data to determine which case you're dealing with. In the example below, we check if `confusion_matrix` is a list (comparison test with multiple matrices) or a single matrix (individual test). For comparison tests, the function creates two tables: one showing the confusion matrices for each test case, and another showing the percentage drift between them. For individual tests, it creates a single table with the confusion matrix values. This pattern of checking the raw data structure can be applied to other tests to create versatile post-processing functions that work in both scenarios.\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": 13,
+      "id": "bcbbe9f4",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "def cm_table(result: TestResult):\n",
+        "    # For individual results\n",
+        "    if not isinstance(result.raw_data.confusion_matrix, list):\n",
+        "        # Extract values from single confusion matrix\n",
+        "        cm = result.raw_data.confusion_matrix\n",
+        "        tn, fp = cm[0, 0], cm[0, 1]\n",
+        "        fn, tp = cm[1, 0], cm[1, 1]\n",
+        "        \n",
+        "        # Create DataFrame for individual matrix\n",
+        "        cm_df = pd.DataFrame({\n",
+        "            'TN': [tn],\n",
+        "            'FP': [fp],\n",
+        "            'FN': [fn],\n",
+        "            'TP': [tp]\n",
+        "        })\n",
+        "        \n",
+        "        # Add individual table\n",
+        "        result.add_table(cm_df, title=\"Confusion Matrix\")\n",
+        "        \n",
+        "    # For comparison results\n",
+        "    else:\n",
+        "        cms = result.raw_data.confusion_matrix\n",
+        "        cm1, cm2 = cms[0], cms[1]\n",
+        "        \n",
+        "        # Create individual results table\n",
+        "        rows = []\n",
+        "        for i, cm in enumerate(cms):\n",
+        "            rows.append({\n",
+        "                'dataset': result.raw_data.dataset[i],\n",
+        "                'model': result.raw_data.model[i],\n",
+        "                'TN': cm[0, 0],\n",
+        "                'FP': cm[0, 1],\n",
+        "                'FN': cm[1, 0],\n",
+        "                'TP': cm[1, 1]\n",
+        "            })\n",
+        "        individual_df = pd.DataFrame(rows)\n",
+        "        \n",
+        "        # Calculate percentage differences\n",
+        "        diff_df = pd.DataFrame({\n",
+        "            'TN_drift (%)': [(cm2[0, 0] - cm1[0, 0]) / cm1[0, 0] * 100],\n",
+        "            'FP_drift (%)': [(cm2[0, 1] - cm1[0, 1]) / cm1[0, 1] * 100],\n",
+        "            'FN_drift (%)': [(cm2[1, 0] - cm1[1, 0]) / cm1[1, 0] * 100],\n",
+        "            'TP_drift (%)': [(cm2[1, 1] - cm1[1, 1]) / cm1[1, 1] * 100]\n",
+        "        }).round(2)\n",
+        "        \n",
+        "        # Add both tables\n",
+        "        result.add_table(individual_df, title=\"Individual Confusion Matrices\")\n",
+        "        result.add_table(diff_df, title=\"Confusion Matrix Drift\")\n",
+        "        \n",
+        "    return result"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "41edd959",
+      "metadata": {},
+      "source": [
+        "Let's first run the confusion matrix test on a single dataset-model pair to see how our post-processing function handles individual results:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "cf3c47fe",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from validmind.tests import run_test\n",
+        "\n",
+        "result_cm = run_test(\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "        \"model\": vm_model,\n",
+        "    },\n",
+        "    post_process_fn=cm_table,\n",
+        "    generate_description=False,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "a2482c54",
+      "metadata": {},
+      "source": [
+        "Now let's run a comparison test between test and train datasets to see how the function handles multiple results:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "6a1b4388",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "result_cm = run_test(\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds, vm_train_ds],\n",
+        "        \"model\": [vm_model]\n",
+        "    },\n",
+        "    post_process_fn=cm_table,\n",
+        "    generate_description=False,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "9f7d361a",
+      "metadata": {},
+      "source": [
+        "Let's inspect the raw data to see how comparison tests structure their data. Notice how the `RawData` object not only contains the confusion matrices for both datasets, but also tracks which dataset and model each result came from:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "012ec495",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "result_cm.raw_data.inspect()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-d9a502e868ba4fc1a70056873609b472",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.15"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
 }
diff --git a/site/notebooks/how_to/tests/run_tests/documentation_tests/document_multiple_results_for_the_same_test.ipynb b/site/notebooks/how_to/tests/run_tests/documentation_tests/document_multiple_results_for_the_same_test.ipynb
index c7c0aa2cce..fc7446d036 100644
--- a/site/notebooks/how_to/tests/run_tests/documentation_tests/document_multiple_results_for_the_same_test.ipynb
+++ b/site/notebooks/how_to/tests/run_tests/documentation_tests/document_multiple_results_for_the_same_test.ipynb
@@ -1,627 +1,639 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Document multiple results for the same test\n",
-    "\n",
-    "Documentation templates facilitate the presentation of multiple unique test results for a single test. \n",
-    "\n",
-    "Consider various scenarios where you may intend to showcase results of the same test with diverse inputs:\n",
-    "\n",
-    "- **Comparing test results with varied parameter values:** Illustrate model performance by contrasting test results achieved with different parameter values to identify optimal settings.\n",
-    "- **Displaying test results with distinct datasets:** Showcase test versatility by presenting results on diverse datasets, such as providing confusion matrices for both training and test data.\n",
-    "- **Model comparison:** Conduct a comprehensive model evaluation by comparing tests like `ROC curve` and `Accuracy` to discern and select the superior-performing model.\n",
-    "\n",
-    "This interactive notebook guides you through the process of documenting a model with the ValidMind Library. It uses the [Bank Customer Churn Prediction](https://www.kaggle.com/code/kmalit/bank-customer-churn-prediction/data) sample dataset from Kaggle to train a simple classification model. As part of the notebook, you will learn how to render more than one unique test result for the same test while exploring how the documentation process works:\n",
-    "\n",
-    "- Initializing the ValidMind Library\n",
-    "- Loading a sample dataset provided by the library to train a simple classification model\n",
-    "- Running a ValidMind test suite to quickly generate documentation about the data and model"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "- [Update the customer churn demo template](#toc3__)    \n",
-    "- [Initialize the Python environment](#toc4__)    \n",
-    "  - [Preview the documentation template](#toc4_1__)    \n",
-    "- [Load the sample dataset](#toc5__)    \n",
-    "  - [Initialize a ValidMind dataset object](#toc5_1__)    \n",
-    "- [Document the model](#toc6__)    \n",
-    "  - [Prepare datasets](#toc6_1__)    \n",
-    "  - [Initialize the training and test datasets](#toc6_2__)    \n",
-    "  - [Run documentation tests](#toc6_3__)    \n",
-    "  - [Run the individual tests using the `run_test`](#toc6_4__)    \n",
-    "- [Next steps](#toc7__)    \n",
-    "  - [Work with your model documentation](#toc7_1__)    \n",
-    "  - [Discover more learning resources](#toc7_2__)    \n",
-    "- [Upgrade ValidMind](#toc8__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Update the customer churn demo template\n",
-    "\n",
-    "Before you initialize the ValidMind Library by running the notebook, edit the **Binary classification** template to make a copy of a test of interest and update it with different `result_id` fields for each entry:\n",
-    "\n",
-    "- Go to **Settings > Templates** and click on the **Binary classification** template. Let's say we want to show `Skewness` results for `training` and `test` datasets.\n",
-    "\n",
-    "To do this we replace\n",
-    "\n",
-    "```yaml\n",
-    "- content_type: test\n",
-    "  content_id: validmind.data_validation.Skewness\n",
-    "```\n",
-    "\n",
-    "with\n",
-    "\n",
-    "```yaml\n",
-    "- content_type: test\n",
-    "  content_id: validmind.data_validation.Skewness:training_data\n",
-    "- content_type: test\n",
-    "  content_id: validmind.data_validation.Skewness:test_data\n",
-    "```\n",
-    "\n",
-    "This way, we can show two results of the same test in the model document. Here, the `training_data` and `test_data` could be any string. However, they should be unique for the same test.\n",
-    "\n",
-    "- Click on **Prepare new version**, provide some version notes and click on **Save new version** to save a new version of this template.\n",
-    "- Next, we need to swap our model documentation to use this new version of the template. Follow the steps on [Swap documentation templates](https://docs.validmind.ai/guide/model-documentation/swap-documentation-templates.html) to swap the template of our customer churn model.\n",
-    "\n",
-    "In the following sections we provide more context on how these `content_id` fields mentioned earlier get mapped to the actual tests."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "import xgboost as xgb\n",
-    "\n",
-    "from sklearn.metrics import accuracy_score\n",
-    "from sklearn.model_selection import train_test_split\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library, along with a second, different dataset (`taiwan_credit`) you can try as well.\n",
-    "\n",
-    "To be able to use either sample dataset, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the sample dataset from the library\n",
-    "\n",
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "df = demo_dataset.load_data()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Initialize a ValidMind dataset object\n",
-    "\n",
-    "Before you can run a test suite, which are a collection of tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset` — the raw dataset that you want to analyze\n",
-    "- `target_column` — the name of the target column in the dataset\n",
-    "- `class_labels` — the list of class labels used for classification model training"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_dataset = vm.init_dataset(\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    dataset=df,\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    class_labels=demo_dataset.class_labels,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Document the model\n",
-    "\n",
-    "As part of documenting the model with the ValidMind Library, you need to preprocess the raw dataset, initialize some training and test datasets, initialize a model object you can use for testing, and then run the full suite of tests."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Prepare datasets\n",
-    "\n",
-    "DataFrame (df) preprocessing is simplified by employing `demo_dataset.preprocess` to partition it into distinct datasets (`train_df`, `validation_df`, and `test_df`)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df, validation_df, test_df = demo_dataset.preprocess(df)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Initialize the training and test datasets\n",
-    "\n",
-    "With the datasets ready, you can now initialize the training and test datasets (`train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset\", dataset=train_df, target_column=demo_dataset.target_column\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset\", dataset=test_df, target_column=demo_dataset.target_column\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3__'></a>\n",
-    "\n",
-    "### Run documentation tests\n",
-    "\n",
-    "Now specify `inputs` and `params` for individual tests using `config` parameter. The results for the both the datasets will be visible in the documentation. The `inputs` in the config get priority over global `inputs` in the `run_documentation_tests`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "config = {\n",
-    "    \"validmind.data_validation.Skewness:training_data\": {\n",
-    "        \"params\": {\"max_threshold\": 1},\n",
-    "        \"inputs\": {\"dataset\": vm_train_ds},\n",
-    "    },\n",
-    "    \"validmind.data_validation.Skewness:test_data\": {\n",
-    "        \"params\": {\"max_threshold\": 1.5},\n",
-    "        \"inputs\": {\"dataset\": vm_test_ds},\n",
-    "    },\n",
-    "}\n",
-    "\n",
-    "tests_suite = vm.run_documentation_tests(\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_dataset,\n",
-    "    },\n",
-    "    config=config,\n",
-    "    section=[\"data_preparation\"],\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4__'></a>\n",
-    "\n",
-    "### Run the individual tests using the `run_test`\n",
-    "\n",
-    "Now run the `Skewness` tests for training and test datasets. The results for the both the datasets will be visible in the documentation."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.Skewness:training_data\",\n",
-    "    params={\"max_threshold\": 1},\n",
-    "    inputs={\"dataset\": vm_train_ds},\n",
-    ")\n",
-    "test.log()\n",
-    "\n",
-    "test = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.Skewness:test_data\",\n",
-    "    params={\"max_threshold\": 1.5},\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "3. Expand the **2. Data Preparation** section and take a look around.\n",
-    "\n",
-    "   You can now see the skewness tests results of training and test datasets in the `Data Preparation` section.\n",
-    "\n",
-    "From here, you can also make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc7_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-6ce412276b6244aab16b2e3443c6a861",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "colab": {
-   "provenance": []
-  },
-  "gpuClass": "standard",
-  "kernelspec": {
-   "display_name": "validmind-1QuffXMV-py3.9",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.8.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 0
-}
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Document multiple results for the same test\n",
+        "\n",
+        "Documentation templates facilitate the presentation of multiple unique test results for a single test. \n",
+        "\n",
+        "Consider various scenarios where you may intend to showcase results of the same test with diverse inputs:\n",
+        "\n",
+        "- **Comparing test results with varied parameter values:** Illustrate model performance by contrasting test results achieved with different parameter values to identify optimal settings.\n",
+        "- **Displaying test results with distinct datasets:** Showcase test versatility by presenting results on diverse datasets, such as providing confusion matrices for both training and test data.\n",
+        "- **Model comparison:** Conduct a comprehensive model evaluation by comparing tests like `ROC curve` and `Accuracy` to discern and select the superior-performing model.\n",
+        "\n",
+        "This interactive notebook guides you through the process of documenting a model with the ValidMind Library. It uses the [Bank Customer Churn Prediction](https://www.kaggle.com/code/kmalit/bank-customer-churn-prediction/data) sample dataset from Kaggle to train a simple classification model. As part of the notebook, you will learn how to render more than one unique test result for the same test while exploring how the documentation process works:\n",
+        "\n",
+        "- Initializing the ValidMind Library\n",
+        "- Loading a sample dataset provided by the library to train a simple classification model\n",
+        "- Running a ValidMind test suite to quickly generate documentation about the data and model"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "- [Update the customer churn demo template](#toc3__)    \n",
+        "- [Initialize the Python environment](#toc4__)    \n",
+        "  - [Preview the documentation template](#toc4_1__)    \n",
+        "- [Load the sample dataset](#toc5__)    \n",
+        "  - [Initialize a ValidMind dataset object](#toc5_1__)    \n",
+        "- [Document the model](#toc6__)    \n",
+        "  - [Prepare datasets](#toc6_1__)    \n",
+        "  - [Initialize the training and test datasets](#toc6_2__)    \n",
+        "  - [Run documentation tests](#toc6_3__)    \n",
+        "  - [Run the individual tests using the `run_test`](#toc6_4__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Work with your model documentation](#toc7_1__)    \n",
+        "  - [Discover more learning resources](#toc7_2__)    \n",
+        "- [Upgrade ValidMind](#toc8__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Update the customer churn demo template\n",
+        "\n",
+        "Before you initialize the ValidMind Library by running the notebook, edit the **Binary classification** template to make a copy of a test of interest and update it with different `result_id` fields for each entry:\n",
+        "\n",
+        "- Go to **Settings > Templates** and click on the **Binary classification** template. Let's say we want to show `Skewness` results for `training` and `test` datasets.\n",
+        "\n",
+        "To do this we replace\n",
+        "\n",
+        "```yaml\n",
+        "- content_type: test\n",
+        "  content_id: validmind.data_validation.Skewness\n",
+        "```\n",
+        "\n",
+        "with\n",
+        "\n",
+        "```yaml\n",
+        "- content_type: test\n",
+        "  content_id: validmind.data_validation.Skewness:training_data\n",
+        "- content_type: test\n",
+        "  content_id: validmind.data_validation.Skewness:test_data\n",
+        "```\n",
+        "\n",
+        "This way, we can show two results of the same test in the model document. Here, `training_data` and `test_data` can be any strings, as long as each one is unique for the same test.\n",
+        "\n",
+        "- Click on **Prepare new version**, provide some version notes and click on **Save new version** to save a new version of this template.\n",
+        "- Next, we need to swap our model documentation to use this new version of the template. Follow the steps on [Manage document templates](https://docs.validmind.ai/guide/templates/manage-document-templates.html) to swap the template of our customer churn model.\n",
+        "\n",
+        "In the following sections we provide more context on how these `content_id` fields mentioned earlier get mapped to the actual tests."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import pandas as pd\n",
+        "import xgboost as xgb\n",
+        "\n",
+        "from sklearn.metrics import accuracy_score\n",
+        "from sklearn.model_selection import train_test_split\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind library, along with a second, different dataset (`taiwan_credit`) you can try as well.\n",
+        "\n",
+        "To be able to use either sample dataset, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Import the sample dataset from the library\n",
+        "\n",
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "df = demo_dataset.load_data()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Initialize a ValidMind dataset object\n",
+        "\n",
+        "Before you can run a test suite, which is a collection of tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset` — the raw dataset that you want to analyze\n",
+        "- `target_column` — the name of the target column in the dataset\n",
+        "- `class_labels` — the list of class labels used for classification model training"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_dataset = vm.init_dataset(\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    dataset=df,\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    class_labels=demo_dataset.class_labels,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Document the model\n",
+        "\n",
+        "As part of documenting the model with the ValidMind Library, you need to preprocess the raw dataset, initialize some training and test datasets, initialize a model object you can use for testing, and then run the full suite of tests."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Prepare datasets\n",
+        "\n",
+        "DataFrame (df) preprocessing is simplified by employing `demo_dataset.preprocess` to partition it into distinct datasets (`train_df`, `validation_df`, and `test_df`):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df, validation_df, test_df = demo_dataset.preprocess(df)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Initialize the training and test datasets\n",
+        "\n",
+        "With the datasets ready, you can now initialize the training and test datasets (`train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset\", dataset=train_df, target_column=demo_dataset.target_column\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset\", dataset=test_df, target_column=demo_dataset.target_column\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_3__'></a>\n",
+        "\n",
+        "### Run documentation tests\n",
+        "\n",
+        "Now specify `inputs` and `params` for individual tests using the `config` parameter. The results for both datasets will be visible in the documentation. The `inputs` in the config get priority over global `inputs` in the `run_documentation_tests`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "config = {\n",
+        "    \"validmind.data_validation.Skewness:training_data\": {\n",
+        "        \"params\": {\"max_threshold\": 1},\n",
+        "        \"inputs\": {\"dataset\": vm_train_ds},\n",
+        "    },\n",
+        "    \"validmind.data_validation.Skewness:test_data\": {\n",
+        "        \"params\": {\"max_threshold\": 1.5},\n",
+        "        \"inputs\": {\"dataset\": vm_test_ds},\n",
+        "    },\n",
+        "}\n",
+        "\n",
+        "tests_suite = vm.run_documentation_tests(\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_dataset,\n",
+        "    },\n",
+        "    config=config,\n",
+        "    section=[\"data_preparation\"],\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4__'></a>\n",
+        "\n",
+        "### Run the individual tests using the `run_test`\n",
+        "\n",
+        "Now run the `Skewness` tests for training and test datasets. The results for both datasets will be visible in the documentation."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.Skewness:training_data\",\n",
+        "    params={\"max_threshold\": 1},\n",
+        "    inputs={\"dataset\": vm_train_ds},\n",
+        ")\n",
+        "test.log()\n",
+        "\n",
+        "test = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.Skewness:test_data\",\n",
+        "    params={\"max_threshold\": 1.5},\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "3. Expand the **2. Data Preparation** section and take a look around.\n",
+        "\n",
+        "   You can now see the skewness test results for the training and test datasets in the `Data Preparation` section.\n",
+        "\n",
+        "From here, you can also make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc7_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-6ce412276b6244aab16b2e3443c6a861"
+    }
+  ],
+  "metadata": {
+    "colab": {
+      "provenance": []
+    },
+    "gpuClass": "standard",
+    "kernelspec": {
+      "display_name": "validmind-1QuffXMV-py3.9",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.8.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 0
+}
\ No newline at end of file
diff --git a/site/notebooks/how_to/tests/run_tests/documentation_tests/run_documentation_sections.ipynb b/site/notebooks/how_to/tests/run_tests/documentation_tests/run_documentation_sections.ipynb
index 63c8d02a62..42ef742f8e 100644
--- a/site/notebooks/how_to/tests/run_tests/documentation_tests/run_documentation_sections.ipynb
+++ b/site/notebooks/how_to/tests/run_tests/documentation_tests/run_documentation_sections.ipynb
@@ -1,595 +1,605 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Run individual documentation sections\n",
-    "\n",
-    "For targeted testing, you can run tests on individual sections or specific groups of sections in your model documentation.\n",
-    "\n",
-    "As a model developer, running individual documentation sections is useful in various development scenarios. For instance, when updates are made to a model, often only certain parts of the documentation require revision. The `run_documentation_tests()` function allows you to directly test only these affected sections, thus saving you time and ensuring that the documentation accurately reflects the latest changes.\n",
-    "\n",
-    "This interactive notebook includes the code required to load the demo dataset, preprocess the raw dataset, train a model for testing, initialize ValidMind objects, and run the data preparation, model development, and multiple documentation sections."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_3__)    \n",
-    "- [Load the Demo Dataset](#toc3__)    \n",
-    "  - [Prepocess the raw dataset](#toc3_1__)    \n",
-    "- [Train a model for testing](#toc4__)    \n",
-    "- [Initialize ValidMind objects](#toc5__)    \n",
-    "  - [Assign predictions to the datasets](#toc5_1__)    \n",
-    "- [Run the data preparation section](#toc6__)    \n",
-    "- [Run the model development section](#toc7__)    \n",
-    "- [Run multiple model documentation sections](#toc8__)    \n",
-    "- [Next steps](#toc9__)    \n",
-    "  - [Work with your model documentation](#toc9_1__)    \n",
-    "  - [Discover more learning resources](#toc9_2__)    \n",
-    "- [Upgrade ValidMind](#toc10__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%matplotlib inline\n",
-    "\n",
-    "import xgboost as xgb"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the Demo Dataset"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# You can also import taiwan_credit like this:\n",
-    "# from validmind.datasets.classification import taiwan_credit as demo_dataset\n",
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "df = demo_dataset.load_data()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Prepocess the raw dataset"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df, validation_df, test_df = demo_dataset.preprocess(df)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Train a model for testing\n",
-    "\n",
-    "We train a simple customer churn model for our test."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "x_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_train = train_df[demo_dataset.target_column]\n",
-    "x_val = validation_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_val = validation_df[demo_dataset.target_column]\n",
-    "\n",
-    "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
-    "model.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "model.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    "    eval_set=[(x_val, y_val)],\n",
-    "    verbose=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Initialize ValidMind objects\n",
-    "\n",
-    "We initize the objects required to run test suites using the ValidMind Library."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_dataset = vm.init_dataset(\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    dataset=df,\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    class_labels=demo_dataset.class_labels,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset\",\n",
-    "    dataset=train_df,\n",
-    "    type=\"generic\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset\",\n",
-    "    dataset=test_df,\n",
-    "    type=\"generic\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_model = vm.init_model(model, input_id=\"model\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Assign predictions to the datasets\n",
-    "\n",
-    "We can now use the `assign_predictions()` method from the `Dataset` object to link existing predictions to any model. If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Run the data preparation section\n",
-    "\n",
-    "In this section, we focus on running the tests within the data preparation section of the model documentation. After running this function, only the tests associated with this section will be executed, and the corresponding section in the model documentation will be updated."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "results = vm.run_documentation_tests(\n",
-    "    section=\"data_preparation\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_dataset,\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Run the model development section\n",
-    "\n",
-    "In this section, we focus on running the tests within the model development section of the model documentation. After running this function, only the tests associated with this section will be executed, and the corresponding section in the model documentation will be updated."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "results = vm.run_documentation_tests(\n",
-    "    section=\"model_development\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_train_ds,\n",
-    "        \"model\": vm_model,\n",
-    "        \"datasets\": (vm_train_ds, vm_test_ds),\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Run multiple model documentation sections\n",
-    "\n",
-    "This section demonstrates how you can execute both the data preparation and model development sections using `run_documentation_tests()`. After running this function, the tests associated with both sections will be executed, and their corresponding model documentation sections updated."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "results = vm.run_documentation_tests(\n",
-    "    section=[\"model_development\", \"model_diagnosis\"],\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "        \"model\": vm_model,\n",
-    "        \"datasets\": (vm_train_ds, vm_test_ds),\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc9_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc9_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc10__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-f4756a1f66ab49598b696ed86685fcc6",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": ".venv",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.8.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Run individual documentation sections\n",
+        "\n",
+        "For targeted testing, you can run tests on individual sections or specific groups of sections in your model documentation.\n",
+        "\n",
+        "As a model developer, running individual documentation sections is useful in various development scenarios. For instance, when updates are made to a model, often only certain parts of the documentation require revision. The `run_documentation_tests()` function allows you to directly test only these affected sections, thus saving you time and ensuring that the documentation accurately reflects the latest changes.\n",
+        "\n",
+        "This interactive notebook includes the code required to load the demo dataset, preprocess the raw dataset, train a model for testing, initialize ValidMind objects, and run the data preparation, model development, and multiple documentation sections."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_3__)    \n",
+        "- [Load the Demo Dataset](#toc3__)    \n",
+        "  - [Preprocess the raw dataset](#toc3_1__)    \n",
+        "- [Train a model for testing](#toc4__)    \n",
+        "- [Initialize ValidMind objects](#toc5__)    \n",
+        "  - [Assign predictions to the datasets](#toc5_1__)    \n",
+        "- [Run the data preparation section](#toc6__)    \n",
+        "- [Run the model development section](#toc7__)    \n",
+        "- [Run multiple model documentation sections](#toc8__)    \n",
+        "- [Next steps](#toc9__)    \n",
+        "  - [Work with your model documentation](#toc9_1__)    \n",
+        "  - [Discover more learning resources](#toc9_2__)    \n",
+        "- [Upgrade ValidMind](#toc10__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br><br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%matplotlib inline\n",
+        "\n",
+        "import xgboost as xgb"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the Demo Dataset"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# You can also import taiwan_credit like this:\n",
+        "# from validmind.datasets.classification import taiwan_credit as demo_dataset\n",
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "df = demo_dataset.load_data()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Preprocess the raw dataset"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df, validation_df, test_df = demo_dataset.preprocess(df)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Train a model for testing\n",
+        "\n",
+        "We train a simple customer churn model for our test."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "x_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_train = train_df[demo_dataset.target_column]\n",
+        "x_val = validation_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_val = validation_df[demo_dataset.target_column]\n",
+        "\n",
+        "model = xgb.XGBClassifier(early_stopping_rounds=10)\n",
+        "model.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "model.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        "    eval_set=[(x_val, y_val)],\n",
+        "    verbose=False,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Initialize ValidMind objects\n",
+        "\n",
+        "We initialize the objects required to run test suites using the ValidMind Library."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_dataset = vm.init_dataset(\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    dataset=df,\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    class_labels=demo_dataset.class_labels,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset\",\n",
+        "    dataset=train_df,\n",
+        "    type=\"generic\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset\",\n",
+        "    dataset=test_df,\n",
+        "    type=\"generic\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_model = vm.init_model(model, input_id=\"model\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Assign predictions to the datasets\n",
+        "\n",
+        "We can now use the `assign_predictions()` method from the `Dataset` object to link existing predictions to any model. If no prediction values are passed, the method will compute predictions automatically:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Run the data preparation section\n",
+        "\n",
+        "In this section, we focus on running the tests within the data preparation section of the model documentation. After running this function, only the tests associated with this section will be executed, and the corresponding section in the model documentation will be updated."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "results = vm.run_documentation_tests(\n",
+        "    section=\"data_preparation\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_dataset,\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Run the model development section\n",
+        "\n",
+        "In this section, we focus on running the tests within the model development section of the model documentation. After running this function, only the tests associated with this section will be executed, and the corresponding section in the model documentation will be updated."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "results = vm.run_documentation_tests(\n",
+        "    section=\"model_development\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_train_ds,\n",
+        "        \"model\": vm_model,\n",
+        "        \"datasets\": (vm_train_ds, vm_test_ds),\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Run multiple model documentation sections\n",
+        "\n",
+        "This section demonstrates how you can execute both the model development and model diagnosis sections using `run_documentation_tests()`. After running this function, the tests associated with both sections will be executed, and their corresponding model documentation sections updated."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "results = vm.run_documentation_tests(\n",
+        "    section=[\"model_development\", \"model_diagnosis\"],\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "        \"model\": vm_model,\n",
+        "        \"datasets\": (vm_train_ds, vm_test_ds),\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc9_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc9_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc10__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-f4756a1f66ab49598b696ed86685fcc6"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": ".venv",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.8.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
+}
\ No newline at end of file
diff --git a/site/notebooks/how_to/tests/run_tests/documentation_tests/run_documentation_tests_with_config.ipynb b/site/notebooks/how_to/tests/run_tests/documentation_tests/run_documentation_tests_with_config.ipynb
index d74a3773f7..48a3e439d8 100644
--- a/site/notebooks/how_to/tests/run_tests/documentation_tests/run_documentation_tests_with_config.ipynb
+++ b/site/notebooks/how_to/tests/run_tests/documentation_tests/run_documentation_tests_with_config.ipynb
@@ -1,724 +1,738 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Run documentation tests with custom configurations\n",
-    "\n",
-    "When running documentation tests, you can configure inputs and parameters for individual tests by passing a config as a parameter.\n",
-    "\n",
-    "As a model developer, configuring individual tests is useful in various models development scenarios. For instance, based on a use case, a model might require changing inputs and/or parameters for certain tests. The `run_documentation_tests()` function allows you to directly configure tests through `config`, thus giving you flexibility to run tests according to your use case.\n",
-    "\n",
-    "This interactive notebook includes the code required to load the demo dataset, preprocess the raw dataset, train a model for testing, initialize ValidMind objects, and run documentation tests with custom configurations."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_3__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "- [Document the model](#toc4__)    \n",
-    "- [Prepocess the raw dataset](#toc5__)    \n",
-    "- [Train a model for testing](#toc6__)    \n",
-    "- [Initialize ValidMind objects](#toc7__)    \n",
-    "  - [Initialize ValidMind model object](#toc7_1__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc7_2__)    \n",
-    "  - [Run predictions through `assign_predictions` interface](#toc7_3__)    \n",
-    "- [Run documentation tests](#toc8__)    \n",
-    "  - [Preview config](#toc8_1__)    \n",
-    "  - [Updating config](#toc8_2__)    \n",
-    "  - [Run documentation tests](#toc8_3__)    \n",
-    "- [Next steps](#toc9__)    \n",
-    "  - [Work with your model documentation](#toc9_1__)    \n",
-    "  - [Discover more learning resources](#toc9_2__)    \n",
-    "- [Upgrade ValidMind](#toc10__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library. To be able to use it, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the sample dataset from the library\n",
-    "\n",
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = demo_dataset.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Document the model\n",
-    "\n",
-    "As part of documenting the model with the ValidMind Library, you need to preprocess the raw dataset, initialize some training and test datasets, initialize a model object you can use for testing, and then run the full suite of tests."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Prepocess the raw dataset\n",
-    "\n",
-    "Preprocessing performs a number of operations to get ready for the subsequent steps:\n",
-    "\n",
-    "- Preprocess the data: Splits the DataFrame (`df`) into multiple datasets (`train_df`, `validation_df`, and `test_df`) using `demo_dataset.preprocess` to simplify preprocessing.\n",
-    "- Separate features and targets: Drops the target column to create feature sets (`x_train`, `x_val`) and target sets (`y_train`, `y_val`).\n",
-    "- Initialize XGBoost classifier: Creates an `XGBClassifier` object with early stopping rounds set to 10.\n",
-    "- Set evaluation metrics: Specifies metrics for model evaluation as \"error,\" \"logloss,\" and \"auc.\"\n",
-    "- Fit the model: Trains the model on `x_train` and `y_train` using the validation set `(x_val, y_val)`. Verbose output is disabled."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df, validation_df, test_df = demo_dataset.preprocess(raw_df)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Train a model for testing\n",
-    "\n",
-    "We train a simple customer churn model for our test."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost\n",
-    "%matplotlib inline\n",
-    "\n",
-    "x_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_train = train_df[demo_dataset.target_column]\n",
-    "x_val = validation_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_val = validation_df[demo_dataset.target_column]\n",
-    "\n",
-    "xgb = xgboost.XGBClassifier(early_stopping_rounds=10)\n",
-    "xgb.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "xgb.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    "    eval_set=[(x_val, y_val)],\n",
-    "    verbose=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Initialize ValidMind objects"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Initialize ValidMind model object\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind model object using the [`init_model`](https://docs.validmind.ai/validmind/validmind.html#init_model) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `model` — the model that you want to provide as input to tests\n",
-    "- `input_id` - a unique identifier that allows tracking what inputs are used when running each individual test"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_model_xgb = vm.init_model(\n",
-    "    xgb,\n",
-    "    input_id=\"xgb\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Similarly, initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset` — the raw dataset that you want to provide as input to tests\n",
-    "- `input_id` - a unique identifier that allows tracking what inputs are used when running each individual test\n",
-    "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
-    "- `class_labels` — an optional value to map predicted classes to class labels\n",
-    "\n",
-    "With all datasets ready, you can now initialize the raw, training and test datasets (`raw_df`, `train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_ds = vm.init_dataset(\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    dataset=raw_df,\n",
-    "    target_column=demo_dataset.target_column,\n",
-    ")\n",
-    "\n",
-    "feature_columns = [\n",
-    "    \"CreditScore\",\n",
-    "    \"Gender\",\n",
-    "    \"Age\",\n",
-    "    \"Tenure\",\n",
-    "    \"Balance\",\n",
-    "    \"NumOfProducts\",\n",
-    "    \"HasCrCard\",\n",
-    "    \"IsActiveMember\",\n",
-    "    \"EstimatedSalary\",\n",
-    "    \"Geography_France\",\n",
-    "    \"Geography_Germany\",\n",
-    "    \"Geography_Spain\",\n",
-    "]\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    feature_columns=feature_columns,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset\",\n",
-    "    dataset=test_df,\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    feature_columns=feature_columns,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_3__'></a>\n",
-    "\n",
-    "### Run predictions through `assign_predictions` interface\n",
-    "\n",
-    "We can use `assign_predictions()` to run and assign model predictions to our training and test datasets:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(model=vm_model_xgb)\n",
-    "vm_test_ds.assign_predictions(model=vm_model_xgb)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Run documentation tests"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_1__'></a>\n",
-    "\n",
-    "### Preview config\n",
-    "\n",
-    "You can preview the default config for the documentation template using the `vm.get_test_suite().get_default_config()` interface."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import json\n",
-    "\n",
-    "model_test_suite = vm.get_test_suite()\n",
-    "config = model_test_suite.get_default_config()\n",
-    "print(\"Suite Config: \\n\", json.dumps(config, indent=2))"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_2__'></a>\n",
-    "\n",
-    "### Updating config\n",
-    "\n",
-    "The test configuration can be updated to fit with your use case and requirements"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "config = {\n",
-    "    \"validmind.data_validation.DatasetSplit\": {\n",
-    "        \"inputs\": {\"datasets\": (vm_train_ds, vm_test_ds)},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.PopulationStabilityIndex\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"datasets\": (vm_train_ds, vm_test_ds)},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:in_sample\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_train_ds},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:out_of_sample\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.PrecisionRecallCurve\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.TrainingTestDegradation\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"datasets\": (vm_train_ds, vm_test_ds)},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.MinimumROCAUCScore\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.PermutationFeatureImportance\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.SHAPGlobalImportance\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.WeakspotsDiagnosis\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"datasets\": (vm_train_ds, vm_test_ds)},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.OverfitDiagnosis\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"datasets\": (vm_train_ds, vm_test_ds)},\n",
-    "    },\n",
-    "    \"validmind.model_validation.sklearn.RobustnessDiagnosis\": {\n",
-    "        \"inputs\": {\"model\": vm_model_xgb, \"datasets\": (vm_train_ds, vm_test_ds)},\n",
-    "    },\n",
-    "}"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_3__'></a>\n",
-    "\n",
-    "### Run documentation tests\n",
-    "\n",
-    "You can now run all documentation tests and pass an extra `config` parameter that overrides input and parameter configuration for the tests specified in the object."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = vm.run_documentation_tests(\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_ds,\n",
-    "        \"model\": vm_model_xgb,\n",
-    "    },\n",
-    "    config=config,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc9_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc9_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc10__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-d1660c97181e4b7e9470b3529ffef83d",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "colab": {
-   "provenance": []
-  },
-  "gpuClass": "standard",
-  "kernelspec": {
-   "display_name": ".venv",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.8.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 0
-}
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Run documentation tests with custom configurations\n",
+        "\n",
+        "When running documentation tests, you can configure inputs and parameters for individual tests by passing a config as a parameter.\n",
+        "\n",
+        "As a model developer, configuring individual tests is useful in various model development scenarios. For instance, based on a use case, a model might require changing inputs and/or parameters for certain tests. The `run_documentation_tests()` function allows you to directly configure tests through `config`, thus giving you flexibility to run tests according to your use case.\n",
+        "\n",
+        "This interactive notebook includes the code required to load the demo dataset, preprocess the raw dataset, train a model for testing, initialize ValidMind objects, and run documentation tests with custom configurations."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_3__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "- [Document the model](#toc4__)    \n",
+        "- [Preprocess the raw dataset](#toc5__)    \n",
+        "- [Train a model for testing](#toc6__)    \n",
+        "- [Initialize ValidMind objects](#toc7__)    \n",
+        "  - [Initialize the ValidMind model](#toc7_1__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc7_2__)    \n",
+        "  - [Run predictions through `assign_predictions` interface](#toc7_3__)    \n",
+        "- [Run documentation tests](#toc8__)    \n",
+        "  - [Preview config](#toc8_1__)    \n",
+        "  - [Updating config](#toc8_2__)    \n",
+        "  - [Run documentation tests](#toc8_3__)    \n",
+        "- [Next steps](#toc9__)    \n",
+        "  - [Work with your documentation](#toc9_1__)    \n",
+        "  - [Discover more learning resources](#toc9_2__)    \n",
+        "- [Upgrade ValidMind](#toc10__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br><br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind Library. To be able to use it, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Import the sample dataset from the library\n",
+        "\n",
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = demo_dataset.load_data()\n",
+        "raw_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Document the model\n",
+        "\n",
+        "As part of documenting the model with the ValidMind Library, you need to preprocess the raw dataset, initialize some training and test datasets, initialize a model object you can use for testing, and then run the full suite of tests."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Preprocess the raw dataset\n",
+        "\n",
+        "Preprocessing performs a number of operations to get ready for the subsequent steps:\n",
+        "\n",
+        "- Preprocess the data: Splits the raw DataFrame (`raw_df`) into multiple datasets (`train_df`, `validation_df`, and `test_df`) using `demo_dataset.preprocess` to simplify preprocessing.\n",
+        "- Separate features and targets: Drops the target column to create feature sets (`x_train`, `x_val`) and target sets (`y_train`, `y_val`).\n",
+        "- Initialize XGBoost classifier: Creates an `XGBClassifier` object with early stopping rounds set to 10.\n",
+        "- Set evaluation metrics: Specifies metrics for model evaluation as \"error,\" \"logloss,\" and \"auc.\"\n",
+        "- Fit the model: Trains the model on `x_train` and `y_train` using the validation set `(x_val, y_val)`. Verbose output is disabled."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df, validation_df, test_df = demo_dataset.preprocess(raw_df)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Train a model for testing\n",
+        "\n",
+        "We train a simple customer churn model for our test."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import xgboost\n",
+        "%matplotlib inline\n",
+        "\n",
+        "x_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_train = train_df[demo_dataset.target_column]\n",
+        "x_val = validation_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_val = validation_df[demo_dataset.target_column]\n",
+        "\n",
+        "xgb = xgboost.XGBClassifier(early_stopping_rounds=10)\n",
+        "xgb.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "xgb.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        "    eval_set=[(x_val, y_val)],\n",
+        "    verbose=False,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Initialize ValidMind objects"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind model\n",
+        "\n",
+        "Before you run tests, you'll need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for our model.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# FUNCTION ARGUMENTS:\n",
+        "# model - the model that you want to provide as input to tests\n",
+        "# input_id - a unique identifier that allows tracking what inputs are used when running each individual test\n",
+        "\n",
+        "vm_model_xgb = vm.init_model(\n",
+        "    xgb,\n",
+        "    input_id=\"xgb\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Similarly, initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset` — the raw dataset that you want to provide as input to tests\n",
+        "- `input_id` — a unique identifier that allows tracking what inputs are used when running each individual test\n",
+        "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
+        "- `class_labels` — an optional value to map predicted classes to class labels\n",
+        "\n",
+        "With all datasets ready, you can now initialize the raw, training and test datasets (`raw_df`, `train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_ds = vm.init_dataset(\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    dataset=raw_df,\n",
+        "    target_column=demo_dataset.target_column,\n",
+        ")\n",
+        "\n",
+        "feature_columns = [\n",
+        "    \"CreditScore\",\n",
+        "    \"Gender\",\n",
+        "    \"Age\",\n",
+        "    \"Tenure\",\n",
+        "    \"Balance\",\n",
+        "    \"NumOfProducts\",\n",
+        "    \"HasCrCard\",\n",
+        "    \"IsActiveMember\",\n",
+        "    \"EstimatedSalary\",\n",
+        "    \"Geography_France\",\n",
+        "    \"Geography_Germany\",\n",
+        "    \"Geography_Spain\",\n",
+        "]\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    feature_columns=feature_columns,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset\",\n",
+        "    dataset=test_df,\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    feature_columns=feature_columns,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_3__'></a>\n",
+        "\n",
+        "### Run predictions through `assign_predictions` interface\n",
+        "\n",
+        "We can use `assign_predictions()` to run and assign model predictions to our training and test datasets:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(model=vm_model_xgb)\n",
+        "vm_test_ds.assign_predictions(model=vm_model_xgb)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Run documentation tests"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8_1__'></a>\n",
+        "\n",
+        "### Preview config\n",
+        "\n",
+        "You can preview the default config for the documentation template using the `vm.get_test_suite().get_default_config()` interface."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import json\n",
+        "\n",
+        "model_test_suite = vm.get_test_suite()\n",
+        "config = model_test_suite.get_default_config()\n",
+        "print(\"Suite Config: \\n\", json.dumps(config, indent=2))"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8_2__'></a>\n",
+        "\n",
+        "### Updating config\n",
+        "\n",
+        "The test configuration can be updated to fit your use case and requirements:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "config = {\n",
+        "    \"validmind.data_validation.DatasetSplit\": {\n",
+        "        \"inputs\": {\"datasets\": (vm_train_ds, vm_test_ds)},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.PopulationStabilityIndex\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"datasets\": (vm_train_ds, vm_test_ds)},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:in_sample\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_train_ds},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:out_of_sample\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.PrecisionRecallCurve\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.TrainingTestDegradation\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"datasets\": (vm_train_ds, vm_test_ds)},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.MinimumROCAUCScore\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.PermutationFeatureImportance\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.SHAPGlobalImportance\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"dataset\": vm_test_ds},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.WeakspotsDiagnosis\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"datasets\": (vm_train_ds, vm_test_ds)},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.OverfitDiagnosis\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"datasets\": (vm_train_ds, vm_test_ds)},\n",
+        "    },\n",
+        "    \"validmind.model_validation.sklearn.RobustnessDiagnosis\": {\n",
+        "        \"inputs\": {\"model\": vm_model_xgb, \"datasets\": (vm_train_ds, vm_test_ds)},\n",
+        "    },\n",
+        "}"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8_3__'></a>\n",
+        "\n",
+        "### Run documentation tests\n",
+        "\n",
+        "You can now run all documentation tests and pass an extra `config` parameter that overrides input and parameter configuration for the tests specified in the object."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "full_suite = vm.run_documentation_tests(\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_ds,\n",
+        "        \"model\": vm_model_xgb,\n",
+        "    },\n",
+        "    config=config,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc9_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc9_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc10__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to take effect."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-d0990f47a72e4eaab065be1540234792"
+    }
+  ],
+  "metadata": {
+    "colab": {
+      "provenance": []
+    },
+    "gpuClass": "standard",
+    "kernelspec": {
+      "display_name": ".venv",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.8.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 0
+}
\ No newline at end of file
diff --git a/site/notebooks/quickstart/quickstart_model_documentation.Rmd b/site/notebooks/quickstart/quickstart_documentation.Rmd
similarity index 69%
rename from site/notebooks/quickstart/quickstart_model_documentation.Rmd
rename to site/notebooks/quickstart/quickstart_documentation.Rmd
index fc48d8c445..d9bfdc2c56 100644
--- a/site/notebooks/quickstart/quickstart_model_documentation.Rmd
+++ b/site/notebooks/quickstart/quickstart_documentation.Rmd
@@ -1,20 +1,20 @@
 ---
-title: "Quickstart for Model Documentation (R)"
+title: "Quickstart for documentation (R)"
 author: "ValidMind"
 date: "2026-03-18"
 output: html_document
 ---
 
-# Quickstart for Model Documentation
+# Quickstart for documentation
 
-Learn the basics of using ValidMind to document models as part of a model development workflow using R. This notebook uses the ValidMind R package (a `reticulate` wrapper around the Python library) to generate a draft of documentation for a binary classification model.
+Learn the basics of using ValidMind to document records as part of a development workflow with R. Using the ValidMind R package (a `reticulate` wrapper around the Python library), you'll generate a draft of documentation using ValidMind tests for a binary classification model.
 
-We will:
+To document our model with the ValidMind Library, we'll:
 
 1. Import a sample dataset and preprocess it
 2. Split the datasets and initialize them for use with ValidMind
-3. Train a logistic regression (GLM) model and initialize it for use with testing
-4. Run the full suite of documentation tests, sending results to the ValidMind Platform
+3. Initialize a ValidMind model object for use with testing
+4. Run a full suite of tests as defined by our documentation template, which will send the results of those tests to the ValidMind Platform
 
 ## Setting up
 
@@ -39,15 +39,41 @@ library(knitr)
 knitr::opts_chunk$set(warning = FALSE, message = FALSE)
 ```
 
-## Initialize the ValidMind Library
+### Initialize the ValidMind Library
 
-Log in to the [ValidMind Platform](https://app.prod.validmind.ai) and register a model:
+#### Register sample model
 
-1. Navigate to **Inventory** and click **+ Register Model**.
-2. Under **Documents > Development**, select the `Binary classification` template.
-3. Go to **Getting Started**, select `Development` from the **DOCUMENT** drop-down, and copy the code snippet.
+Log in to the [ValidMind Platform](https://app.prod.validmind.ai) and register a sample record (model):
 
-Replace the placeholder values below with your own credentials:
+1. In the left sidebar, select **Inventory**.
+
+2. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))
+
+3. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.
+
+4. Select your own name under the **RECORD OWNER** drop-down.
+
+5. Click **Register Model** to add the model to your inventory.
+
+#### Apply documentation template
+
+Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.
+
+1. In the left sidebar that appears for your model, click **Documents** and select **Development**.
+
+2. Under **TEMPLATE**, select `Binary classification`.
+
+3. Click **Use Template** to apply the template.
+
+#### Get your code snippet
+
+Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.
+
+1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.
+
+2. Click **Copy snippet to clipboard**. Paste the snippet into an editor and make note of the credentials.
+
+3. Next, replace the placeholder values below with your own credentials:
 
 ```{r}
 vm_r <- vm(
@@ -164,7 +190,7 @@ vm_test_ds <- vm_r$init_dataset(
 )
 ```
 
-## Initialize a model object
+## Initialize the ValidMind model
 
 Save the R model and initialize it with ValidMind:
 
@@ -216,7 +242,7 @@ full_suite <- vm_r$run_documentation_tests(config = test_config)
 Head to the [ValidMind Platform](https://app.prod.validmind.ai) to view the generated documentation:
 
 1. Navigate to **Inventory** and select your model.
-2. Click **Development** under Documents to see the full draft of your model documentation.
+2. Click **Development** under Documents to see the full draft of your documentation.
 
 From there, you can make qualitative edits, collaborate with validators, and submit for approval.
 
diff --git a/site/notebooks/quickstart/quickstart_documentation.ipynb b/site/notebooks/quickstart/quickstart_documentation.ipynb
new file mode 100644
index 0000000000..033e023454
--- /dev/null
+++ b/site/notebooks/quickstart/quickstart_documentation.ipynb
@@ -0,0 +1,930 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "id": "7b021b0d",
+      "metadata": {},
+      "source": [
+        "# Quickstart for documentation\n",
+        "\n",
+        "Learn the basics of using ValidMind to document records as part of a development workflow. Set up the ValidMind Library in your environment, and generate a draft of documentation using ValidMind tests for a binary classification model.\n",
+        "\n",
+        "To document our model with the ValidMind Library, we'll:\n",
+        "\n",
+        "1. Import a sample dataset and preprocess it\n",
+        "2. Split the datasets and initialize them for use with ValidMind\n",
+        "3. Initialize a ValidMind model object for use with testing\n",
+        "4. Run a full suite of tests as defined by our documentation template, which will send the results of those tests to the ValidMind Platform"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "167aef58",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Introduction](#toc1__)    \n",
+        "- [About ValidMind](#toc2__)    \n",
+        "  - [Before you begin](#toc2_1__)    \n",
+        "  - [New to ValidMind?](#toc2_2__)    \n",
+        "  - [Key concepts](#toc2_3__)    \n",
+        "- [Setting up](#toc3__)    \n",
+        "  - [Install the ValidMind Library](#toc3_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc3_2__)    \n",
+        "    - [Register sample model](#toc3_2_1__)    \n",
+        "    - [Apply documentation template](#toc3_2_2__)    \n",
+        "    - [Get your code snippet](#toc3_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc3_3__)    \n",
+        "- [Getting to know ValidMind](#toc4__)    \n",
+        "  - [Preview the documentation template](#toc4_1__)    \n",
+        "  - [View documentation in the ValidMind Platform](#toc4_2__)    \n",
+        "- [Working with ValidMind datasets](#toc5__)    \n",
+        "  - [Prepare the sample dataset](#toc5_1__)    \n",
+        "    - [Import the sample dataset](#toc5_1_1__)    \n",
+        "    - [Preprocess the raw dataset](#toc5_1_2__)    \n",
+        "    - [Split the dataset](#toc5_1_3__)    \n",
+        "    - [Separate features and targets](#toc5_1_4__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc5_2__)    \n",
+        "- [Working with ValidMind models](#toc6__)    \n",
+        "  - [Train an XGBoost classifier model](#toc6_1__)    \n",
+        "    - [Set evaluation metrics](#toc6_1_1__)    \n",
+        "    - [Fit the model](#toc6_1_2__)    \n",
+        "  - [Initialize the ValidMind model](#toc6_2__)    \n",
+        "  - [Assign predictions](#toc6_3__)    \n",
+        "- [Run a ValidMind test suite](#toc7__)    \n",
+        "- [In summary](#toc8__)    \n",
+        "- [Next steps](#toc9__)    \n",
+        "  - [Work with your documentation](#toc9_1__)    \n",
+        "  - [Discover more learning resources](#toc9_2__)    \n",
+        "- [Upgrade ValidMind](#toc10__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "1cce526f",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Introduction\n",
+        "\n",
+        "Development aims to produce a fit-for-purpose *champion* by conducting thorough testing and analysis, supporting the capabilities of the champion with evidence in the form of documentation and test results. Documentation should be clear and comprehensive, ideally following a structure or template covering all aspects of compliance with risk regulation.\n",
+        "\n",
+        "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
+        "\n",
+        "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
+        "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "f9b5eac2",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "650236de",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "b9d9d4cf",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "59b308f7",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "61b5cbeb",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "0f08166e",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "d1f6dbed",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "%pip install -q validmind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "1bf4e4cb",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "cb6e369b",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "7167d002",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "43037f46",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "e2c1dd22",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "1a6933d3",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Then, let's import the necessary libraries and set up your Python environment for data analysis:\n",
+        "\n",
+        "- Import **Extreme Gradient Boosting** (XGBoost) with an alias so that we can reference its functions in later calls. XGBoost is a powerful machine learning library designed for speed and performance, especially in handling structured or tabular data.\n",
+        "- Enable **`matplotlib`**, a plotting library used for visualizing data. This ensures that any plots you generate will render inline in our notebook output rather than opening in a separate window."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "62d7c2c1",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import xgboost as xgb\n",
+        "\n",
+        "%matplotlib inline"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "fafe8fc2",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Getting to know ValidMind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "d7ee565f",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "b2bce375",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.preview_template()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "fa0e43cb",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### View documentation in the ValidMind Platform\n",
+        "\n",
+        "Next, let's head to the ValidMind Platform to see the template in action:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this notebook.\n",
+        "\n",
+        "3. Click **Development** under Documents for your model and note how the structure of the documentation matches our preview above."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "9d0d1005",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Working with ValidMind datasets"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "1b94e39f",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Prepare the sample dataset"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "6fc79fc1",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_1__'></a>\n",
+        "\n",
+        "#### Import the sample dataset\n",
+        "\n",
+        "First, let's import the public [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset from Kaggle so that we have something to work with.\n",
+        "\n",
+        "In the example below, note that:\n",
+        "\n",
+        "- The target column, `Exited`, has a value of `1` when a customer has churned and `0` otherwise.\n",
+        "- The ValidMind Library provides a wrapper to automatically load the dataset as a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) object. A Pandas DataFrame is a two-dimensional tabular data structure that makes use of rows and columns."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "58d1c94b",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from validmind.datasets.classification import customer_churn\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{customer_churn.target_column}' \\n\\t• Class labels: {customer_churn.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = customer_churn.load_data()\n",
+        "raw_df.head()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "4fe0f216",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_2__'></a>\n",
+        "\n",
+        "#### Preprocess the raw dataset\n",
+        "\n",
+        "Before running tests with ValidMind, we'll need to preprocess our imported dataset. This involves splitting the data and separating the features (inputs) from the targets (outputs)."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "9f690a04",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_3__'></a>\n",
+        "\n",
+        "#### Split the dataset\n",
+        "\n",
+        "Splitting our dataset helps assess how well the model generalizes to unseen data.\n",
+        "\n",
+        "Use [`preprocess()`](https://docs.validmind.ai/validmind/validmind/datasets/classification/customer_churn.html#preprocess) to split our dataset into three subsets:\n",
+        "\n",
+        "1. **train_df** — Used to train the model.\n",
+        "2. **validation_df** — Used to evaluate the model's performance during training.\n",
+        "3. **test_df** — Used later on to assess the model's performance on new, unseen data."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "418cb5aa",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "a9ad2104",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_4__'></a>\n",
+        "\n",
+        "#### Separate features and targets\n",
+        "\n",
+        "To train the model, we need to provide it with:\n",
+        "\n",
+        "1. **Inputs** — Features such as customer age, usage, etc.\n",
+        "2. **Outputs (Expected answers/labels)** — In our case, we would like to know whether the customer churned or not.\n",
+        "\n",
+        "Here, we'll use `x_train` and `x_val` to hold the input data (features), and `y_train` and `y_val` to hold the answers (the target we want to predict):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "6fd365fd",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_train = train_df[customer_churn.target_column]\n",
+        "x_val = validation_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_val = validation_df[customer_churn.target_column]"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "73d767d7",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests with your preprocessed datasets, you must first initialize a ValidMind `Dataset` object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
+        "\n",
+        "For this example, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
+        "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
+        "- **`class_labels`** — An optional value to map predicted classes to class labels."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "bb6ad06a",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the raw dataset\n",
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=raw_df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        "    class_labels=customer_churn.class_labels,\n",
+        ")\n",
+        "\n",
+        "# Initialize the training dataset\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        ")\n",
+        "\n",
+        "# Initialize the testing dataset\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    input_id=\"test_dataset\",\n",
+        "    target_column=customer_churn.target_column\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "0b33afca",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Working with ValidMind models"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "5962362c",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Train an XGBoost classifier model\n",
+        "\n",
+        "Next, let's create an XGBoost classifier model that will automatically stop training if it doesn’t improve after 10 tries.\n",
+        "\n",
+        "Setting a threshold avoids wasting time and helps prevent overfitting by stopping training when further improvement isn’t happening."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "3296cac6",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "model = xgb.XGBClassifier(early_stopping_rounds=10)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "33cafbcf",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1_1__'></a>\n",
+        "\n",
+        "#### Set evaluation metrics\n",
+        "\n",
+        "Then, we'll set the evaluation metrics, which tells the model to use three different ways to measure its performance:\n",
+        "\n",
+        "1. **error** — Measures how often the model makes incorrect predictions.\n",
+        "2. **logloss** — Indicates how confident the predictions are.\n",
+        "3. **auc** — Evaluates how well the model distinguishes between churn and not churn.\n",
+        "\n",
+        "Using multiple metrics gives a more complete picture of how good (or bad) the model is."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "32d3c3f4",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "model.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "47d84a80",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1_2__'></a>\n",
+        "\n",
+        "#### Fit the model\n",
+        "\n",
+        "Finally, our actual training step — where the model learns patterns from the data, so it can make predictions later:\n",
+        "\n",
+        "- The model is trained on `x_train` and `y_train`, and its performance is evaluated using `x_val` and `y_val` to check if it’s learning well.\n",
+        "- To turn off printed output while training, we'll set `verbose` to `False`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "3fb95ce4",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "model.fit(\n",
+        "    x_train,\n",
+        "    y_train,\n",
+        "    eval_set=[(x_val, y_val)],\n",
+        "    verbose=False,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "23bccb27",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind model\n",
+        "\n",
+        "You'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for our model.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "0e44eebd",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm_model = vm.init_model(\n",
+        "    model,\n",
+        "    input_id=\"model\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "20c008bf",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_3__'></a>\n",
+        "\n",
+        "### Assign predictions\n",
+        "\n",
+        "Once the model has been registered, you can assign model predictions to the training and testing datasets.\n",
+        "\n",
+        "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
+        "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
+        "\n",
+        "If no prediction values are passed, the method will compute predictions automatically:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "62bd94fc",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "0e66a7cd",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Run a ValidMind test suite\n",
+        "\n",
+        "This is where it all comes together — you are now ready to **run the documentation tests for the model as defined by the documentation template** you looked at earlier.\n",
+        "\n",
+        "The [`vm.run_documentation_tests`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests) function finds and runs every test specified in the template and then uploads all the documentation and test artifacts that get generated to the ValidMind Platform:\n",
+        "\n",
+        "- The function requires information about the inputs to use on every test. These inputs can be passed as an `inputs` argument if we want to use the same inputs for all tests. \n",
+        "- It's also possible to pass a `config` argument that has information about the `params` and `inputs` that each test requires. The `config` parameter is a dictionary with the following structure:\n",
+        "\n",
+        "    ```python\n",
+        "    config = {\n",
+        "        \"<test-id>\": {\n",
+        "            \"params\": {\n",
+        "                \"param1\": \"value1\",\n",
+        "                \"param2\": \"value2\",\n",
+        "                ...\n",
+        "            },\n",
+        "            \"inputs\": {\n",
+        "                \"input1\": \"value1\",\n",
+        "                \"input2\": \"value2\",\n",
+        "                ...\n",
+        "            }\n",
+        "        },\n",
+        "        ...\n",
+        "    }\n",
+        "    ```\n",
+        "\n",
+        "    Each `<test-id>` above corresponds to the test-driven block identifiers shown by `vm.preview_template()`. For this model, we will use the default parameters for all tests, but we'll need to specify the input configuration for each one. The method `get_demo_test_config()` below constructs the default input configuration for our demo."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "b3d6741b",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from validmind.utils import preview_test_config\n",
+        "\n",
+        "test_config = customer_churn.get_demo_test_config()\n",
+        "preview_test_config(test_config)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "7eebd40f",
+      "metadata": {},
+      "source": [
+        "Now we can pass the input configuration to `vm.run_documentation_tests()` and run the full suite of tests.\n",
+        "\n",
+        "The variable `full_suite` then holds the result of these tests:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "ae3accf7",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "full_suite = vm.run_documentation_tests(config=test_config)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "ed61fa23",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this notebook, you learned how to:\n",
+        "\n",
+        "- [x] Register a record (model) within the ValidMind Platform\n",
+        "- [x] Install and initialize the ValidMind Library\n",
+        "- [x] Preview the documentation template for your model\n",
+        "- [x] Import a sample dataset\n",
+        "- [x] Initialize ValidMind datasets and model objects\n",
+        "- [x] Assign model predictions to your ValidMind datasets\n",
+        "- [x] Run a full suite of documentation tests"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "68803cd9",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your documentation."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "ba38b729",
+      "metadata": {},
+      "source": [
+        "<a id='toc9_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "ae046dc4",
+      "metadata": {},
+      "source": [
+        "<a id='toc9_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "For a more in-depth introduction to using the ValidMind Library for development, check out our introductory development series and the accompanying interactive training:\n",
+        "\n",
+        "- **[ValidMind for development](https://docs.validmind.ai/developer/validmind-library.html#development)**\n",
+        "- **[Developer Fundamentals](https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html)**\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "4ce38015",
+      "metadata": {},
+      "source": [
+        "<a id='toc10__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "id": "35955b6b",
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "%pip show validmind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "f865e64e",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "65b36aa7",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-bd87da591b88473997979690dbffcfa5",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.12.12"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}
diff --git a/site/notebooks/quickstart/quickstart_model_documentation.ipynb b/site/notebooks/quickstart/quickstart_model_documentation.ipynb
deleted file mode 100644
index 40287aa57f..0000000000
--- a/site/notebooks/quickstart/quickstart_model_documentation.ipynb
+++ /dev/null
@@ -1,884 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "686bdc65",
-   "metadata": {},
-   "source": [
-    "# Quickstart for model documentation\n",
-    "\n",
-    "Learn the basics of using ValidMind to document models as part of a model development workflow. Set up the ValidMind Library in your environment, and generate a draft of documentation using ValidMind tests for a binary classification model.\n",
-    "\n",
-    "To document a model with the ValidMind Library, we'll:\n",
-    "\n",
-    "1. Import a sample dataset and preprocess it\n",
-    "2. Split the datasets and initialize them for use with ValidMind\n",
-    "3. Initialize a model object for use with testing\n",
-    "4. Run a full suite of tests as defined by our documentation template, which will send the results of those tests to the ValidMind Platform"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "17e1b850",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Introduction](#toc1__)    \n",
-    "- [About ValidMind](#toc2__)    \n",
-    "  - [Before you begin](#toc2_1__)    \n",
-    "  - [New to ValidMind?](#toc2_2__)    \n",
-    "  - [Key concepts](#toc2_3__)    \n",
-    "- [Setting up](#toc3__)    \n",
-    "  - [Install the ValidMind Library](#toc3_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc3_2__)    \n",
-    "    - [Register sample model](#toc3_2_1__)    \n",
-    "    - [Apply documentation template](#toc3_2_2__)    \n",
-    "    - [Get your code snippet](#toc3_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc3_3__)    \n",
-    "- [Getting to know ValidMind](#toc4__)    \n",
-    "  - [Preview the documentation template](#toc4_1__)    \n",
-    "  - [View model documentation in the ValidMind Platform](#toc4_2__)    \n",
-    "- [Import the sample dataset](#toc5__)    \n",
-    "- [Preprocessing the raw dataset](#toc6__)    \n",
-    "  - [Split the dataset](#toc6_1__)    \n",
-    "  - [Separate features and targets](#toc6_2__)    \n",
-    "- [Training an XGBoost classifier model](#toc7__)    \n",
-    "  - [Set evaluation metrics](#toc7_1__)    \n",
-    "  - [Fit the model](#toc7_2__)    \n",
-    "- [Initialize the ValidMind datasets](#toc8__)    \n",
-    "- [Initialize a model object](#toc9__)    \n",
-    "  - [Assign predictions](#toc9_1__)    \n",
-    "- [Run the full suite of tests](#toc10__)    \n",
-    "- [In summary](#toc11__)    \n",
-    "- [Next steps](#toc12__)    \n",
-    "  - [Work with your model documentation](#toc12_1__)    \n",
-    "  - [Discover more learning resources](#toc12_2__)    \n",
-    "- [Upgrade ValidMind](#toc13__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "16993535",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Introduction\n",
-    "\n",
-    "Model development aims to produce a fit-for-purpose *champion model* by conducting thorough testing and analysis, supporting the capabilities of the model with evidence in the form of documentation and test results. Model documentation should be clear and comprehensive, ideally following a structure or template covering all aspects of compliance with model risk regulation.\n",
-    "\n",
-    "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
-    "\n",
-    "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
-    "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3b8e33f0",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models. \n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "24a5e851",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "87f8ed22",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "61497ac2",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5c4158bd",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "fd4a5481",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d1f6dbed",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d32e4d62",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "70757032",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "445ac2ce",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c30a58b5",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e2c1dd22",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d1dcb3d0",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Then, let's import the necessary libraries and set up your Python environment for data analysis:\n",
-    "\n",
-    "- Import **Extreme Gradient Boosting** (XGBoost) with an alias so that we can reference its functions in later calls. XGBoost is a powerful machine learning library designed for speed and performance, especially in handling structured or tabular data.\n",
-    "- Enable **`matplotlib`**, a plotting library used for visualizing data. Ensures that any plots you generate will render inline in our notebook output rather than opening in a separate window."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "62d7c2c1",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost as xgb\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7bbc5e0c",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Getting to know ValidMind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b07067d5",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b2bce375",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1336b875",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### View model documentation in the ValidMind Platform\n",
-    "\n",
-    "Next, let's head to the ValidMind Platform to see the template in action:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this notebook.\n",
-    "\n",
-    "3. Click **Development** under Documents for your model and note how the structure of the documentation matches our preview above."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e2281cec",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Import the sample dataset\n",
-    "\n",
-    "First, let's import the public [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset from Kaggle so that we have something to work with.\n",
-    "\n",
-    "In our below example, note that: \n",
-    "\n",
-    "- The target column, `Exited` has a value of `1` when a customer has churned and `0` otherwise.\n",
-    "- The ValidMind Library provides a wrapper to automatically load the dataset as a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) object. A Pandas Dataframe is a two-dimensional tabular data structure that makes use of rows and columns."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "58d1c94b",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.classification import customer_churn\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{customer_churn.target_column}' \\n\\t• Class labels: {customer_churn.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = customer_churn.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0aafde18",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Preprocessing the raw dataset\n",
-    "\n",
-    "Before running tests with ValidMind, we'll need to preprocess our imported dataset. This involves splitting the data and separating the features (inputs) from the targets (outputs)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "dcd9848d",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Split the dataset\n",
-    "\n",
-    "Splitting our dataset helps assess how well the model generalizes to unseen data.\n",
-    "\n",
-    "Use [`preprocess()`](https://docs.validmind.ai/validmind/validmind/datasets/classification/customer_churn.html#preprocess) to split our dataset into three subsets:\n",
-    "\n",
-    "1. **train_df** — Used to train the model.\n",
-    "2. **validation_df** — Used to evaluate the model's performance during training.\n",
-    "3. **test_df** — Used later on to asses the model's performance on new, unseen data."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "418cb5aa",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0ed6cb75",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Separate features and targets\n",
-    "\n",
-    "To train the model, we need to provide it with:\n",
-    "\n",
-    "1. **Inputs** — Features such as customer age, usage, etc.\n",
-    "2. **Outputs (Expected answers/labels)** — in our case, we would like to know whether the customer churned or not.\n",
-    "\n",
-    "Here, we'll use `x_train` and `x_val` to hold the input data (features), and `y_train` and `y_val` to hold the answers (the target we want to predict):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "6fd365fd",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_train = train_df[customer_churn.target_column]\n",
-    "x_val = validation_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_val = validation_df[customer_churn.target_column]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3e1d226e",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Training an XGBoost classifier model\n",
-    "\n",
-    "Next, let's create an XGBoost classifier model that will automatically stop training if it doesn’t improve after 10 tries.\n",
-    "\n",
-    "Setting a threshold avoids wasting time and helps prevent overfitting by stopping training when further improvement isn’t happening."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "3296cac6",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "model = xgb.XGBClassifier(early_stopping_rounds=10)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d641a3f1",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Set evaluation metrics\n",
-    "\n",
-    "Then, we'll set the evaluation metrics, which tell the model to use three different ways to measure its performance:\n",
-    "\n",
-    "1. **error** — Measures how often the model makes incorrect predictions.\n",
-    "2. **logloss** — Indicates how confident the predictions are.\n",
-    "3. **auc** — Evaluates how well the model distinguishes between churn and not churn.\n",
-    "\n",
-    "Using multiple metrics gives a more complete picture of how good (or bad) the model is."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "32d3c3f4",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "model.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ec0de49c",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_2__'></a>\n",
-    "\n",
-    "### Fit the model\n",
-    "\n",
-    "Finally, our actual training step — where the model learns patterns from the data, so it can make predictions later:\n",
-    "\n",
-    "- The model is trained on `x_train` and `y_train`, and evaluates its performance using `x_val` and `y_val` to check if it’s learning well.\n",
-    "- To turn off printed output while training, we'll set `verbose` to `False`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "3fb95ce4",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "model.fit(\n",
-    "    x_train,\n",
-    "    y_train,\n",
-    "    eval_set=[(x_val, y_val)],\n",
-    "    verbose=False,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "833a5047",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests with your preprocessed datasets, you must first initialize a ValidMind `Dataset` object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
-    "\n",
-    "For this example, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
-    "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
-    "- **`class_labels`** — An optional value to map predicted classes to class labels."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "bb6ad06a",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the raw dataset\n",
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=raw_df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    "    class_labels=customer_churn.class_labels,\n",
-    ")\n",
-    "\n",
-    "# Initialize the training dataset\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    ")\n",
-    "\n",
-    "# Initialize the testing dataset\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    input_id=\"test_dataset\",\n",
-    "    target_column=customer_churn.target_column\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "316ae030",
-   "metadata": {},
-   "source": [
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## Initialize a model object\n",
-    "\n",
-    "You'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for our model.\n",
-    "\n",
-    "You simply initialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0e44eebd",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_model = vm.init_model(\n",
-    "    model,\n",
-    "    input_id=\"model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3002517f",
-   "metadata": {},
-   "source": [
-    "<a id='toc9_1__'></a>\n",
-    "\n",
-    "### Assign predictions\n",
-    "\n",
-    "Once the model has been registered, you can assign model predictions to the training and testing datasets.\n",
-    "\n",
-    "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
-    "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
-    "\n",
-    "If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "62bd94fc",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "123d94f9",
-   "metadata": {},
-   "source": [
-    "<a id='toc10__'></a>\n",
-    "\n",
-    "## Run the full suite of tests\n",
-    "\n",
-    "This is where it all comes together — you are now ready to **run the documentation tests for the model as defined by the documentation template** you looked at earlier.\n",
-    "\n",
-    "The [`vm.run_documentation_tests`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests) function finds and runs every test specified in the template and then uploads all the documentation and test artifacts that get generated to the ValidMind Platform:\n",
-    "\n",
-    "- The function requires information about the inputs to use on every test. These inputs can be passed as an `inputs` argument if we want to use the same inputs for all tests. \n",
-    "- It's also possible to pass a `config` argument that has information about the `params` and `inputs` that each test requires. The `config` parameter is a dictionary with the following structure:\n",
-    "\n",
-    "    ```python\n",
-    "    config = {\n",
-    "        \"<test-id>\": {\n",
-    "            \"params\": {\n",
-    "                \"param1\": \"value1\",\n",
-    "                \"param2\": \"value2\",\n",
-    "                ...\n",
-    "            },\n",
-    "            \"inputs\": {\n",
-    "                \"input1\": \"value1\",\n",
-    "                \"input2\": \"value2\",\n",
-    "                ...\n",
-    "            }\n",
-    "        },\n",
-    "        ...\n",
-    "    }\n",
-    "    ```\n",
-    "\n",
-    "    Each `<test-id>` above corresponds to the test-driven block identifiers shown by `vm.preview_template()`. For this model, we will use the default parameters for all tests, but we'll need to specify the input configuration for each one. The method `get_demo_test_config()` below constructs the default input configuration for our demo."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b3d6741b",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.utils import preview_test_config\n",
-    "\n",
-    "test_config = customer_churn.get_demo_test_config()\n",
-    "preview_test_config(test_config)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "323c9246",
-   "metadata": {},
-   "source": [
-    "Now we can pass the input configuration to `vm.run_documentation_tests()` and run the full suite of tests.\n",
-    "\n",
-    "The variable `full_suite` then holds the result of these tests:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "ae3accf7",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = vm.run_documentation_tests(config=test_config)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5235c139",
-   "metadata": {},
-   "source": [
-    "<a id='toc11__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this notebook, you learned how to:\n",
-    "\n",
-    "- [x] Register a model within the ValidMind Platform\n",
-    "- [x] Install and initialize the ValidMind Library\n",
-    "- [x] Preview the documentation template for your model\n",
-    "- [x] Import a sample dataset\n",
-    "- [x] Initialize ValidMind datasets and model objects\n",
-    "- [x] Assign model predictions to your ValidMind datasets\n",
-    "- [x] Run a full suite of documentation tests"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2c84651a",
-   "metadata": {},
-   "source": [
-    "<a id='toc12__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "946e40b2",
-   "metadata": {},
-   "source": [
-    "<a id='toc12_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0b83397d",
-   "metadata": {},
-   "source": [
-    "<a id='toc12_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "For a more in-depth introduction to using the ValidMind Library for development, check out our introductory development series and the accompanying interactive training:\n",
-    "\n",
-    "- **[ValidMind for model development](https://docs.validmind.ai/developer/validmind-library.html#for-model-development)**\n",
-    "- **[Developer Fundamentals](https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html)**\n",
-    "\n",
-    "We also offer many interactive notebooks to help you document models:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "9c78dfe5",
-   "metadata": {},
-   "source": [
-    "<a id='toc13__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "35955b6b",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f6061b3d",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f7216e8c",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after upgrading the package for the changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-e26871efeffc48e386d68e90db1838e7",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/site/notebooks/quickstart/quickstart_model_validation.ipynb b/site/notebooks/quickstart/quickstart_model_validation.ipynb
deleted file mode 100644
index 63e17f2a88..0000000000
--- a/site/notebooks/quickstart/quickstart_model_validation.ipynb
+++ /dev/null
@@ -1,1207 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "395ae75c",
-   "metadata": {},
-   "source": [
-    "# Quickstart for model validation\n",
-    "\n",
-    "Learn the basics of using ValidMind to validate models as part of a model validation workflow. Set up the ValidMind Library in your environment, and generate a draft of a validation report using ValidMind tests for a binary classification model.\n",
-    "\n",
-    "To validate a model with the ValidMind Library, we'll:\n",
-    "\n",
-    "1. Import a sample dataset and preprocess it, then split the datasets and initialize them for use with ValidMind\n",
-    "2. Independently verify data quality tests performed on datasets by model development\n",
-    "3. Import a champion model for evaluation\n",
-    "4. Run model evaluation tests with the ValidMind Library, which will send the results of those tests to the ValidMind Platform"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2e85681d",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Introduction](#toc1__)    \n",
-    "- [About ValidMind](#toc2__)    \n",
-    "  - [Before you begin](#toc2_1__)    \n",
-    "  - [New to ValidMind?](#toc2_2__)    \n",
-    "  - [Key concepts](#toc2_3__)    \n",
-    "- [Setting up](#toc3__)    \n",
-    "  - [Register a sample model](#toc3_1__)    \n",
-    "    - [Assign validator credentials](#toc3_1_1__)    \n",
-    "    - [Apply validation report template](#toc3_1_2__)    \n",
-    "  - [Install the ValidMind Library](#toc3_2__)    \n",
-    "  - [Initialize the ValidMind Library](#toc3_3__)    \n",
-    "    - [Get your code snippet](#toc3_3_1__)    \n",
-    "  - [Initialize the Python environment](#toc3_4__)    \n",
-    "- [Getting to know ValidMind](#toc4__)    \n",
-    "  - [Preview the validation report template](#toc4_1__)    \n",
-    "  - [View validation report in the ValidMind Platform](#toc4_2__)    \n",
-    "- [Importing the sample dataset](#toc5__)    \n",
-    "  - [Load the sample dataset](#toc5_1__)    \n",
-    "  - [Preprocess the raw dataset](#toc5_2__)    \n",
-    "    - [Split the dataset](#toc5_2_1__)    \n",
-    "    - [Separate features and targets](#toc5_2_2__)    \n",
-    "- [Running data quality tests](#toc6__)    \n",
-    "  - [Identify qualitative tests](#toc6_1__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc6_2__)    \n",
-    "  - [Run an individual data quality test](#toc6_3__)    \n",
-    "  - [Run data comparison tests](#toc6_4__)    \n",
-    "- [Importing the champion model](#toc7__)    \n",
-    "  - [Initialize a model object](#toc7_1__)    \n",
-    "  - [Assign predictions](#toc7_2__)    \n",
-    "- [Running model evaluation tests](#toc8__)    \n",
-    "  - [Run model performance tests](#toc8_1__)    \n",
-    "  - [Run diagnostic tests](#toc8_2__)    \n",
-    "  - [Run feature importance tests](#toc8_3__)    \n",
-    "- [In summary](#toc9__)    \n",
-    "- [Next steps](#toc10__)    \n",
-    "  - [Work with your validation report](#toc10_1__)    \n",
-    "  - [Discover more learning resources](#toc10_2__)    \n",
-    "- [Upgrade ValidMind](#toc11__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5156da5e",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Introduction\n",
-    "\n",
-    "Model validation aims to independently assess the compliance of *champion models* created by model developers with regulatory guidance by conducting thorough testing and analysis, potentially including the use of challenger models to benchmark performance. Assessments, presented in the form of a validation report, typically include *artifacts (findings)* and recommendations to address those issues.\n",
-    "\n",
-    "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
-    "\n",
-    "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
-    "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "76b38b30",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate comparison and other validation tests, and then use the ValidMind Platform to submit compliance assessments of champion models via comprehensive validation reports. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model developers."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "cb0042c8",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "67b0915f",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d0f2ef91",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Validation report**: A comprehensive and structured assessment of a model’s development and performance, focusing on verifying its integrity, appropriateness, and alignment with its intended use. It includes analyses of model assumptions, data quality, performance metrics, outcomes of testing procedures, and risk considerations. The validation report supports transparency, regulatory compliance, and informed decision-making by documenting the validator’s independent review and conclusions.\n",
-    "\n",
-    "**Validation report template**: Serves as a standardized framework for conducting and documenting model validation activities. It outlines the required sections, recommended analyses, and expected validation tests, ensuring consistency and completeness across validation reports. The template helps guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.\n",
-    "\n",
-    "**Tests**: Functions contained in the ValidMind Library, each designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d5a91730",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "144c69e9",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Register a sample model\n",
-    "\n",
-    "In a usual model lifecycle, a champion model will have been independently registered in your model inventory and submitted to you for validation by your model development team as part of the effective challenge process. (**Learn more:** [Submit for approval](https://docs.validmind.ai/guide/model-documentation/submit-for-approval.html))\n",
-    "\n",
-    "For this notebook, we'll have you register a dummy model in the ValidMind Platform inventory and assign yourself as the validator to familiarize you with the ValidMind interface and circumvent the need for an existing model:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down — don’t worry, we’ll adjust these permissions next for validation.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "45c2cd47",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_1__'></a>\n",
-    "\n",
-    "#### Assign validator credentials\n",
-    "\n",
-    "In order to log tests as a validator instead of as a developer, on the model details page that appears after you've successfully registered your sample model:\n",
-    "\n",
-    "1. Remove yourself as a model owner: \n",
-    "\n",
-    "    - Click on the **OWNERS** tile.\n",
-    "    - Click the **x** next to your name to remove yourself from that model's role.\n",
-    "    - Click **Save** to apply your changes to that role.\n",
-    "\n",
-    "2. Remove yourself as a developer: \n",
-    "\n",
-    "    - Click on the **DEVELOPERS** tile.\n",
-    "    - Click the **x** next to your name to remove yourself from that model's role.\n",
-    "    - Click **Save** to apply your changes to that role.\n",
-    "\n",
-    "3. Add yourself as a validator: \n",
-    "\n",
-    "    - Click on the **VALIDATORS** tile.\n",
-    "    - Select your name from the drop-down menu.\n",
-    "    - Click **Save** to apply your changes to that role."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "15b34a9e",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_2__'></a>\n",
-    "\n",
-    "#### Apply validation report template\n",
-    "\n",
-    "Next, let's select a validation report template. A template predefines sections for your report and provides a general outline to follow, making the validation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Validation**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Generic Validation Report`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "26218040",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "64eb485c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b3f92287",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ad3be9e8",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3_1__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "9c6ce354",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"validation-report\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b488736f",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_4__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Then, let's import the necessary libraries and set up your Python environment for data analysis by enabling **`matplotlib`**, a plotting library used for visualizing data.\n",
-    "\n",
-    "This ensures that any plots you generate will render inline in your notebook output rather than opening in a separate window:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "1e53065d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "014592ea",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Getting to know ValidMind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a880167f",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Preview the validation report template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for model validation. A template predefines sections for your validation report and provides a general outline to follow, making the validation process much easier.\n",
-    "\n",
-    "You will attach evidence to this template in the form of risk assessment notes, artifacts, and test results later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "be445598",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2fd993fa",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### View validation report in the ValidMind Platform\n",
-    "\n",
-    "Next, let's head to the ValidMind Platform to see the template in action:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this notebook.\n",
-    "\n",
-    "3. Click **Validation** under Documents for your model and note:\n",
-    "\n",
-    "    - [x] The risk assessment compliance summary at the top of the report (screenshot below)\n",
-    "    - [x] How the structure of the validation report reflects the previewed template\n",
-    "\n",
-    "    <img src= \"../tutorials/model_validation/compliance-summary.png\" alt=\"Screenshot showing the risk assessment compliance summary\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "832a2dc2",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Importing the sample dataset"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "dd3c2581",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Load the sample dataset\n",
-    "\n",
-    "First, let's import the public [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset from Kaggle, which was used to develop the dummy champion model.\n",
-    "\n",
-    "We'll use this dataset to review steps that should have been conducted during the initial development and documentation of the model to ensure that the model was built correctly. By independently performing steps taken by the model development team, we can confirm whether the model was built using appropriate and properly processed data.\n",
-    "\n",
-    "In our below example, note that:\n",
-    "\n",
-    "- The target column, `Exited` has a value of `1` when a customer has churned and `0` otherwise.\n",
-    "- The ValidMind Library provides a wrapper to automatically load the dataset as a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) object. A Pandas Dataframe is a two-dimensional tabular data structure that makes use of rows and columns."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "73076ee3",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.classification import customer_churn\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{customer_churn.target_column}' \\n\\t• Class labels: {customer_churn.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = customer_churn.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "049683d2",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Preprocess the raw dataset\n",
-    "\n",
-    "Let's say that thanks to the documentation submitted by the model development team ([Learn more ...](quickstart_model_documentation.ipynb)), we know that the sample dataset was first preprocessed before being used to train the champion model.\n",
-    "\n",
-    "During model validation, we use the same data processing logic and training procedure to confirm that the model's results can be reproduced independently, so let's also start by preprocessing our imported dataset to verify that preprocessing was done correctly. This involves splitting the data and separating the features (inputs) from the targets (outputs)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "6c8f5916",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2_1__'></a>\n",
-    "\n",
-    "#### Split the dataset\n",
-    "\n",
-    "Splitting our dataset helps assess how well the model generalizes to unseen data.\n",
-    "\n",
-    "Use [`preprocess()`](https://docs.validmind.ai/validmind/validmind/datasets/classification/customer_churn.html#preprocess) to split our dataset into three subsets:\n",
-    "\n",
-    "1. **train_df** — Used to train the model.\n",
-    "2. **validation_df** — Used to evaluate the model's performance during training.\n",
-    "3. **test_df** — Used later on to asses the model's performance on new, unseen data."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "ee8cfaaf",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "39883f88",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2_2__'></a>\n",
-    "\n",
-    "#### Separate features and targets\n",
-    "\n",
-    "To train the model, we need to provide it with:\n",
-    "\n",
-    "1. **Inputs** — Features such as customer age, usage, etc.\n",
-    "2. **Outputs (Expected answers/labels)** — in our case, we would like to know whether the customer churned or not.\n",
-    "\n",
-    "Here, we'll use `x_train` to hold the input features, and `y_train` to hold the target variable — the values we want the model to predict:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "6fe65be5",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
-    "y_train = train_df[customer_churn.target_column]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "6c54dacc",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Running data quality tests\n",
-    "\n",
-    "With everything ready to go, let's explore some of ValidMind's available tests to help us assess the quality of our datasets. Using ValidMind’s repository of tests streamlines your validation testing, and helps you ensure that your models are being validated appropriately."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e2682c35",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Identify qualitative tests\n",
-    "\n",
-    "We want to narrow down the tests we want to run from the selection provided by ValidMind, so we'll use the [`vm.tests.list_tasks_and_tags()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks_and_tags) to list which `tags` are associated with each `task` type:\n",
-    "\n",
-    "- **`tasks`** represent the kind of modeling task associated with a test. Here we'll focus on `classification` tasks.\n",
-    "- **`tags`** are free-form descriptions providing more details about the test, for example, what category the test falls into. Here we'll focus on the `data_quality` tag."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "85bc2f85",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tasks_and_tags()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ae249675",
-   "metadata": {},
-   "source": [
-    "Then we'll call [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to list all the data quality tests for classification:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "31b31a51",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(\n",
-    "    tags=[\"data_quality\"], task=\"classification\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1540287c",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests with your preprocessed datasets, you must first initialize a ValidMind `Dataset` object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
-    "\n",
-    "For this example, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
-    "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
-    "- **`class_labels`** — An optional value to map predicted classes to class labels."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "ba677dd7",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the raw dataset\n",
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=raw_df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    "    class_labels=customer_churn.class_labels,\n",
-    ")\n",
-    "\n",
-    "# Initialize the training dataset\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    ")\n",
-    "\n",
-    "# Initialize the validation dataset\n",
-    "vm_validation_ds = vm.init_dataset(\n",
-    "    dataset=validation_df,\n",
-    "    input_id=\"validation_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    ")\n",
-    "\n",
-    "# Initialize the testing dataset\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    input_id=\"test_dataset\",\n",
-    "    target_column=customer_churn.target_column\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "610e8c3e",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3__'></a>\n",
-    "\n",
-    "### Run an individual data quality test\n",
-    "\n",
-    "Next, we'll use our previously initialized raw dataset (`vm_raw_dataset`) as input to run an individual test, then log the result to the ValidMind Platform.\n",
-    "\n",
-    "- You run validation tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module.\n",
-    "- Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform.\n",
-    "\n",
-    "Here, we'll use the [`ClassImbalance` test](https://docs.validmind.ai/tests/data_validation/ClassImbalance.html) as an example:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "dcb9b017",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.ClassImbalance\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "74546420",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for some test IDs. </b></span>\n",
-    "<br></br>\n",
-    "That's expected, as when we run validations tests the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform. You'll continue to see this message throughout this notebook as we run and log more tests.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "91c2efb2",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4__'></a>\n",
-    "\n",
-    "### Run data comparison tests\n",
-    "<span id=\"data-comparison\">\n",
-    "\n",
-    "We can also use ValidMind to perform comparison tests between our datasets, again logging the results to the ValidMind Platform. Below, we'll perform two sets of comparison tests with a mix of our datasets and the same class imbalance test:\n",
-    "\n",
-    "- When running individual tests, you can use a custom **`result_id`** to tag the individual result with a unique identifier, appended to the `test_id` with a `:` separator.\n",
-    "- We can specify all the tests we'd ike to run in a dictionary called `test_config`, and we'll pass in an **`input_grid`** of individual test inputs to compare. In this case, we'll input our two datasets for comparison. Note here that the `input_grid` expects the `input_id` of the dataset as the value rather than the variable name we specified."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d53edde7",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Individual test config with inputs specified\n",
-    "test_config = {\n",
-    "    # Comparison between training and testing datasets to check if class balance is the same in both sets\n",
-    "    \"validmind.data_validation.ClassImbalance:train_vs_validation\": {\n",
-    "        \"input_grid\": {\"dataset\": [\"train_dataset\", \"validation_dataset\"]}\n",
-    "    },\n",
-    "    # Comparison between training and testing datasets to confirm that both sets have similar class distributions\n",
-    "    \"validmind.data_validation.ClassImbalance:train_vs_test\": {\n",
-    "        \"input_grid\": {\"dataset\": [\"train_dataset\", \"test_dataset\"]},\n",
-    "    },\n",
-    "}"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "676f342e",
-   "metadata": {},
-   "source": [
-    "Then batch run and log our tests in `test_config`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "1b97e404",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for t in test_config:\n",
-    "    print(t)\n",
-    "    try:\n",
-    "        # Check if test has input_grid\n",
-    "        if 'input_grid' in test_config[t]:\n",
-    "            # For tests with input_grid, pass the input_grid configuration\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
-    "        else:\n",
-    "            # Original logic for regular inputs\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
-    "    except Exception as e:\n",
-    "        print(f\"Error running test {t}: {str(e)}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "6b2087c7",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Importing the champion model\n",
-    "\n",
-    "With our raw dataset preprocessed, let's go ahead and import the champion model submitted by the model development team in the format of a `.pkl` file: **[xgboost_model_champion.pkl](xgboost_model_champion.pkl)**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "7f18188e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the champion model\n",
-    "import joblib\n",
-    "\n",
-    "xgboost = joblib.load(\"xgboost_model_champion.pkl\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8a4b4bb3",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Initialize a model object\n",
-    "\n",
-    "In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for our champion model.\n",
-    "\n",
-    "You simply initialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0a799cf2",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the champion XGBoost model\n",
-    "vm_xgboost = vm.init_model(\n",
-    "    xgboost,\n",
-    "    input_id=\"xgboost_champion\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b8174798",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_2__'></a>\n",
-    "\n",
-    "### Assign predictions\n",
-    "\n",
-    "Once the model has been registered, you can assign model predictions to the training and testing datasets.\n",
-    "\n",
-    "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
-    "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
-    "\n",
-    "If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "71dd8e7b",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_xgboost,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_xgboost,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ddd1e977",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Running model evaluation tests\n",
-    "\n",
-    "With our setup complete, let's run the rest of our validation tests. Since we have already verified the data quality of the dataset used to train our champion model, we will now focus on evaluating the model's performance."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a443989f",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_1__'></a>\n",
-    "\n",
-    "### Run model performance tests\n",
-    "\n",
-    "First, let's run some performance tests. Use [`vm.tests.list_tests()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to identify all the model performance tests for classification:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "202792e8",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(tags=[\"model_performance\"], task=\"classification\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "24f889e5",
-   "metadata": {},
-   "source": [
-    "We'll isolate the specific tests we want to run in `mpt`, and append an identifier for our champion model here to the `result_id` with a `:` separator like we did above in another test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "9fc18843",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "mpt = [\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:xgboost_champion\",\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix:xgboost_champion\",\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve:xgboost_champion\"\n",
-    "]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "69692f9c",
-   "metadata": {},
-   "source": [
-    "Now, let's run and log our batch of model performance tests using our testing dataset (`vm_test_ds`) for our champion model:\n",
-    "\n",
-    "- The test set serves as a proxy for real-world data, providing an unbiased estimate of model performance since it was not used during training or tuning.\n",
-    "- The test set also acts as protection against selection bias and model tweaking, giving a final, more unbiased checkpoint."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "6866b21c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for test in mpt:\n",
-    "    vm.tests.run_test(\n",
-    "        test,\n",
-    "        inputs={\n",
-    "            \"dataset\": vm_test_ds, \"model\" : vm_xgboost,\n",
-    "        },\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "bb3dd6ad",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_2__'></a>\n",
-    "\n",
-    "### Run diagnostic tests\n",
-    "\n",
-    "Next, we want to inspect the robustness and stability of our champion model. Use `list_tests()` to list all available diagnosis tests applicable to classification tasks:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "c9b3caa4",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(tags=[\"model_diagnosis\"], task=\"classification\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "83da587e",
-   "metadata": {},
-   "source": [
-    "Let’s now assess the model for potential signs of *overfitting* and identify any sub-segments where performance may inconsistent.\n",
-    "\n",
-    "Overfitting occurs when a model learns the training data too well, capturing not only the true pattern but noise and random fluctuations resulting in excellent performance on the training dataset but poor generalization to new, unseen data:\n",
-    "\n",
-    "- Since the training dataset (`vm_train_ds`) was used to fit the model, we use this set to establish a baseline performance for how well the model performs on data it has already seen.\n",
-    "- The testing dataset (`vm_test_ds`) was never seen during training, and here simulates real-world generalization, or how well the model performs on new, unseen data. "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "82f824f2",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.model_validation.sklearn.OverfitDiagnosis:xgboost_champion\",\n",
-    "    input_grid={\n",
-    "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
-    "        \"model\" : [vm_xgboost]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "917342c5",
-   "metadata": {},
-   "source": [
-    "Let's also conduct *robustness* and *stability* tests.\n",
-    "\n",
-    "- Robustness evaluates the model’s ability to maintain consistent performance under varying input conditions.\n",
-    "- Stability assesses whether the model produces consistent outputs across different data subsets or over time.\n",
-    "\n",
-    "Again, we'll use both the training and testing datasets to establish baseline performance and to simulate real-world generalization:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b2676197",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.model_validation.sklearn.RobustnessDiagnosis:xgboost_champion\",\n",
-    "    input_grid={\n",
-    "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
-    "        \"model\" : [vm_xgboost]\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "36b92e50",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_3__'></a>\n",
-    "\n",
-    "### Run feature importance tests\n",
-    "\n",
-    "We also want to verify the relative influence of different input features on our model's predictions. Use `list_tests()` to identify all the feature importance tests for classification and store them in `FI`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "9c8c26e6",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Store the feature importance tests\n",
-    "FI = vm.tests.list_tests(tags=[\"feature_importance\"], task=\"classification\",pretty=False)\n",
-    "FI"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "22f48ec7",
-   "metadata": {},
-   "source": [
-    "We'll only use our testing dataset (`vm_test_ds`) here, to provide a realistic, unseen sample that mimic future or production data, as the training dataset has already influenced our model during learning:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "5a49f550",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Run and log our feature importance tests with the testing dataset\n",
-    "for test in FI:\n",
-    "    vm.tests.run_test(\n",
-    "        \"\".join((test,':xgboost_champion')),\n",
-    "        inputs={\n",
-    "            \"dataset\": vm_test_ds, \"model\": vm_xgboost\n",
-    "        },\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3df0f5b6",
-   "metadata": {},
-   "source": [
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this notebook, you learned how to:\n",
-    "\n",
-    "- [x] Register a model within the ValidMind Platform\n",
-    "- [x] Install and initialize the ValidMind Library\n",
-    "- [x] Preview the validation report template for your model\n",
-    "- [x] Import a sample dataset and champion model\n",
-    "- [x] Initialize ValidMind datasets and model objects\n",
-    "- [x] Assign model predictions to your ValidMind model objects\n",
-    "- [x] Identify and run various validation tests\n",
-    "\n",
-    "In a usual model validation workflow, you would wrap up your validation testing by verifying that all the tests provided by the model development team were run and reported accurately, and perhaps even propose a challenger model, comparing the performance of the challenger with the running champion.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>With ValidMind, you can easily:</b></span>\n",
-    "<ul>\n",
-    "    <li>Specify all the tests you'd like to independently rerun, just like you did in the step <a href=\"#run-data-comparison-tests\" style=\"color: #DE257E;\">Run data comparision tests</a></li>\n",
-    "    <li>Evaluate the performance of a challenger model against the champion, just like you did in the steps under <a href=\"#running-model-evaluation-tests\" style=\"color: #DE257E;\">Running model evaluation tests</a></li>\n",
-    "</ul>\n",
-    "</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "71dd2d3c",
-   "metadata": {},
-   "source": [
-    "<a id='toc10__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your validation report."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "83648605",
-   "metadata": {},
-   "source": [
-    "<a id='toc10_1__'></a>\n",
-    "\n",
-    "### Work with your validation report\n",
-    "\n",
-    "Now that you've logged all your test results and verified the work done by the model development team, head to the ValidMind Platform to wrap up your validation report:\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
-    "\n",
-    "Include your logged test results as evidence, create risk assessment notes, add artifacts, and assess compliance, then submit your report for review when it's ready. **Learn more:** [Preparing validation reports](https://docs.validmind.ai/guide/model-validation/preparing-validation-reports.html)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c901f28f",
-   "metadata": {},
-   "source": [
-    "<a id='toc10_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "For a more in-depth introduction to using the ValidMind Library for validation, check out our introductory validation series and the accompanying interactive training:\n",
-    "\n",
-    "- **[ValidMind for model validation](https://docs.validmind.ai/developer/validmind-library.html#for-model-validation)**\n",
-    "- **[Validator Fundamentals](https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html)**\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "62f2d2ea",
-   "metadata": {},
-   "source": [
-    "<a id='toc11__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "upgrade-show-c0a446ff-f26f-4ad0-839a-e92927711798",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b3143537",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f7a7527f",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-09361e6dcd874470819686c63660be51",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/site/notebooks/quickstart/quickstart_model_validation.Rmd b/site/notebooks/quickstart/quickstart_validation.Rmd
similarity index 69%
rename from site/notebooks/quickstart/quickstart_model_validation.Rmd
rename to site/notebooks/quickstart/quickstart_validation.Rmd
index 547aaf29d5..b28d319a56 100644
--- a/site/notebooks/quickstart/quickstart_model_validation.Rmd
+++ b/site/notebooks/quickstart/quickstart_validation.Rmd
@@ -1,20 +1,20 @@
 ---
-title: "Quickstart for Model Validation (R)"
+title: "Quickstart for validation (R)"
 author: "ValidMind"
 date: "2026-03-18"
 output: html_document
 ---
 
-# Quickstart for Model Validation
+# Quickstart for validation
 
-Learn the basics of using ValidMind to validate models as part of a model validation workflow using R. This notebook uses the ValidMind R package (a `reticulate` wrapper around the Python library) to generate a draft of a validation report for a binary classification model.
+Learn the basics of using ValidMind to validate records as part of a validation workflow with R. Using the ValidMind R package (a `reticulate` wrapper around the Python library), you'll generate a draft of a validation report using ValidMind tests for a binary classification model.
 
-We will:
+To validate our model with the ValidMind Library, we'll:
 
-1. Import a sample dataset and preprocess it, then initialize datasets for use with ValidMind
+1. Import a sample dataset and preprocess it, then split the datasets and initialize them for use with ValidMind
 2. Independently verify data quality tests performed on datasets by model development
-3. Train a champion model for evaluation
-4. Run model evaluation tests with the ValidMind Library
+3. Import a champion model for evaluation
+4. Run model evaluation tests with the ValidMind Library, which will send the results of those tests to the ValidMind Platform
 
 ## Setting up
 
@@ -41,14 +41,63 @@ knitr::opts_chunk$set(warning = FALSE, message = FALSE)
 
 ## Initialize the ValidMind Library
 
-Log in to the [ValidMind Platform](https://app.prod.validmind.ai) and register a model:
+#### Register sample model
 
-1. Navigate to **Inventory** and click **+ Register Model**.
-2. Assign yourself as a **Validator** (remove yourself from Owner and Developer roles).
-3. Under **Documents > Validation**, select the `Generic Validation Report` template.
-4. Go to **Getting Started**, select `Validation` from the **DOCUMENT** drop-down, and copy the code snippet.
+In a usual lifecycle, a champion will have been independently registered in your inventory and submitted to you for validation by your development team as part of the effective challenge process.
 
-Replace the placeholder values below with your own credentials:
+For this exercise, log in to the [ValidMind Platform](https://app.prod.validmind.ai) and register a sample record (model) to circumvent the need for an existing model:
+
+1. In the left sidebar, select **Inventory**.
+
+2. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))
+
+3. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.
+
+4. Select your own name under the **RECORD OWNER** drop-down — don’t worry, we’ll adjust these permissions next for validation.
+
+5. Click **Register Model** to add the model to your inventory.
+
+#### Assign validator credentials
+
+In order to log tests as a validator instead of as a developer, on the details page that appears after you've successfully registered your sample model:
+
+1. Remove yourself as an owner:
+
+   - Click on the **OWNERS** tile.
+   - Click the **x** next to your name to remove yourself from that role.
+   - Click **Save** to apply your changes.
+
+2. Remove yourself as a developer:
+
+   - Click on the **DEVELOPERS** tile.
+   - Click the **x** next to your name to remove yourself from that role.
+   - Click **Save** to apply your changes.
+
+3. Add yourself as a validator:
+
+   - Click on the **VALIDATORS** tile.
+   - Select your name from the drop-down menu.
+   - Click **Save** to apply your changes.
+
+#### Apply validation report template
+
+Next, let's select a validation report template. A template predefines sections for your report and provides a general outline to follow, making the validation process much easier.
+
+1. In the model's left sidebar, click **Documents** and select **Validation**.
+
+2. Under **TEMPLATE**, select `Generic Validation Report`.
+
+3. Click **Use Template** to apply the template.
+
+#### Get your code snippet
+
+Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.
+
+1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.
+
+2. Click **Copy snippet to clipboard**. Paste the snippet into an editor and make note of the credentials.
+
+3. Next, replace the placeholder values below with your own credentials:
 
 ```{r}
 vm_r <- vm(
@@ -227,7 +276,7 @@ model <- glm(formula, data = train_data, family = binomial)
 summary(model)
 ```
 
-## Initialize the model object
+## Initialize the ValidMind model
 
 Save the R model and initialize it with ValidMind:
 
diff --git a/site/notebooks/quickstart/quickstart_validation.ipynb b/site/notebooks/quickstart/quickstart_validation.ipynb
new file mode 100644
index 0000000000..4d871e1226
--- /dev/null
+++ b/site/notebooks/quickstart/quickstart_validation.ipynb
@@ -0,0 +1,1248 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Quickstart for validation\n",
+        "\n",
+        "Learn the basics of using ValidMind to validate records as part of a validation workflow. Set up the ValidMind Library in your environment, and generate a draft of a validation report using ValidMind tests for a binary classification model.\n",
+        "\n",
+        "To validate our model with the ValidMind Library, we'll:\n",
+        "\n",
+        "1. Import a sample dataset and preprocess it, then split the datasets and initialize them for use with ValidMind\n",
+        "2. Independently verify data quality tests performed on datasets by model development\n",
+        "3. Import a champion model for evaluation\n",
+        "4. Run model evaluation tests with the ValidMind Library, which will send the results of those tests to the ValidMind Platform"
+      ],
+      "id": "1a88a895"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Introduction](#toc1__)    \n",
+        "- [About ValidMind](#toc2__)    \n",
+        "  - [Before you begin](#toc2_1__)    \n",
+        "  - [New to ValidMind?](#toc2_2__)    \n",
+        "  - [Key concepts](#toc2_3__)    \n",
+        "- [Setting up](#toc3__)    \n",
+        "  - [Register a sample model](#toc3_1__)    \n",
+        "    - [Assign validator credentials](#toc3_1_1__)    \n",
+        "    - [Apply validation report template](#toc3_1_2__)    \n",
+        "  - [Install the ValidMind Library](#toc3_2__)    \n",
+        "  - [Initialize the ValidMind Library](#toc3_3__)    \n",
+        "    - [Get your code snippet](#toc3_3_1__)    \n",
+        "  - [Initialize the Python environment](#toc3_4__)    \n",
+        "- [Getting to know ValidMind](#toc4__)    \n",
+        "  - [Preview the validation report template](#toc4_1__)    \n",
+        "  - [View validation report in the ValidMind Platform](#toc4_2__)    \n",
+        "- [Working with ValidMind datasets](#toc5__)    \n",
+        "  - [Prepare the sample dataset](#toc5_1__)    \n",
+        "    - [Load the sample dataset](#toc5_1_1__)    \n",
+        "    - [Preprocess the raw dataset](#toc5_1_2__)    \n",
+        "    - [Split the dataset](#toc5_1_3__)    \n",
+        "    - [Separate features and targets](#toc5_1_4__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc5_2__)    \n",
+        "- [Running data quality tests](#toc6__)    \n",
+        "  - [Identify qualitative tests](#toc6_1__)    \n",
+        "  - [Run an individual data quality test](#toc6_2__)    \n",
+        "  - [Run data comparison tests](#toc6_3__)    \n",
+        "- [Working with ValidMind models](#toc7__)    \n",
+        "  - [Import the champion model](#toc7_1__)    \n",
+        "  - [Initialize the ValidMind model](#toc7_2__)    \n",
+        "  - [Assign predictions](#toc7_3__)    \n",
+        "- [Running model evaluation tests](#toc8__)    \n",
+        "  - [Run model performance tests](#toc8_1__)    \n",
+        "  - [Run diagnostic tests](#toc8_2__)    \n",
+        "  - [Run feature importance tests](#toc8_3__)    \n",
+        "- [In summary](#toc9__)    \n",
+        "- [Next steps](#toc10__)    \n",
+        "  - [Work with your validation report](#toc10_1__)    \n",
+        "  - [Discover more learning resources](#toc10_2__)    \n",
+        "- [Upgrade ValidMind](#toc11__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "0493b0cb"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Introduction\n",
+        "\n",
+        "Validation aims to independently assess the compliance of *champions* created by developers with regulatory guidance by conducting thorough testing and analysis, potentially including the use of challengers to benchmark performance. Assessments, presented in the form of a validation report, typically include *artifacts (findings)* and recommendations to address those issues.\n",
+        "\n",
+        "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
+        "\n",
+        "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
+        "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
+      ],
+      "id": "717d2a16"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate comparison and other validation tests, and then use the ValidMind Platform to submit compliance assessments of champions via comprehensive validation reports. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and developers."
+      ],
+      "id": "369d00db"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ],
+      "id": "72800fc2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about validating records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ],
+      "id": "e2beb1bb"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**validation report:** A validation report is a comprehensive and structured review evaluating a record's accuracy, performance, and suitability for its intended purpose. A report follows established validation guidelines to ensure consistency and adherence to internal and regulatory standards — encompassing the process of risk assessment, identifying areas of potential error or risk within the record's components, supporting transparency, regulatory compliance, and informed decision-making by documenting the validator’s independent review and conclusions.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**validation report template**: A default ValidMind document template that serves as a standardized framework for conducting and documenting validation, including sections designated for attaching test results, evidence, or artifacts (findings). By outlining required documentation, recommended analyses, and expected validation tests, validation report templates ensure consistency and completeness across validation reports and help guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.\n",
+        "\n",
+        "**artifacts (findings)**: Observations or issues identified during validation, including any deviations from expected performance or standards. Artifacts are organized by type — default types provided by ValidMind include Validation Issue, Policy Exception, and Limitation. Custom artifact types can be created to track other categories relevant to your organization.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "78c8388c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "ec7b4755"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Register a sample model\n",
+        "\n",
+        "In a usual lifecycle, a champion will have been independently registered in your inventory and submitted to you for validation by your development team as part of the effective challenge process. (**Learn more:** [Submit documents](https://docs.validmind.ai/guide/documentation/submit-documents.html))\n",
+        "\n",
+        "For this notebook, we'll have you register a dummy record (model) in the ValidMind Platform inventory and assign yourself as the validator to familiarize you with the ValidMind interface and circumvent the need for an existing model:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down — don’t worry, we’ll adjust these permissions next for validation.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ],
+      "id": "97d44f44"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_1__'></a>\n",
+        "\n",
+        "#### Assign validator credentials\n",
+        "\n",
+        "In order to log tests as a validator instead of as a developer, on the details page that appears after you've successfully registered your sample model:\n",
+        "\n",
+        "1. Remove yourself as an owner:\n",
+        "\n",
+        "    - Click on the **OWNERS** tile.\n",
+        "    - Click the **x** next to your name to remove yourself from that model's role.\n",
+        "    - Click **Save** to apply your changes to that role.\n",
+        "\n",
+        "2. Remove yourself as a developer:\n",
+        "\n",
+        "    - Click on the **DEVELOPERS** tile.\n",
+        "    - Click the **x** next to your name to remove yourself from that model's role.\n",
+        "    - Click **Save** to apply your changes to that role.\n",
+        "\n",
+        "3. Add yourself as a validator:\n",
+        "\n",
+        "    - Click on the **VALIDATORS** tile.\n",
+        "    - Select your name from the drop-down menu.\n",
+        "    - Click **Save** to apply your changes to that role."
+      ],
+      "id": "fc3e48e1"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_2__'></a>\n",
+        "\n",
+        "#### Apply validation report template\n",
+        "\n",
+        "Next, let's select a validation report template. A template predefines sections for your report and provides a general outline to follow, making the validation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Validation**.\n",
+        "\n",
+        "    If you cannot locate your Validation document, make sure Validation type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Generic Validation Report`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "428260e0"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ],
+      "id": "7b16c381"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "64eb485c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ],
+      "id": "bf77550e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3_1__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "ae918c6c"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"validation-report\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "9c6ce354"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_4__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Then, let's import the necessary libraries and set up your Python environment for data analysis by enabling **`matplotlib`**, a plotting library used for visualizing data.\n",
+        "\n",
+        "This ensures that any plots you generate will render inline in our notebook output rather than opening in a separate window:"
+      ],
+      "id": "f9bc73e9"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "1e53065d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Getting to know ValidMind"
+      ],
+      "id": "e0e942dd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Preview the validation report template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for validation. A template predefines sections for your validation report and provides a general outline to follow, making the validation process much easier.\n",
+        "\n",
+        "You will attach evidence to this template in the form of risk assessment notes, artifacts, and test results later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library:"
+      ],
+      "id": "0361d8bf"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "be445598"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### View validation report in the ValidMind Platform\n",
+        "\n",
+        "Next, let's head to the ValidMind Platform to see the template in action:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this notebook.\n",
+        "\n",
+        "3. Click **Validation** under Documents for your model and note:\n",
+        "\n",
+        "    - [x] The risk assessment compliance summary at the top of the report (screenshot below)\n",
+        "    - [x] How the structure of the validation report reflects the previewed template\n",
+        "\n",
+        "    <img src= \"../tutorials/validation/compliance-summary.png\" alt=\"Screenshot showing the risk assessment compliance summary\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
+        "    <br><br>"
+      ],
+      "id": "4124c3d7"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Working with ValidMind datasets"
+      ],
+      "id": "767ea445"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Prepare the sample dataset"
+      ],
+      "id": "ae3f832d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_1__'></a>\n",
+        "\n",
+        "#### Load the sample dataset\n",
+        "\n",
+        "First, let's import the public [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset from Kaggle, which was used to develop the dummy champion.\n",
+        "\n",
+        "We'll use this dataset to review steps that should have been conducted during the initial development and documentation of the champion to ensure that the model was built correctly. By independently performing steps taken by the development team, we can confirm whether the model was built using appropriate and properly processed data.\n",
+        "\n",
+        "In our below example, note that:\n",
+        "\n",
+        "- The target column, `Exited`, has a value of `1` when a customer has churned and `0` otherwise.\n",
+        "- The ValidMind Library provides a wrapper to automatically load the dataset as a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) object. A Pandas DataFrame is a two-dimensional tabular data structure that makes use of rows and columns."
+      ],
+      "id": "f91775e8"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.datasets.classification import customer_churn\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{customer_churn.target_column}' \\n\\t• Class labels: {customer_churn.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = customer_churn.load_data()\n",
+        "raw_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "73076ee3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_2__'></a>\n",
+        "\n",
+        "#### Preprocess the raw dataset\n",
+        "\n",
+        "Let's say that thanks to the documentation submitted by the development team (**Learn more:** [Quickstart for documentation](quickstart_documentation.ipynb)), we know that the sample dataset was first preprocessed before being used to train the champion.\n",
+        "\n",
+        "During validation, we use the same data processing logic and training procedure to confirm that the champion's results can be reproduced independently, so let's also start by preprocessing our imported dataset to verify that preprocessing was done correctly. This involves splitting the data and separating the features (inputs) from the targets (outputs)."
+      ],
+      "id": "6ab7fd19"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_3__'></a>\n",
+        "\n",
+        "#### Split the dataset\n",
+        "\n",
+        "Splitting our dataset helps assess how well the model generalizes to unseen data.\n",
+        "\n",
+        "Use [`preprocess()`](https://docs.validmind.ai/validmind/validmind/datasets/classification/customer_churn.html#preprocess) to split our dataset into three subsets:\n",
+        "\n",
+        "1. **train_df** — Used to train the model.\n",
+        "2. **validation_df** — Used to evaluate the model's performance during training.\n",
+        "3. **test_df** — Used later on to assess the model's performance on new, unseen data."
+      ],
+      "id": "af660bf4"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df, validation_df, test_df = customer_churn.preprocess(raw_df)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "ee8cfaaf"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_4__'></a>\n",
+        "\n",
+        "#### Separate features and targets\n",
+        "\n",
+        "To train the model, we need to provide it with:\n",
+        "\n",
+        "1. **Inputs** — Features such as customer age, usage, etc.\n",
+        "2. **Outputs (Expected answers/labels)** — in our case, we would like to know whether the customer churned or not.\n",
+        "\n",
+        "Here, we'll use `x_train` to hold the input features, and `y_train` to hold the target variable — the values we want the model to predict:"
+      ],
+      "id": "125a39e6"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "x_train = train_df.drop(customer_churn.target_column, axis=1)\n",
+        "y_train = train_df[customer_churn.target_column]"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "6fe65be5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests with your preprocessed datasets, you must first initialize a ValidMind `Dataset` object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
+        "\n",
+        "For this example, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
+        "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
+        "- **`class_labels`** — An optional value to map predicted classes to class labels."
+      ],
+      "id": "b6674505"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Initialize the raw dataset\n",
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=raw_df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        "    class_labels=customer_churn.class_labels,\n",
+        ")\n",
+        "\n",
+        "# Initialize the training dataset\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        ")\n",
+        "\n",
+        "# Initialize the validation dataset\n",
+        "vm_validation_ds = vm.init_dataset(\n",
+        "    dataset=validation_df,\n",
+        "    input_id=\"validation_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        ")\n",
+        "\n",
+        "# Initialize the testing dataset\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    input_id=\"test_dataset\",\n",
+        "    target_column=customer_churn.target_column\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "ba677dd7"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Running data quality tests\n",
+        "\n",
+        "With everything ready to go, let's explore some of ValidMind's available tests to help us assess the quality of our datasets. Using ValidMind’s repository of tests streamlines your validation testing, and helps you ensure that your records are being validated appropriately."
+      ],
+      "id": "c53c6d35"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Identify qualitative tests\n",
+        "\n",
+        "We want to narrow down the tests we want to run from the selection provided by ValidMind, so we'll use the [`vm.tests.list_tasks_and_tags()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks_and_tags) to list which `tags` are associated with each `task` type:\n",
+        "\n",
+        "- **`tasks`** represent the kind of modeling task associated with a test. Here we'll focus on `classification` tasks.\n",
+        "- **`tags`** are free-form descriptions providing more details about the test, for example, what category the test falls into. Here we'll focus on the `data_quality` tag."
+      ],
+      "id": "b6acd486"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tasks_and_tags()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "85bc2f85"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Then we'll call [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to list all the data quality tests for classification:"
+      ],
+      "id": "9881e58a"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests(\n",
+        "    tags=[\"data_quality\"], task=\"classification\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "31b31a51"
+    },
+    {
+      "cell_type": "markdown",
+      "id": "d3e27375",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Run an individual data quality test\n",
+        "\n",
+        "Next, we'll use our previously initialized raw dataset (`vm_raw_dataset`) as input to run an individual test, then log the result to the ValidMind Platform.\n",
+        "\n",
+        "- You run validation tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module.\n",
+        "- Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform.\n",
+        "\n",
+        "Here, we'll use the `data_validation.ClassImbalance` test as an example:\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.ClassImbalance\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "dcb9b017"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for some test IDs. </b></span>\n",
+        "<br></br>\n",
+        "That's expected, as when we run validation tests the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform. You'll continue to see this message throughout this notebook as we run and log more tests.</div>"
+      ],
+      "id": "f6b7567b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_3__'></a>\n",
+        "\n",
+        "### Run data comparison tests\n",
+        "<span id=\"data-comparison\"></span>\n",
+        "\n",
+        "We can also use ValidMind to perform comparison tests between our datasets, again logging the results to the ValidMind Platform. Below, we'll perform two sets of comparison tests with a mix of our datasets and the same class imbalance test:\n",
+        "\n",
+        "- When running individual tests, you can use a custom **`result_id`** to tag the individual result with a unique identifier, appended to the `test_id` with a `:` separator.\n",
+        "- We can specify all the tests we'd like to run in a dictionary called `test_config`, and we'll pass in an **`input_grid`** of individual test inputs to compare. In this case, we'll input our two datasets for comparison. Note here that the `input_grid` expects the `input_id` of the dataset as the value rather than the variable name we specified."
+      ],
+      "id": "97286c0e"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Individual test config with inputs specified\n",
+        "test_config = {\n",
+        "    # Comparison between training and validation datasets to check if class balance is the same in both sets\n",
+        "    \"validmind.data_validation.ClassImbalance:train_vs_validation\": {\n",
+        "        \"input_grid\": {\"dataset\": [\"train_dataset\", \"validation_dataset\"]}\n",
+        "    },\n",
+        "    # Comparison between training and testing datasets to confirm that both sets have similar class distributions\n",
+        "    \"validmind.data_validation.ClassImbalance:train_vs_test\": {\n",
+        "        \"input_grid\": {\"dataset\": [\"train_dataset\", \"test_dataset\"]},\n",
+        "    },\n",
+        "}"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "d53edde7"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Then batch run and log our tests in `test_config`:"
+      ],
+      "id": "1f1b796b"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "for t in test_config:\n",
+        "    print(t)\n",
+        "    try:\n",
+        "        # Check if test has input_grid\n",
+        "        if 'input_grid' in test_config[t]:\n",
+        "            # For tests with input_grid, pass the input_grid configuration\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
+        "        else:\n",
+        "            # Original logic for regular inputs\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
+        "    except Exception as e:\n",
+        "        print(f\"Error running test {t}: {str(e)}\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "1b97e404"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Working with ValidMind models"
+      ],
+      "id": "1ca8c343"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Import the champion model\n",
+        "\n",
+        "With our raw dataset preprocessed, let's go ahead and import the champion submitted by the development team in the format of a `.pkl` file: **[xgboost_model_champion.pkl](xgboost_model_champion.pkl)**"
+      ],
+      "id": "1fd05953"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Import the champion model\n",
+        "import joblib\n",
+        "\n",
+        "xgboost = joblib.load(\"xgboost_model_champion.pkl\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "7f18188e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind model\n",
+        "\n",
+        "In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for our champion.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ],
+      "id": "ee26b0b6"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Initialize the champion XGBoost model\n",
+        "vm_xgboost = vm.init_model(\n",
+        "    xgboost,\n",
+        "    input_id=\"xgboost_champion\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0a799cf2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_3__'></a>\n",
+        "\n",
+        "### Assign predictions\n",
+        "\n",
+        "Once the model has been registered, you can assign model predictions to the training and testing datasets.\n",
+        "\n",
+        "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
+        "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
+        "\n",
+        "If no prediction values are passed, the method will compute predictions automatically:"
+      ],
+      "id": "823e49c5"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_xgboost,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_xgboost,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "71dd8e7b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Running model evaluation tests\n",
+        "\n",
+        "With our setup complete, let's run the rest of our validation tests. Since we have already verified the data quality of the dataset used to train our champion, we will now focus on evaluating the model's performance."
+      ],
+      "id": "2e29df90"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8_1__'></a>\n",
+        "\n",
+        "### Run model performance tests\n",
+        "\n",
+        "First, let's run some performance tests. Use [`vm.tests.list_tests()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to identify all the model performance tests for classification:"
+      ],
+      "id": "fc6af0e0"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests(tags=[\"model_performance\"], task=\"classification\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "202792e8"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We'll isolate the specific tests we want to run in `mpt`, and append an identifier for our champion model here to the `result_id` with a `:` separator like we did above in another test:"
+      ],
+      "id": "011b7c09"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "mpt = [\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:xgboost_champion\",\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix:xgboost_champion\",\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve:xgboost_champion\"\n",
+        "]"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "9fc18843"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now, let's run and log our batch of model performance tests using our testing dataset (`vm_test_ds`) for our champion model:\n",
+        "\n",
+        "- The test set serves as a proxy for real-world data, providing an unbiased estimate of model performance since it was not used during training or tuning.\n",
+        "- The test set also acts as protection against selection bias and model tweaking, giving a final, more unbiased checkpoint."
+      ],
+      "id": "52096118"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "for test in mpt:\n",
+        "    vm.tests.run_test(\n",
+        "        test,\n",
+        "        inputs={\n",
+        "            \"dataset\": vm_test_ds, \"model\" : vm_xgboost,\n",
+        "        },\n",
+        "    ).log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "6866b21c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8_2__'></a>\n",
+        "\n",
+        "### Run diagnostic tests\n",
+        "\n",
+        "Next, we want to inspect the robustness and stability of our champion. Use `list_tests()` to list all available diagnosis tests applicable to classification tasks:"
+      ],
+      "id": "842707f9"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests(tags=[\"model_diagnosis\"], task=\"classification\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "c9b3caa4"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let’s now assess the model for potential signs of *overfitting* and identify any sub-segments where performance may be inconsistent.\n",
+        "\n",
+        "Overfitting occurs when a model learns the training data too well, capturing not only the true pattern but also noise and random fluctuations, resulting in excellent performance on the training dataset but poor generalization to new, unseen data:\n",
+        "\n",
+        "- Since the training dataset (`vm_train_ds`) was used to fit the model, we use this set to establish a baseline performance for how well the model performs on data it has already seen.\n",
+        "- The testing dataset (`vm_test_ds`) was never seen during training, and here simulates real-world generalization, or how well the model performs on new, unseen data. "
+      ],
+      "id": "5295d37b"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.model_validation.sklearn.OverfitDiagnosis:xgboost_champion\",\n",
+        "    input_grid={\n",
+        "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
+        "        \"model\" : [vm_xgboost]\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "82f824f2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's also conduct *robustness* and *stability* tests.\n",
+        "\n",
+        "- Robustness evaluates the model’s ability to maintain consistent performance under varying input conditions.\n",
+        "- Stability assesses whether the model produces consistent outputs across different data subsets or over time.\n",
+        "\n",
+        "Again, we'll use both the training and testing datasets to establish baseline performance and to simulate real-world generalization:"
+      ],
+      "id": "88db22ed"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.model_validation.sklearn.RobustnessDiagnosis:xgboost_champion\",\n",
+        "    input_grid={\n",
+        "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
+        "        \"model\" : [vm_xgboost]\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "b2676197"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8_3__'></a>\n",
+        "\n",
+        "### Run feature importance tests\n",
+        "\n",
+        "We also want to verify the relative influence of different input features on our model's predictions. Use `list_tests()` to identify all the feature importance tests for classification and store them in `FI`:"
+      ],
+      "id": "9226c6ea"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Store the feature importance tests\n",
+        "FI = vm.tests.list_tests(tags=[\"feature_importance\"], task=\"classification\",pretty=False)\n",
+        "FI"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "9c8c26e6"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We'll only use our testing dataset (`vm_test_ds`) here, to provide a realistic, unseen sample that mimics future or production data, as the training dataset has already influenced our model during learning:"
+      ],
+      "id": "d36a3544"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Run and log our feature importance tests with the testing dataset\n",
+        "for test in FI:\n",
+        "    vm.tests.run_test(\n",
+        "        \"\".join((test,':xgboost_champion')),\n",
+        "        inputs={\n",
+        "            \"dataset\": vm_test_ds, \"model\": vm_xgboost\n",
+        "        },\n",
+        "    ).log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "5a49f550"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this notebook, you learned how to:\n",
+        "\n",
+        "- [x] Register a record (model) within the ValidMind Platform\n",
+        "- [x] Install and initialize the ValidMind Library\n",
+        "- [x] Preview the validation report template for your model\n",
+        "- [x] Import a sample dataset and champion model\n",
+        "- [x] Initialize ValidMind datasets and model objects\n",
+        "- [x] Assign model predictions to your ValidMind model objects\n",
+        "- [x] Identify and run various validation tests\n",
+        "\n",
+        "In a usual validation workflow, you would wrap up your validation testing by verifying that all the tests provided by the development team were run and reported accurately, and perhaps even propose a challenger, comparing the performance of the challenger with the running champion.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>With ValidMind, you can easily:</b></span>\n",
+        "<ul>\n",
+        "    <li>Specify all the tests you'd like to independently rerun, just like you did in the step <a href=\"#run-data-comparison-tests\" style=\"color: #DE257E;\">Run data comparison tests</a></li>\n",
+        "    <li>Evaluate the performance of a challenger against the champion, just like you did in the steps under <a href=\"#running-model-evaluation-tests\" style=\"color: #DE257E;\">Running model evaluation tests</a></li>\n",
+        "</ul>\n",
+        "</div>"
+      ],
+      "id": "293bf4ca"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc10__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your validation report."
+      ],
+      "id": "b7fe1ed3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc10_1__'></a>\n",
+        "\n",
+        "### Work with your validation report\n",
+        "\n",
+        "Now that you've logged all your test results and verified the work done by the development team, head to the ValidMind Platform to wrap up your validation report:\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
+        "\n",
+        "Include your logged test results as evidence, create risk assessment notes, add artifacts, and assess compliance, then submit your report for review when it's ready. (**Learn more:** [Preparing validation reports](https://docs.validmind.ai/guide/validation/preparing-validation-reports.html))"
+      ],
+      "id": "1e30826e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc10_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "For a more in-depth introduction to using the ValidMind Library for validation, check out our introductory validation series and the accompanying interactive training:\n",
+        "\n",
+        "- **[ValidMind for validation](https://docs.validmind.ai/developer/validmind-library.html#validation)**\n",
+        "- **[Validator Fundamentals](https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html)**\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ],
+      "id": "8511e2f8"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc11__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ],
+      "id": "58d2d5da"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "upgrade-show-c0a446ff-f26f-4ad0-839a-e92927711798"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ],
+      "id": "7e76ca12"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade package for changes to be applied."
+      ],
+      "id": "6d3e2933"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-2427447e4fe348908b3423e86473bfeb"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}
diff --git a/site/notebooks/tutorials/development/1-set_up_validmind.ipynb b/site/notebooks/tutorials/development/1-set_up_validmind.ipynb
new file mode 100644
index 0000000000..9ba5431049
--- /dev/null
+++ b/site/notebooks/tutorials/development/1-set_up_validmind.ipynb
@@ -0,0 +1,481 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# ValidMind for development 1 — Set up the ValidMind Library\n",
+        "\n",
+        "Learn how to use ValidMind for your end-to-end documentation process based on common development scenarios with our series of four introductory notebooks. This first notebook walks you through the initial setup of the ValidMind Library.\n",
+        "\n",
+        "These notebooks use a binary classification model as an example, but the same principles shown here apply to other record (model) types.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
+        "<br></br>\n",
+        "Our course tailor-made for developers new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Developer Fundamentals</b></a></div>"
+      ],
+      "id": "3bd9bc41"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Introduction](#toc1__)    \n",
+        "- [About ValidMind](#toc2__)    \n",
+        "  - [Before you begin](#toc2_1__)    \n",
+        "  - [New to ValidMind?](#toc2_2__)    \n",
+        "  - [Key concepts](#toc2_3__)    \n",
+        "- [Setting up](#toc3__)    \n",
+        "  - [Install the ValidMind Library](#toc3_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc3_2__)    \n",
+        "    - [Register sample model](#toc3_2_1__)    \n",
+        "    - [Apply documentation template](#toc3_2_2__)    \n",
+        "    - [Get your code snippet](#toc3_2_3__)    \n",
+        "- [Getting to know ValidMind](#toc4__)    \n",
+        "  - [Preview the documentation template](#toc4_1__)    \n",
+        "    - [View documentation in the ValidMind Platform](#toc4_1_1__)    \n",
+        "  - [Explore available tests](#toc4_2__)    \n",
+        "- [Upgrade ValidMind](#toc5__)    \n",
+        "- [In summary](#toc6__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Start the development process](#toc7_1__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "b4b7c002"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Introduction\n",
+        "\n",
+        "Development aims to produce a fit-for-purpose *champion* by conducting thorough testing and analysis, supporting the capabilities of the champion with evidence in the form of documentation and test results. Documentation should be clear and comprehensive, ideally following a structure or template covering all aspects of compliance with risk regulation.\n",
+        "\n",
+        "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
+        "\n",
+        "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
+        "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
+      ],
+      "id": "7b7de259"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models. \n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators."
+      ],
+      "id": "b68b9958"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ],
+      "id": "3b520a7e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ],
+      "id": "9b3108db"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "f97d4266"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "bf5cd6c2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ],
+      "id": "95bf9e4b"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "827eb6bd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library\n",
+        "\n",
+        "The ValidMind Library provides a rich collection of documentation tools and test suites, from documenting descriptions of datasets to validation and testing using a variety of open-source testing frameworks."
+      ],
+      "id": "ad74254d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ],
+      "id": "a48cd34d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "8ad7e39a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "3339f683"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "a58d951f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Getting to know ValidMind"
+      ],
+      "id": "61a021f3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ],
+      "id": "852db20d"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "819a40bc"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1_1__'></a>\n",
+        "\n",
+        "#### View documentation in the ValidMind Platform\n",
+        "\n",
+        "Next, let's head to the ValidMind Platform to see the template in action:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this \"ValidMind for development\" series of notebooks.\n",
+        "\n",
+        "3. Click **Development** under Documents for your model and note how the structure of the documentation matches our preview above."
+      ],
+      "id": "65ed2873"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Explore available tests\n",
+        "\n",
+        "Next, let's explore the list of all available tests in the ValidMind Library with [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) — we'll learn how to run tests shortly. \n",
+        "\n",
+        "You can see that the documentation template for this model has references to some of the **test `ID`s used to run tests listed below:**"
+      ],
+      "id": "cdbb94d2"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "7ccc7776"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ],
+      "id": "786f0d9c"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "f5d3216d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ],
+      "id": "d2010ad4"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for changes to be applied."
+      ],
+      "id": "b637c5c6"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this first notebook, you learned how to:\n",
+        "\n",
+        "- [x] Register a record (model) within the ValidMind Platform\n",
+        "- [x] Install and initialize the ValidMind Library\n",
+        "- [x] Preview the documentation template for your model\n",
+        "- [x] Explore the available tests offered by the ValidMind Library"
+      ],
+      "id": "dfef8925"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps"
+      ],
+      "id": "186bee4f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Start the development process\n",
+        "\n",
+        "Now that the ValidMind Library is connected to your model in the ValidMind Platform with the correct template applied, we can go ahead and start the development process: **[2 — Start the development process](2-start_development_process.ipynb)**"
+      ],
+      "id": "7dbb07a1"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-63fcb66be39b42d38ad874a72a66581b"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}
diff --git a/site/notebooks/tutorials/model_development/2-start_development_process.ipynb b/site/notebooks/tutorials/development/2-start_development_process.ipynb
similarity index 89%
rename from site/notebooks/tutorials/model_development/2-start_development_process.ipynb
rename to site/notebooks/tutorials/development/2-start_development_process.ipynb
index b01cb35361..4016e2a97a 100644
--- a/site/notebooks/tutorials/model_development/2-start_development_process.ipynb
+++ b/site/notebooks/tutorials/development/2-start_development_process.ipynb
@@ -4,17 +4,17 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "# ValidMind for model development 2 — Start the model development process\n",
+    "# ValidMind for development 2 — Start the development process\n",
     "\n",
-    "Learn how to use ValidMind for your end-to-end model documentation process with our series of four introductory notebooks. In this second notebook, you'll run tests and investigate results, then add the results or evidence to your documentation.\n",
+    "Learn how to use ValidMind for your end-to-end documentation process with our series of four introductory notebooks. In this second notebook, you'll run tests and investigate results, then add the results or evidence to your documentation.\n",
     "\n",
-    "You'll become familiar with the individual tests available in ValidMind, as well as how to run them and change parameters as necessary. Using ValidMind's repository of individual tests as building blocks helps you ensure that a model is being built appropriately. \n",
+    "You'll become familiar with the individual tests available in ValidMind, as well as how to run them and change parameters as necessary. Using ValidMind's repository of individual tests as building blocks helps you ensure that a record (model) is being built appropriately.\n",
     "\n",
-    "**For a full list of out-of-the-box tests,** refer to our [Test descriptions](https://docs.validmind.ai/developer/model-testing/test-descriptions.html) or try the interactive [Test sandbox](https://docs.validmind.ai/developer/model-testing/test-sandbox.html).\n",
+    "**For a full list of out-of-the-box tests and descriptions,** use the interactive [ValidMind test sandbox](https://docs.validmind.ai/developer/how-to/test-sandbox.html).\n",
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
     "<br></br>\n",
-    "Our course tailor-made for developers new to ValidMind combines this series of notebooks with more a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Developer Fundamentals</b></a></div>"
+    "Our course tailor-made for developers new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Developer Fundamentals</b></a></div>\n"
    ]
   },
   {
@@ -29,24 +29,25 @@
     "  - [Import sample dataset](#toc2_2__)    \n",
     "  - [Identify qualitative tests](#toc2_3__)    \n",
     "  - [Initialize the ValidMind dataset](#toc2_4__)    \n",
-    "- [Running tests](#toc3__)    \n",
+    "- [Running tests on datasets](#toc3__)    \n",
     "  - [Run tabular data tests](#toc3_1__)    \n",
     "  - [Utilize test output](#toc3_2__)    \n",
     "- [Documenting test results](#toc4__)    \n",
     "  - [Run and log multiple tests](#toc4_1__)    \n",
     "  - [Run and log an individual test](#toc4_2__)    \n",
-    "    - [Add individual test results to model documentation](#toc4_2_1__)    \n",
-    "- [Model testing](#toc5__)    \n",
+    "    - [Add individual test results to documentation](#toc4_2_1__)    \n",
+    "- [Running model evaluation tests](#toc5__)    \n",
     "  - [Train simple logistic regression model](#toc5_1__)    \n",
-    "  - [Initialize model evaluation objects](#toc5_2__)    \n",
-    "  - [Assign predictions](#toc5_3__)    \n",
+    "  - [Initialize ValidMind datasets](#toc5_2__)    \n",
+    "  - [Initialize a ValidMind model](#toc5_3__)    \n",
+    "    - [Assign predictions](#toc5_3_1__)    \n",
     "  - [Run the model evaluation tests](#toc5_4__)    \n",
     "- [In summary](#toc6__)    \n",
     "- [Next steps](#toc7__)    \n",
     "  - [Integrate custom tests](#toc7_1__)    \n",
     "\n",
     ":::\n",
-    "<!-- jn-toc-notebook-configgs \n",
+    "<!-- jn-toc-notebook-config\n",
     "\tnumbering=false\n",
     "\tanchor=true\n",
     "\tflat=false\n",
@@ -64,7 +65,7 @@
     "\n",
     "## Prerequisites\n",
     "\n",
-    "In order to log test results or evidence to your model documentation with this notebook, you'll need to first have:\n",
+    "In order to log test results or evidence to your documentation with this notebook, you'll need to first have:\n",
     "\n",
     "- [x] Registered a model within the ValidMind Platform with a predefined documentation template\n",
     "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
@@ -94,8 +95,10 @@
     "First, let's connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -258,7 +261,7 @@
    "source": [
     "<a id='toc3__'></a>\n",
     "\n",
-    "## Running tests\n",
+    "## Running tests on datasets\n",
     "\n",
     "Now that we know how to initialize a ValidMind `dataset` object, we're ready to run some tests!\n",
     "\n",
@@ -276,9 +279,9 @@
     "\n",
     "### Run tabular data tests\n",
     "\n",
-    "The inputs expected by a test can also be found in the test definition — let's take [`validmind.data_validation.DescriptiveStatistics`](https://docs.validmind.ai/tests/data_validation/DescriptiveStatistics.html) as an example.\n",
+    "The inputs expected by a test can also be found in the test definition — let's take `validmind.data_validation.DescriptiveStatistics` as an example.\n",
     "\n",
-    "Note that the output of the [`describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) below shows that this test expects a `dataset` as input:"
+    "Note that the output of the [`describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) below shows that this test expects a `dataset` as input:\n"
    ]
   },
   {
@@ -326,9 +329,9 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "The output above shows that [the class imbalance test](https://docs.validmind.ai/tests/data_validation/ClassImbalance.html) did not pass according to the value we set for `min_percent_threshold`.\n",
+    "The output above shows that the `validmind.data_validation.ClassImbalance` test did not pass according to the value we set for `min_percent_threshold`.\n",
     "\n",
-    "To address this issue, we'll re-run the test on some processed data. In this case let's apply a very simple rebalancing technique to the dataset:"
+    "To address this issue, we'll re-run the test on some processed data. In this case let's apply a very simple rebalancing technique to the dataset:\n"
    ]
   },
   {
@@ -398,7 +401,7 @@
     "\n",
     "Below we demonstrate how to retrieve the list of features with the highest correlation coefficients and use them to reduce the final list of features for modeling.\n",
     "\n",
-    "First, we'll run [`validmind.data_validation.HighPearsonCorrelation`](https://docs.validmind.ai/tests/data_validation/HighPearsonCorrelation.html) with the `balanced_raw_dataset` we initialized previously as input as is for comparison with later runs:"
+    "First, we'll run `validmind.data_validation.HighPearsonCorrelation` with the `balanced_raw_dataset` we initialized previously as input as is for comparison with later runs:\n"
    ]
   },
   {
@@ -574,9 +577,9 @@
     "Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform:\n",
     "\n",
     "- When using `run_documentation_tests()`, documentation sections will be automatically populated with the results of all tests registered in the documentation template.\n",
-    "- When logging individual test results to the platform, you'll need to manually add those results to the desired section of the model documentation.\n",
+    "- When logging individual test results to the platform, you'll need to manually add those results to the desired section of the documentation.\n",
     "\n",
-    "To demonstrate how to add test results to your model documentation, we'll populate the entire **Data Preparation** section of the documentation using the clean `vm_raw_dataset_preprocessed` dataset as input, and then document an additional individual result for the highly correlated dataset `vm_balanced_raw_dataset`."
+    "To demonstrate how to add test results to your documentation, we'll populate the entire **Data Preparation** section of the documentation using the clean `vm_raw_dataset_preprocessed` dataset as input, and then document an additional individual result for the highly correlated dataset `vm_balanced_raw_dataset`."
    ]
   },
   {
@@ -661,7 +664,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for this particular test ID. </b></span>\n",
+    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for this particular test ID. </b></span>\n",
     "<br></br>\n",
     "That's expected, as when we run individual tests the results logged need to be manually added to your documentation within the ValidMind Platform.</div>"
    ]
@@ -672,9 +675,9 @@
    "source": [
     "<a id='toc4_2_1__'></a>\n",
     "\n",
-    "#### Add individual test results to model documentation\n",
+    "#### Add individual test results to documentation\n",
     "\n",
-    "With the test results logged, let's head to the model we connected to at the beginning of this notebook and insert our test results into the documentation ([Need more help?](https://docs.validmind.ai/developer/model-documentation/work-with-test-results.html)):\n",
+    "With the test results logged, let's head to the model we connected to at the beginning of this notebook and insert our test results into the documentation (**Learn more:** [Work with test results](https://docs.validmind.ai/guide/documentation/work-with-test-results.html)):\n",
     "\n",
     "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
     "\n",
@@ -713,7 +716,7 @@
    "source": [
     "<a id='toc5__'></a>\n",
     "\n",
-    "## Model testing\n",
+    "## Running model evaluation tests\n",
     "\n",
     "So far, we've focused on the data assessment and pre-processing that usually occurs prior to any models being built. Now, let's instead assume we have already built a model and we want to incorporate some model results into our documentation."
    ]
@@ -830,7 +833,7 @@
    "source": [
     "<a id='toc5_2__'></a>\n",
     "\n",
-    "### Initialize model evaluation objects\n",
+    "### Initialize ValidMind datasets\n",
     "\n",
     "The last step for evaluating the model's performance is to initialize the ValidMind `Dataset` and `Model` objects in preparation for assigning model predictions to each dataset."
    ]
@@ -859,9 +862,16 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
+    "<a id='toc5_3__'></a>\n",
+    "\n",
+    "### Initialize a ValidMind model\n",
+    "\n",
     "You'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our three models.\n",
     "\n",
-    "You simply initialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+    "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+    "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+    "\n",
+    "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
    ]
   },
   {
@@ -878,11 +888,11 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "<a id='toc5_3__'></a>\n",
+    "<a id='toc5_3_1__'></a>\n",
     "\n",
-    "### Assign predictions\n",
+    "#### Assign predictions\n",
     "\n",
-    "Once the model has been registered you can assign model predictions to the training and testing datasets.\n",
+    "Once the model has been registered you can assign predictions to the training and testing datasets.\n",
     "\n",
     "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
     "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
@@ -908,10 +918,10 @@
     "\n",
     "### Run the model evaluation tests\n",
     "\n",
-    "In this next example, we'll focus on running the tests within the Model Development section of the model documentation. Only tests associated with this section will be executed, and the corresponding results will be updated in the model documentation.\n",
+    "In this next example, we'll focus on running the tests within the Model Development section of the documentation. Only tests associated with this section will be executed, and the corresponding results will be updated in the documentation.\n",
     "\n",
     "- Note the additional config that is passed to `run_documentation_tests()` — this allows you to override `inputs` or `params` in certain tests.\n",
-    "- In our case, we want to explicitly use the `vm_train_ds` for the [`validmind.model_validation.sklearn.ClassifierPerformance:in_sample` test](https://docs.validmind.ai/tests/model_validation/sklearn/ClassifierPerformance.html), since it's supposed to run on the training dataset and not the test dataset."
+    "- In our case, we want to explicitly use the `vm_train_ds` for the `validmind.model_validation.sklearn.ClassifierPerformance:in_sample` test, since it's supposed to run on the training dataset and not the test dataset.\n"
    ]
   },
   {
@@ -959,7 +969,7 @@
     "- [x] Utilize the output from tests you've run\n",
     "- [x] Log test results from sets of or individual tests as evidence to the ValidMind Platform\n",
     "- [x] Add supplementary individual test results to your documentation\n",
-    "- [x] Assign model predictions to your ValidMind model objects"
+    "- [x] Assign predictions to your ValidMind model objects"
    ]
   },
   {
@@ -979,12 +989,12 @@
     "\n",
     "### Integrate custom tests\n",
     "\n",
-    "Now that you're familiar with the basics of using the ValidMind Library to run and log tests to provide evidence for your model documentation, let's learn how to incorporate your own custom tests into ValidMind: **[3 — Integrate custom tests](3-integrate_custom_tests.ipynb)**"
+    "Now that you're familiar with the basics of using the ValidMind Library to run and log tests to provide evidence for your documentation, let's learn how to incorporate your own custom tests into ValidMind: **[3 — Integrate custom tests](3-integrate_custom_tests.ipynb)**"
    ]
   },
   {
    "cell_type": "markdown",
-   "id": "copyright-b0df0754a7a74581809f22d50b198597",
+   "id": "copyright-f012d0fd2e1f44e38b70b6ad06ae0e67",
    "metadata": {},
    "source": [
     "<!-- VALIDMIND COPYRIGHT -->\n",
diff --git a/site/notebooks/EXECUTED/model_development/3-integrate_custom_tests.ipynb b/site/notebooks/tutorials/development/3-integrate_custom_tests.ipynb
similarity index 95%
rename from site/notebooks/EXECUTED/model_development/3-integrate_custom_tests.ipynb
rename to site/notebooks/tutorials/development/3-integrate_custom_tests.ipynb
index b4b990346b..7f32f3e454 100644
--- a/site/notebooks/EXECUTED/model_development/3-integrate_custom_tests.ipynb
+++ b/site/notebooks/tutorials/development/3-integrate_custom_tests.ipynb
@@ -4,14 +4,14 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "# ValidMind for model development 3 — Integrate custom tests\n",
+    "# ValidMind for development 3 — Integrate custom tests\n",
     "\n",
-    "Learn how to use ValidMind for your end-to-end model documentation process with our series of four introductory notebooks. In this third notebook, supplement ValidMind tests with your own and include them as additional evidence in your documentation.\n",
+    "Learn how to use ValidMind for your end-to-end documentation process with our series of four introductory notebooks. In this third notebook, supplement ValidMind tests with your own and include them as additional evidence in your documentation.\n",
     "\n",
     "This notebook assumes that you already have a repository of custom made tests considered critical to include in your documentation. A custom test is any function that takes a set of inputs and parameters as arguments and returns one or more outputs:\n",
     "\n",
     "- The function can be as simple or as complex as you need it to be — it can use external libraries, make API calls, or do anything else that you can do in Python.\n",
-    "- The only requirement is that the function signature and return values can be \"understood\" and handled by the ValidMind Library. As such, custom tests offer added flexibility by extending the default tests provided by ValidMind, enabling you to document any type of model or use case.\n",
+    "- The only requirement is that the function signature and return values can be \"understood\" and handled by the ValidMind Library. As such, custom tests offer added flexibility by extending the default tests provided by ValidMind, enabling you to document any type of record (model) or use case.\n",
     "\n",
     "**For a more in-depth introduction to custom tests,** refer to our [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb) notebook.\n",
     "\n",
@@ -69,7 +69,7 @@
     "\n",
     "## Prerequisites\n",
     "\n",
-    "In order to integrate custom tests with your model documentation with this notebook, you'll need to first have:\n",
+    "In order to integrate custom tests into your documentation using this notebook, you'll need to first have:\n",
     "\n",
     "- [x] Registered a model within the ValidMind Platform with a predefined documentation template\n",
     "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
@@ -82,7 +82,7 @@
     "Refer to the first two notebooks in this series:\n",
     "\n",
     "- <a href=\"1-set_up_validmind.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library</b></a>\n",
-    "- <a href=\"2-start_development_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the model development process</b></a>\n",
+    "- <a href=\"2-start_development_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the development process</b></a>\n",
     "\n",
     "</div>\n"
    ]
@@ -95,7 +95,7 @@
     "\n",
     "## Setting up\n",
     "\n",
-    "This section should be quite familiar to you — as we performed the same actions in the previous notebook, **[2 — Start the model development process](2-start_development_process.ipynb)**."
+    "This section should be quite familiar to you — as we performed the same actions in the previous notebook, **[2 — Start the development process](2-start_development_process.ipynb)**."
    ]
   },
   {
@@ -109,8 +109,10 @@
     "As usual, let's first connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -385,7 +387,7 @@
     "\n",
     "#### Initialize the ValidMind objects\n",
     "\n",
-    "Let's initialize the ValidMind `Dataset` and `Model` objects in preparation for assigning model predictions to each dataset:"
+    "Let's initialize the ValidMind `Dataset` and `Model` objects in preparation for assigning predictions to each dataset:"
    ]
   },
   {
@@ -394,7 +396,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "# Initialize the datasets into their own dataset objects\n",
+    "# Initialize the datasets into their own ValidMind dataset objects\n",
     "vm_train_ds = vm.init_dataset(\n",
     "    input_id=\"train_dataset_final\",\n",
     "    dataset=train_df,\n",
@@ -407,7 +409,7 @@
     "    target_column=\"Exited\",\n",
     ")\n",
     "\n",
-    "# Initialize a model object\n",
+    "# Initialize the ValidMind model object\n",
     "vm_model = vm.init_model(log_reg, input_id=\"log_reg_model_v1\")"
    ]
   },
@@ -487,7 +489,7 @@
     "\n",
     "- The function `confusion_matrix` takes two arguments `dataset` and `model`. This is a `VMDataset` and `VMModel` object respectively.\n",
     "  - `VMDataset` objects allow you to access the dataset's true (target) values by accessing the `.y` attribute.\n",
-    "  - `VMDataset` objects allow you to access the predictions for a given model by accessing the `.y_pred()` method.\n",
+    "  - `VMDataset` objects allow you to access the predictions for a given record (model) by accessing the `.y_pred()` method.\n",
     "- The function docstring provides a description of what the test does. This will be displayed along with the result in this notebook as well as in the ValidMind Platform.\n",
     "- The function body calculates the confusion matrix using the `sklearn.metrics.confusion_matrix` function as we just did above.\n",
     "- The function then returns the `ConfusionMatrixDisplay.figure_` object — this is important as the ValidMind Library expects the output of the custom test to be a plot or a table.\n",
@@ -672,7 +674,7 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for this particular test ID. </b></span>\n",
+    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for this particular test ID. </b></span>\n",
     "<br></br>\n",
     "That's expected, as when we run individual tests the results logged need to be manually added to your documentation within the ValidMind Platform.</div>"
    ]
@@ -685,7 +687,7 @@
     "\n",
     "## Using external test providers\n",
     "\n",
-    "Creating inline custom tests with a function is a great way to customize your model documentation. However, sometimes you may want to reuse the same set of tests across multiple models and share them with others in your organization. In this case, you can create an external custom *test provider* that will allow you to load custom tests from a local folder or a Git repository.\n",
+    "Creating inline custom tests with a function is a great way to customize your documentation. However, sometimes you may want to reuse the same set of tests across multiple records (models) and share them with others in your organization. In this case, you can create an external custom *test provider* that will allow you to load custom tests from a local folder or a Git repository.\n",
     "\n",
     "In this section you will learn how to declare a local filesystem test provider that allows loading tests from a local folder following these high level steps:\n",
     "\n",
@@ -738,7 +740,7 @@
     "After running the command above, confirm that a new `my_tests` directory was created successfully. For example:\n",
     "\n",
     "```\n",
-    "~/notebooks/tutorials/model_development/my_tests/\n",
+    "~/notebooks/tutorials/development/my_tests/\n",
     "```"
    ]
   },
@@ -901,7 +903,7 @@
     "\n",
     "## Add test results to documentation\n",
     "\n",
-    "With our custom tests run and results logged to the ValidMind Platform, let's head to the model we connected to at the beginning of this notebook and insert our test results into the documentation ([Need more help?](https://docs.validmind.ai/developer/model-documentation/work-with-test-results.html)):\n",
+    "With our custom tests run and results logged to the ValidMind Platform, let's head to the model we connected to at the beginning of this notebook and insert our test results into the documentation (**Learn more:** [Work with test results](https://docs.validmind.ai/guide/documentation/work-with-test-results.html)):\n",
     "\n",
     "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
     "\n",
diff --git a/site/notebooks/EXECUTED/model_development/4-finalize_testing_documentation.ipynb b/site/notebooks/tutorials/development/4-finalize_testing_documentation.ipynb
similarity index 88%
rename from site/notebooks/EXECUTED/model_development/4-finalize_testing_documentation.ipynb
rename to site/notebooks/tutorials/development/4-finalize_testing_documentation.ipynb
index 086ccc2029..0dbc8d3be1 100644
--- a/site/notebooks/EXECUTED/model_development/4-finalize_testing_documentation.ipynb
+++ b/site/notebooks/tutorials/development/4-finalize_testing_documentation.ipynb
@@ -4,11 +4,11 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "# ValidMind for model development 4 — Finalize testing and documentation\n",
+    "# ValidMind for development 4 — Finalize testing and documentation\n",
     "\n",
-    "Learn how to use ValidMind for your end-to-end model documentation process with our introductory notebook series. In this last notebook, finalize the testing and documentation of your model and have a fully documented sample model ready for review.\n",
+    "Learn how to use ValidMind for your end-to-end documentation process with our introductory notebook series. In this last notebook, finalize the testing and documentation of your model and have a fully documented sample model ready for review.\n",
     "\n",
-    "We'll first use [`run_documentation_tests()`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests) previously covered in **[2 — Start the model development process](2-start_development_process.ipynb)** to ensure that your custom test results generated in **[3 — Integrate custom tests](3-integrate_custom_tests.ipynb)** are included in your documentation. Then, we'll view and update the configuration for the entire model documentation template to suit your needs.\n",
+    "We'll first use [`run_documentation_tests()`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests) previously covered in **[2 — Start the development process](2-start_development_process.ipynb)** to ensure that your custom test results generated in **[3 — Integrate custom tests](3-integrate_custom_tests.ipynb)** are included in your documentation. Then, we'll view and update the configuration for the entire documentation template to suit your needs.\n",
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
     "<br></br>\n",
@@ -34,11 +34,12 @@
     "    - [Add a local test provider](#toc2_4_2__)    \n",
     "- [Reconnect to ValidMind](#toc3__)    \n",
     "- [Include custom test results](#toc4__)    \n",
-    "- [Documentation template configuration](#toc5__)    \n",
-    "  - [Update the config](#toc5_1__)    \n",
+    "- [Configuring documentation template tests](#toc5__)    \n",
+    "  - [Preview test configuration](#toc5_1__)    \n",
+    "  - [Run updated documentation section tests](#toc5_2__)    \n",
     "- [In summary](#toc6__)    \n",
     "- [Next steps](#toc7__)    \n",
-    "  - [Work with your model documentation](#toc7_1__)    \n",
+    "  - [Work with your documentation](#toc7_1__)    \n",
     "  - [Learn more](#toc7_2__)    \n",
     "    - [Use cases](#toc7_2_1__)    \n",
     "    - [Discover more learning resources](#toc7_2_2__)    \n",
@@ -78,7 +79,7 @@
     "Refer to the first three notebooks in this series:\n",
     "\n",
     "- <a href=\"1-set_up_validmind.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library</b></a>\n",
-    "- <a href=\"2-start_development_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the model development process</b></a>\n",
+    "- <a href=\"2-start_development_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the development process</b></a>\n",
     "- <a href=\"3-integrate_custom_tests.ipynb\" style=\"color: #DE257E;\"><b>3 — Integrate custom tests</b></a>\n",
     "\n",
     "</div>"
@@ -106,8 +107,10 @@
     "As usual, let's first connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -391,7 +394,7 @@
    "metadata": {},
    "outputs": [],
    "source": [
-    "# Initialize the datasets into their own dataset objects\n",
+    "# Initialize the datasets into their own ValidMind dataset objects\n",
     "vm_train_ds = vm.init_dataset(\n",
     "    input_id=\"train_dataset_final\",\n",
     "    dataset=train_df,\n",
@@ -404,7 +407,7 @@
     "    target_column=\"Exited\",\n",
     ")\n",
     "\n",
-    "# Initialize a model object\n",
+    "# Initialize the ValidMind model object\n",
     "vm_model = vm.init_model(log_reg, input_id=\"log_reg_model_v1\")"
    ]
   },
@@ -637,7 +640,7 @@
     "\n",
     "Let's run all tests in the Model Evaluation section of the documentation. Note that we have been running the sample custom confusion matrix with `normalize=True` to demonstrate the ability to provide custom parameters.\n",
     "\n",
-    "In the **Run the model evaluation tests** section of **[2 — Start the model development process](2-start_development_process.ipynb)**, you learned how to assign inputs to individual tests with [`run_documentation_tests()`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests). Assigning parameters is similar, you only need to provide assign a `params` dictionary to a given test ID, `my_test_provider.ConfusionMatrix` in this case."
+    "In the **Run the model evaluation tests** section of **[2 — Start the development process](2-start_development_process.ipynb)**, you learned how to assign inputs to individual tests with [`run_documentation_tests()`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests). Assigning parameters is similar: you only need to assign a `params` dictionary to a given test ID, `my_test_provider.ConfusionMatrix` in this case."
    ]
   },
   {
@@ -678,7 +681,7 @@
    "source": [
     "<a id='toc5__'></a>\n",
     "\n",
-    "## Documentation template configuration\n",
+    "## Configuring documentation template tests\n",
     "\n",
     "Let's call the utility function [`vm.get_test_suite().get_default_config()`](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestSuite.get_default_config) which will return the **default configuration for the entire documentation template as a dictionary:**\n",
     "\n",
@@ -706,11 +709,11 @@
    "source": [
     "<a id='toc5_1__'></a>\n",
     "\n",
-    "### Update the config\n",
+    "### Preview test configuration\n",
     "\n",
-    "The default config does not assign any inputs to a test, but you can assign inputs to individual tests as needed depending on the datasets and models you want to pass to individual tests.\n",
+    "The default config does not assign any inputs to a test, but you can assign inputs to individual tests as needed depending on the datasets and records (models) you want to pass to individual tests.\n",
     "\n",
-    "For this particular documentation template (binary classification), the ValidMind Library provides a sample configuration that can be used to populate the entire model documentation using the following inputs as placeholders:\n",
+    "For this particular documentation template (binary classification), the ValidMind Library provides a sample configuration that can be used to populate the entire documentation using the following inputs as placeholders:\n",
     "\n",
     "- A **`raw_dataset`** raw dataset\n",
     "- A **`train_dataset`** training dataset\n",
@@ -739,7 +742,11 @@
    "cell_type": "markdown",
    "metadata": {},
    "source": [
-    "Using this sample configuration, let's finish populating model documentation by running all tests for the Model Development section of the documentation.\n",
+    "<a id='toc5_2__'></a>\n",
+    "\n",
+    "### Run updated documentation section tests\n",
+    "\n",
+    "Using this sample configuration, let's finish populating your documentation by running all tests for the Model Development section of the documentation.\n",
     "\n",
     "Recall that the training and test datasets in our exercise have the following `input_id` values:\n",
     "\n",
@@ -863,13 +870,13 @@
     "In this final notebook, you learned how to:\n",
     "\n",
     "- [x] Refresh the connection from the ValidMind Library to the ValidMind Platform after you've inserted test-driven blocks to your documentation\n",
-    "- [x] Include custom test results in your model documentation\n",
-    "- [x] View and configure the configuration for your model documentation template\n",
+    "- [x] Include custom test results in your documentation\n",
+    "- [x] View and update the configuration for your documentation template\n",
     "\n",
-    "With our ValidMind for model development series of notebooks, you learned how to document a model end-to-end with the ValidMind Library by running through some common scenarios in a typical model development setting:\n",
+    "With our ValidMind for development series of notebooks, you learned how to document a record (model) end-to-end with the ValidMind Library by running through some common scenarios in a typical development setting:\n",
     "\n",
     "- Running out-of-the-box tests\n",
-    "- Documenting your model by adding evidence to model documentation\n",
+    "- Documenting your record (model) by adding evidence to documentation\n",
     "- Extending the capabilities of the ValidMind Library by implementing custom tests\n",
     "- Ensuring that the documentation is complete by running all tests in the documentation template"
    ]
@@ -889,21 +896,21 @@
    "source": [
     "<a id='toc7_1__'></a>\n",
     "\n",
-    "### Work with your model documentation\n",
+    "### Work with your documentation\n",
     "\n",
-    "Now that you've logged all your test results and generated a draft for your model documentation, head to the ValidMind Platform to wrap up your model documentation. Continue to work on your model documentation by:\n",
+    "Now that you've logged all your test results and generated a draft for your documentation, head to the ValidMind Platform to wrap up your documentation. Continue to work on your documentation by:\n",
     "\n",
     "- **Run and log more tests:** Use the skills you learned in this series of notebooks to run and log more individual tests, including custom tests, then insert them into your documentation as supplementary evidence. (Learn more: [`validmind.tests`](https://docs.validmind.ai/validmind/validmind/tests.html))\n",
     "\n",
-    "- **Inserting additional test results:** Add **Test-Driven Blocks** under any relevant section of your model documentation. (Learn more: [Work with test results](https://docs.validmind.ai/guide/model-documentation/work-with-test-results.html))\n",
+    "- **Inserting additional test results:** Add **Test-Driven Blocks** under any relevant section of your documentation. (Learn more: [Work with test results](https://docs.validmind.ai/guide/documentation/work-with-test-results.html))\n",
     "\n",
-    "- **Making qualitative edits to your test descriptions:** Click on the description of any inserted test results to review and edit the ValidMind-generated test descriptions for quality and accuracy. (Learn more: [Working with model documentation](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html#add-or-edit-documentation))\n",
+    "- **Making qualitative edits to your test descriptions:** Click on the description of any inserted test results to review and edit the ValidMind-generated test descriptions for quality and accuracy. (Learn more: [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html#add-or-edit-documentation))\n",
     "\n",
-    "- **View guidelines:** In any section of your model documentation, click **​ValidMind Insights** in the top right corner to reveal the Documentation Guidelines for each section to help guide the contents of your model documentation. (Learn more: [View documentation guidelines](https://docs.validmind.ai/guide/model-documentation/view-documentation-guidelines.html))\n",
+    "- **View guidelines:** In any section of your documentation, click **ValidMind Insights** in the top right corner to reveal the Documentation Guidelines for each section to help guide the contents of your documentation. (Learn more: [View development guidelines](https://docs.validmind.ai/guide/documentation/view-development-guidelines.html))\n",
     "\n",
-    "- **Collaborate with other stakeholders:** Use the ValidMind Platform's real-time collaborative features to work seamlessly together with the rest of your organization, including model validators. Review suggested changes in your content blocks, work with versioned history, and use comments to discuss specific portions of your model documentation. (Learn more: [Collaborate with others](https://docs.validmind.ai/guide/model-documentation/collaborate-with-others.html))\n",
+    "- **Collaborate with other stakeholders:** Use the ValidMind Platform's real-time collaborative features to work seamlessly together with the rest of your organization, including validators. Review suggested changes in your content blocks, work with versioned history, and use comments to discuss specific portions of your documentation. (Learn more: [Collaborate with others](https://docs.validmind.ai/guide/documentation/collaborate-with-others.html))\n",
     "\n",
-    "When your model documentation is complete and ready for review, submit it for approval from the same ValidMind Platform where you made your edits and collaborated with the rest of your organization, ensuring transparency and a thorough model development history. (Learn more: [Submit for approval](https://docs.validmind.ai/guide/model-documentation/submit-for-approval.html))"
+    "When your documentation is complete and ready for review, submit it for approval from the same ValidMind Platform where you made your edits and collaborated with the rest of your organization, ensuring transparency and a thorough development history. (Learn more: [Submit documents](https://docs.validmind.ai/guide/documentation/submit-documents.html))"
    ]
   },
   {
@@ -914,7 +921,7 @@
     "\n",
     "### Learn more\n",
     "\n",
-    "Now that you're familiar with the basics, you can explore the following notebooks to get a deeper understanding on how the ValidMind Library allows you generate model documentation for any use case:"
+    "Now that you're familiar with the basics, you can explore the following notebooks to get a deeper understanding of how the ValidMind Library allows you to generate documentation for any use case:"
    ]
   },
   {
@@ -941,7 +948,7 @@
     "Learn more about the ValidMind Library tools we used in this notebook:\n",
     "\n",
     "- [Explore tests](../../how_to/tests/explore_tests/explore_tests.ipynb)\n",
-    "- [Run dataset-based tests](../../how_to/tests/run_tests/1_run_dataset_based_tests.ipynb)\n",
+    "- [Run dataset-based tests](../../how_to/tests/run_tests/1-run_dataset-based_tests.ipynb)\n",
     "- [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb)\n",
     "- [Integrate external test providers](../../how_to/tests/custom_tests/integrate_external_test_providers.ipynb)\n",
     "- [Configure dataset features](../../how_to/data_and_datasets/dataset_inputs/configure_dataset_features.ipynb)\n",
@@ -950,14 +957,14 @@
     "\n",
     "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
     "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
+    "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
     "\n",
     "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
    ]
   },
   {
    "cell_type": "markdown",
-   "id": "copyright-2efae7bbb0f74bd5abe37252cd48b951",
+   "id": "copyright-9be88159d1f24db999931c13536a491c",
    "metadata": {},
    "source": [
     "<!-- VALIDMIND COPYRIGHT -->\n",
diff --git a/site/notebooks/tutorials/model_development/add-content-block.gif b/site/notebooks/tutorials/development/add-content-block.gif
similarity index 100%
rename from site/notebooks/tutorials/model_development/add-content-block.gif
rename to site/notebooks/tutorials/development/add-content-block.gif
diff --git a/site/notebooks/tutorials/model_development/high-pearson-correlation-block.png b/site/notebooks/tutorials/development/high-pearson-correlation-block.png
similarity index 100%
rename from site/notebooks/tutorials/model_development/high-pearson-correlation-block.png
rename to site/notebooks/tutorials/development/high-pearson-correlation-block.png
diff --git a/site/notebooks/tutorials/model_development/selecting-confusion-matrix-test.png b/site/notebooks/tutorials/development/selecting-confusion-matrix-test.png
similarity index 100%
rename from site/notebooks/tutorials/model_development/selecting-confusion-matrix-test.png
rename to site/notebooks/tutorials/development/selecting-confusion-matrix-test.png
diff --git a/site/notebooks/tutorials/model_development/selecting-high-pearson-correlation-test.png b/site/notebooks/tutorials/development/selecting-high-pearson-correlation-test.png
similarity index 100%
rename from site/notebooks/tutorials/model_development/selecting-high-pearson-correlation-test.png
rename to site/notebooks/tutorials/development/selecting-high-pearson-correlation-test.png
diff --git a/site/notebooks/tutorials/model_development/1-set_up_validmind.ipynb b/site/notebooks/tutorials/model_development/1-set_up_validmind.ipynb
deleted file mode 100644
index 4244924b9a..0000000000
--- a/site/notebooks/tutorials/model_development/1-set_up_validmind.ipynb
+++ /dev/null
@@ -1,471 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "06993494",
-   "metadata": {},
-   "source": [
-    "# ValidMind for model development 1 — Set up the ValidMind Library\n",
-    "\n",
-    "Learn how to use ValidMind for your end-to-end model documentation process based on common model development scenarios with our series of four introductory notebooks. This first notebook walks you through the initial setup of the ValidMind Library.\n",
-    "\n",
-    "These notebooks use a binary classification model as an example, but the same principles shown here apply to other model types.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
-    "<br></br>\n",
-    "Our course tailor-made for developers new to ValidMind combines this series of notebooks with more a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/developer-fundamentals/developer-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Developer Fundamentals</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5269a388",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Introduction](#toc1__)    \n",
-    "- [About ValidMind](#toc2__)    \n",
-    "  - [Before you begin](#toc2_1__)    \n",
-    "  - [New to ValidMind?](#toc2_2__)    \n",
-    "  - [Key concepts](#toc2_3__)    \n",
-    "- [Setting up](#toc3__)    \n",
-    "  - [Install the ValidMind Library](#toc3_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc3_2__)    \n",
-    "    - [Register sample model](#toc3_2_1__)    \n",
-    "    - [Apply documentation template](#toc3_2_2__)    \n",
-    "    - [Get your code snippet](#toc3_2_3__)    \n",
-    "- [Getting to know ValidMind](#toc4__)    \n",
-    "  - [Preview the documentation template](#toc4_1__)    \n",
-    "    - [View model documentation in the ValidMind Platform](#toc4_1_1__)    \n",
-    "  - [Explore available tests](#toc4_2__)    \n",
-    "- [Upgrade ValidMind](#toc5__)    \n",
-    "- [In summary](#toc6__)    \n",
-    "- [Next steps](#toc7__)    \n",
-    "  - [Start the model development process](#toc7_1__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1020f3fa",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Introduction\n",
-    "\n",
-    "Model development aims to produce a fit-for-purpose *champion model* by conducting thorough testing and analysis, supporting the capabilities of the model with evidence in the form of documentation and test results. Model documentation should be clear and comprehensive, ideally following a structure or template covering all aspects of compliance with model risk regulation.\n",
-    "\n",
-    "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
-    "\n",
-    "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
-    "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4424a3e8",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models. \n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ed8cfd11",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "353613e5",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "63912e66",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7d039206",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d6758437",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "827eb6bd",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "02f8b26f",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library\n",
-    "\n",
-    "The ValidMind Library provides a rich collection of documentation tools and test suites, from documenting descriptions of datasets to validation and testing of models using a variety of open-source testing frameworks."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "706a1004",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8ceb6261",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "acf3e1db",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "a58d951f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3e0596f8",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Getting to know ValidMind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "bcd77028",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "819a40bc",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "025a518c",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1_1__'></a>\n",
-    "\n",
-    "#### View model documentation in the ValidMind Platform\n",
-    "\n",
-    "Next, let's head to the ValidMind Platform to see the template in action:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this \"ValidMind for model development\" series of notebooks.\n",
-    "\n",
-    "3. Click **Development** under Documents for your model and note how the structure of the documentation matches our preview above."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "596d6d16",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Explore available tests\n",
-    "\n",
-    "Next, let's explore the list of all available tests in the ValidMind Library with [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) — we'll learn how to run tests shortly. \n",
-    "\n",
-    "You can see that the documentation template for this model has references to some of the **test `ID`s used to run tests listed below:**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "7ccc7776",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "30c4a1bc",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "f5d3216d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e27b286f",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "75bf527b",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b919c3a0",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this first notebook, you learned how to:\n",
-    "\n",
-    "- [x] Register a model within the ValidMind Platform\n",
-    "- [x] Install and initialize the ValidMind Library\n",
-    "- [x] Preview the documentation template for your model\n",
-    "- [x] Explore the available tests offered by the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e9c62e9d",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Next steps"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8f1a7063",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Start the model development process\n",
-    "\n",
-    "Now that the ValidMind Library is connected to your model in the ValidMind Library with the correct template applied, we can go ahead and start the model development process: **[2 — Start the model development process](2-start_development_process.ipynb)**"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-3e02e70c1d4d4840bf8d9ef44e2cf20c",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/site/notebooks/tutorials/model_validation/1-set_up_validmind_for_validation.ipynb b/site/notebooks/tutorials/model_validation/1-set_up_validmind_for_validation.ipynb
deleted file mode 100644
index 05ad11c2c3..0000000000
--- a/site/notebooks/tutorials/model_validation/1-set_up_validmind_for_validation.ipynb
+++ /dev/null
@@ -1,517 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "821a881e",
-   "metadata": {},
-   "source": [
-    "# ValidMind for model validation 1 — Set up the ValidMind Library for validation\n",
-    "\n",
-    "Learn how to use ValidMind for your end-to-end model validation process based on common scenarios with our series of four introductory notebooks. In this first notebook, set up the ValidMind Library in preparation for validating a champion model.\n",
-    "\n",
-    "These notebooks use a binary classification model as an example, but the same principles shown here apply to other model types.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
-    "<br></br>\n",
-    "Our course tailor-made for validators new to ValidMind combines this series of notebooks with more a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "19ea797c",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Introduction](#toc1__)    \n",
-    "- [About ValidMind](#toc2__)    \n",
-    "  - [Before you begin](#toc2_1__)    \n",
-    "  - [New to ValidMind?](#toc2_2__)    \n",
-    "  - [Key concepts](#toc2_3__)    \n",
-    "- [Setting up](#toc3__)    \n",
-    "  - [Register a sample model](#toc3_1__)    \n",
-    "    - [Assign validator credentials](#toc3_1_1__)    \n",
-    "    - [Apply documentation template](#toc3_1_2__)    \n",
-    "    - [Apply validation report template](#toc3_1_3__)    \n",
-    "  - [Install the ValidMind Library](#toc3_2__)    \n",
-    "  - [Initialize the ValidMind Library](#toc3_3__)    \n",
-    "    - [Get your code snippet](#toc3_3_1__)    \n",
-    "- [Getting to know ValidMind](#toc4__)    \n",
-    "  - [Preview the validation report template](#toc4_1__)    \n",
-    "    - [View validation report in the ValidMind Platform](#toc4_1_1__)    \n",
-    "  - [Explore available tests](#toc4_2__)    \n",
-    "- [Upgrade ValidMind](#toc5__)    \n",
-    "- [In summary](#toc6__)    \n",
-    "- [Next steps](#toc7__)    \n",
-    "  - [Start the model validation process](#toc7_1__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d624f88d",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Introduction\n",
-    "\n",
-    "Model validation aims to independently assess the compliance of *champion models* created by model developers with regulatory guidance by conducting thorough testing and analysis, potentially including the use of challenger models to benchmark performance. Assessments, presented in the form of a validation report, typically include *artifacts (findings)* and recommendations to address those issues.\n",
-    "\n",
-    "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
-    "\n",
-    "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
-    "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4fb1ef5a",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate comparison and other validation tests, and then use the ValidMind Platform to submit compliance assessments of champion models via comprehensive validation reports. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model developers."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "594f9fd4",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "262ed111",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0eb67fe9",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Validation report**: A comprehensive and structured assessment of a model’s development and performance, focusing on verifying its integrity, appropriateness, and alignment with its intended use. It includes analyses of model assumptions, data quality, performance metrics, outcomes of testing procedures, and risk considerations. The validation report supports transparency, regulatory compliance, and informed decision-making by documenting the validator’s independent review and conclusions.\n",
-    "\n",
-    "**Validation report template**: Serves as a standardized framework for conducting and documenting model validation activities. It outlines the required sections, recommended analyses, and expected validation tests, ensuring consistency and completeness across validation reports. The template helps guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e0e1cf3d",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "609fe59b",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Register a sample model\n",
-    "\n",
-    "In a usual model lifecycle, a champion model will have been independently registered in your model inventory and submitted to you for validation by your model development team as part of the effective challenge process. (**Learn more:** [Submit for approval](https://docs.validmind.ai/guide/model-documentation/submit-for-approval.html))\n",
-    "\n",
-    "For this notebook, we'll have you register a dummy model in the ValidMind Platform inventory and assign yourself as the validator to familiarize you with the ValidMind interface and circumvent the need for an existing model:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down — don’t worry, we’ll adjust these permissions next for validation.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "58e552bb",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_1__'></a>\n",
-    "\n",
-    "#### Assign validator credentials\n",
-    "\n",
-    "In order to log tests as a validator instead of as a developer, on the model details page that appears after you've successfully registered your sample model:\n",
-    "\n",
-    "1. Remove yourself as a model owner: \n",
-    "\n",
-    "    - Click on the **OWNERS** tile.\n",
-    "    - Click the **x** next to your name to remove yourself from that model's role.\n",
-    "    - Click **Save** to apply your changes to that role.\n",
-    "\n",
-    "2. Remove yourself as a developer: \n",
-    "\n",
-    "    - Click on the **DEVELOPERS** tile.\n",
-    "    - Click the **x** next to your name to remove yourself from that model's role.\n",
-    "    - Click **Save** to apply your changes to that role.\n",
-    "\n",
-    "3. Add yourself as a validator: \n",
-    "\n",
-    "    - Click on the **VALIDATORS** tile.\n",
-    "    - Select your name from the drop-down menu.\n",
-    "    - Click **Save** to apply your changes to that role."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "84251589",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier for developers.\n",
-    "\n",
-    "We'll need this documentation template later for reference as we draft our validation report:\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Documentation**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "fdfb5dc5",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_3__'></a>\n",
-    "\n",
-    "#### Apply validation report template\n",
-    "\n",
-    "Next, let's select a validation report template. A template predefines sections for your report and provides a general outline to follow, making the validation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Validation**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Generic Validation Report`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f656d0d6",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "931d8f7f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1435fd5b",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b375b341",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3_1__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d5d87e2d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"validation-report\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "331e1c07",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Getting to know ValidMind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f6331a98",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Preview the validation report template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will attach evidence to this template in the form of risk assessment notes, artifacts, and test results later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "13d34bbb",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "20717133",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1_1__'></a>\n",
-    "\n",
-    "#### View validation report in the ValidMind Platform\n",
-    "\n",
-    "Next, let's head to the ValidMind Platform to see the template in action:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this \"ValidMind for model validation\" series of notebooks.\n",
-    "\n",
-    "3. Click **Validation** under Documents for your model and note:\n",
-    "\n",
-    "    - [x] The risk assessment compliance summary at the top of the report (screenshot below)\n",
-    "    - [x] How the structure of the validation report reflects the previewed template\n",
-    "\n",
-    "    <img src= \"compliance-summary.png\" alt=\"Screenshot showing the risk assessment compliance summary\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f5d0aaab",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Explore available tests\n",
-    "\n",
-    "Next, let's explore the list of all available tests in the ValidMind Library with [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) — we'll later narrow down the tests we want to run from this list when we learn to run tests."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "de6abc2a",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "dce47e40",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "10272aa9",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7a0c3cc2",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2dac11d5",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "174d2c8d",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this first notebook, you learned how to:\n",
-    "\n",
-    "- [x] Register a model within the ValidMind Platform and assign yourself as the validator\n",
-    "- [x] Install and initialize the ValidMind Library\n",
-    "- [x] Preview the validation report template for your model\n",
-    "- [x] Explore the available tests offered by the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d8ffdcf7",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Start the model validation process\n",
-    "\n",
-    "Now that the ValidMind Library is connected to your model in the ValidMind Platform with the correct template applied, we can go ahead and start the model validation process: **[2 — Start the model validation process](2-start_validation_process.ipynb)**"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-5d7a1c159e4840fca79011d1c0380725",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
-}
diff --git a/site/notebooks/tutorials/model_validation/2-start_validation_process.ipynb b/site/notebooks/tutorials/model_validation/2-start_validation_process.ipynb
deleted file mode 100644
index 7fafa5ab50..0000000000
--- a/site/notebooks/tutorials/model_validation/2-start_validation_process.ipynb
+++ /dev/null
@@ -1,889 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# ValidMind for model validation 2 — Start the model validation process\n",
-    "\n",
-    "Learn how to use ValidMind for your end-to-end model validation process with our series of four introductory notebooks. In this second notebook, independently verify the data quality tests performed on the dataset used to train the champion model.\n",
-    "\n",
-    "You'll learn how to run relevant validation tests with ValidMind, log the results of those tests to the ValidMind Platform, and insert your logged test results as evidence into your validation report. You'll become familiar with the tests available in ValidMind, as well as how to run them. Running tests during model validation is crucial to the effective challenge process, as we want to independently evaluate the evidence and assessments provided by the model development team.\n",
-    "\n",
-    "While running our tests in this notebook, we'll focus on:\n",
-    "\n",
-    "- Ensuring that data used for training and testing the model is of appropriate data quality\n",
-    "- Ensuring that the raw data has been preprocessed appropriately and that the resulting final datasets reflect this\n",
-    "\n",
-    "**For a full list of out-of-the-box tests,** refer to our [Test descriptions](https://docs.validmind.ai/developer/model-testing/test-descriptions.html) or try the interactive [Test sandbox](https://docs.validmind.ai/developer/model-testing/test-sandbox.html).\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
-    "<br></br>\n",
-    "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Prerequisites](#toc1__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_1__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "- [Verifying data quality adjustments](#toc4__)    \n",
-    "  - [Identify qualitative tests](#toc4_1__)    \n",
-    "  - [Initialize the ValidMind dataset](#toc4_2__)    \n",
-    "  - [Run data quality tests](#toc4_3__)    \n",
-    "    - [Run tabular data tests](#toc4_3_1__)    \n",
-    "  - [Remove highly correlated features](#toc4_4__)    \n",
-    "- [Documenting test results](#toc5__)    \n",
-    "  - [Configure and run comparison tests](#toc5_1__)    \n",
-    "  - [Log tests with unique identifiers](#toc5_2__)    \n",
-    "  - [Add test results to reporting](#toc5_3__)    \n",
-    "- [Split the preprocessed dataset](#toc6__)    \n",
-    "  - [Initialize the split datasets](#toc6_1__)    \n",
-    "- [In summary](#toc7__)    \n",
-    "- [Next steps](#toc8__)    \n",
-    "  - [Develop potential challenger models](#toc8_1__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Prerequisites\n",
-    "\n",
-    "In order to independently assess the quality of your datasets with this notebook, you'll need to first have:\n",
-    "\n",
-    "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
-    "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
-    "<br></br>\n",
-    "Refer to the first notebook in this series: <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library\n",
-    "\n",
-    "First, let's connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Make sure the ValidMind Library is installed\n",
-    "\n",
-    "%pip install -q validmind\n",
-    "\n",
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"validation-report\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "Let's first import the public [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset from Kaggle, which was used to develop the dummy champion model.\n",
-    "\n",
-    "We'll use this dataset to review steps that should have been conducted during the initial development and documentation of the model to ensure that the model was built correctly. By independently performing steps taken by the model development team, we can confirm whether the model was built using appropriate and properly processed data.\n",
-    "\n",
-    "In our below example, note that:\n",
-    "\n",
-    "- The target column, `Exited` has a value of `1` when a customer has churned and `0` otherwise.\n",
-    "- The ValidMind Library provides a wrapper to automatically load the dataset as a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) object. A Pandas Dataframe is a two-dimensional tabular data structure that makes use of rows and columns."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = demo_dataset.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Verifying data quality adjustments\n",
-    "\n",
-    "Let's say that thanks to the documentation submitted by the model development team ([Learn more ...](https://docs.validmind.ai/developer/validmind-library.html#for-model-development)), we know that the sample dataset was first modified before being used to train the champion model. After performing some data quality assessments on the raw dataset, it was determined that the dataset required rebalancing, and highly correlated features were also removed."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Identify qualitative tests\n",
-    "\n",
-    "During model validation, we use the same data processing logic and training procedure to confirm that the model's results can be reproduced independently, so let's start by doing some data quality assessments by running a few individual tests just like the development team did.\n",
-    "\n",
-    "Use the [`vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) introduced by the first notebook in this series in combination with [`vm.tests.list_tags()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tags) and [`vm.tests.list_tasks()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks) to find which prebuilt tests are relevant for data quality assessment:\n",
-    "\n",
-    "- **`tasks`** represent the kind of modeling task associated with a test. Here we'll focus on `classification` tasks.\n",
-    "- **`tags`** are free-form descriptions providing more details about the test, for example, what category the test falls into. Here we'll focus on the `data_quality` tag."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Get the list of available task types\n",
-    "sorted(vm.tests.list_tasks())"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Get the list of available tags\n",
-    "sorted(vm.tests.list_tags())"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You can pass `tags` and `tasks` as parameters to the `vm.tests.list_tests()` function to filter the tests based on the tags and task types.\n",
-    "\n",
-    "For example, to find tests related to tabular data quality for classification models, you can call `list_tests()` like this:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(task=\"classification\", tags=[\"tabular_data\", \"data_quality\"])"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about navigating ValidMind tests?</b></span>\n",
-    "<br></br>\n",
-    "Refer to our notebook outlining the utilities available for viewing and understanding available ValidMind tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind dataset\n",
-    "\n",
-    "With the individual tests we want to run identified, the next step is to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
-    "\n",
-    "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
-    "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# vm_raw_dataset is now a VMDataset object that you can pass to any ValidMind test\n",
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=raw_df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3__'></a>\n",
-    "\n",
-    "### Run data quality tests\n",
-    "\n",
-    "Now that we know how to initialize a ValidMind `dataset` object, we're ready to run some tests!\n",
-    "\n",
-    "You run individual tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module. For the examples below, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`test_id`** — The ID of the test to run, as seen in the `ID` column when you run `list_tests`. \n",
-    "- **`params`** — A dictionary of parameters for the test. These will override any `default_params` set in the test definition. "
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3_1__'></a>\n",
-    "\n",
-    "#### Run tabular data tests\n",
-    "\n",
-    "The inputs expected by a test can also be found in the test definition — let's take [`validmind.data_validation.DescriptiveStatistics`](https://docs.validmind.ai/tests/data_validation/DescriptiveStatistics.html) as an example.\n",
-    "\n",
-    "Note that the output of the [`describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) below shows that this test expects a `dataset` as input:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.describe_test(\"validmind.data_validation.DescriptiveStatistics\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now, let's run a few tests to assess the quality of the dataset:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result2 = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.ClassImbalance\",\n",
-    "    inputs={\"dataset\": vm_raw_dataset},\n",
-    "    params={\"min_percent_threshold\": 30},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "The output above shows that [the class imbalance test](https://docs.validmind.ai/tests/data_validation/ClassImbalance.html) did not pass according to the value we set for `min_percent_threshold` — great, this matches what was reported by the model development team.\n",
-    "\n",
-    "To address this issue, we'll re-run the test on some processed data. In this case let's apply a very simple rebalancing technique to the dataset:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
-    "\n",
-    "# Create a balanced dataset with the same number of exited and not exited customers\n",
-    "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
-    "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
-    "\n",
-    "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
-    "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "With this new balanced dataset, you can re-run the individual test to see if it now passes the class imbalance test requirement.\n",
-    "\n",
-    "As this is technically a different dataset, **remember to first initialize a new ValidMind `Dataset` object** to pass in as input as required by `run_test()`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
-    "vm_balanced_raw_dataset = vm.init_dataset(\n",
-    "    dataset=balanced_raw_df,\n",
-    "    input_id=\"balanced_raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Pass the initialized `balanced_raw_dataset` as input into the test run\n",
-    "result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.ClassImbalance\",\n",
-    "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
-    "    params={\"min_percent_threshold\": 30},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4__'></a>\n",
-    "\n",
-    "### Remove highly correlated features\n",
-    "\n",
-    "Next, let's also remove highly correlated features from our dataset as outlined by the development team. Removing highly correlated features helps make the model simpler, more stable, and easier to understand.\n",
-    "\n",
-    "You can utilize the output from a ValidMind test for further use — in the example below, to retrieve the list of features with the highest correlation coefficients and use them to reduce the final list of features for modeling.\n",
-    "\n",
-    "First, we'll run [`validmind.data_validation.HighPearsonCorrelation`](https://docs.validmind.ai/tests/data_validation/HighPearsonCorrelation.html) with the `balanced_raw_dataset` we initialized previously as input, as is, for comparison with later runs:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "The output above shows that the test did not pass according to the value we set for `max_threshold` — as reported and expected.\n",
-    "\n",
-    "`corr_result` is an object of type `TestResult`. We can inspect the result object to see what the test has produced:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(type(corr_result))\n",
-    "print(\"Result ID: \", corr_result.result_id)\n",
-    "print(\"Params: \", corr_result.params)\n",
-    "print(\"Passed: \", corr_result.passed)\n",
-    "print(\"Tables: \", corr_result.tables)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let's remove the highly correlated features and create a new VM `dataset` object.\n",
-    "\n",
-    "We'll begin by checking out the table in the result and extracting a list of features that failed the test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract table from `corr_result.tables`\n",
-    "features_df = corr_result.tables[0].data\n",
-    "features_df"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract list of features that failed the test\n",
-    "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Next, extract the feature names from the list of strings (example: `(Age, Exited)` > `Age`):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now, it's time to re-initialize the dataset with the highly correlated features removed.\n",
-    "\n",
-    "**Note the use of a different `input_id`.** This allows tracking the inputs used when running each individual test."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Remove the highly correlated features from the dataset\n",
-    "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
-    "\n",
-    "# Re-initialize the dataset object\n",
-    "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
-    "    dataset=balanced_raw_no_age_df,\n",
-    "    input_id=\"raw_dataset_preprocessed\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Re-running the test with the reduced feature set should pass the test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You can also plot the correlation matrix to visualize the new correlation between features:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.PearsonCorrelationMatrix\",\n",
-    "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Documenting test results\n",
-    "\n",
-    "Now that we've done some analysis on two different datasets, we can use ValidMind to easily document why certain things were done to our raw data with testing to support it. Every test result returned by the `run_test()` function has a `.log()` method that can be used to send the test results to the ValidMind Platform.\n",
-    "\n",
-    "When logging validation test results to the platform, you'll need to manually add those results to the desired section of the validation report. To demonstrate how to add test results to your validation report, we'll log our data quality tests and insert the results via the ValidMind Platform."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Configure and run comparison tests\n",
-    "\n",
-    "Below, we'll perform comparison tests between the original raw dataset (`raw_dataset`) and the final preprocessed (`raw_dataset_preprocessed`) dataset, again logging the results to the ValidMind Platform. \n",
-    "\n",
-    "We can specify all the tests we'd like to run in a dictionary called `test_config`, and we'll pass in the following arguments for each test:\n",
-    "\n",
-    "  - **`params`:** Individual test parameters.\n",
-    "  - **`input_grid`:** Individual test inputs to compare. In this case, we'll input our two datasets for comparison.\n",
-    "\n",
-    "**Note here that the `input_grid` expects the `input_id` of the dataset as the value rather than the variable name we specified:**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Individual test config with inputs specified\n",
-    "test_config = {\n",
-    "    \"validmind.data_validation.ClassImbalance\": {\n",
-    "        \"input_grid\": {\"dataset\": [\"raw_dataset\", \"raw_dataset_preprocessed\"]},\n",
-    "        \"params\": {\"min_percent_threshold\": 30}\n",
-    "    },\n",
-    "    \"validmind.data_validation.HighPearsonCorrelation\": {\n",
-    "        \"input_grid\": {\"dataset\": [\"raw_dataset\", \"raw_dataset_preprocessed\"]},\n",
-    "        \"params\": {\"max_threshold\": 0.3}\n",
-    "    },\n",
-    "}"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Then batch run and log our tests in `test_config`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for t in test_config:\n",
-    "    print(t)\n",
-    "    try:\n",
-    "        # Check if test has input_grid\n",
-    "        if 'input_grid' in test_config[t]:\n",
-    "            # For tests with input_grid, pass the input_grid configuration\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
-    "        else:\n",
-    "            # Original logic for regular inputs\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
-    "    except Exception as e:\n",
-    "        print(f\"Error running test {t}: {str(e)}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for some test IDs. </b></span>\n",
-    "<br></br>\n",
-    "That's expected, as when we run validation tests, the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Log tests with unique identifiers\n",
-    "\n",
-    "Next, we'll use the previously initialized `vm_balanced_raw_dataset` (that still has a highly correlated `Age` column) as input to run an individual test, then log the result to the ValidMind Platform.\n",
-    "\n",
-    "When running individual tests, **you can use a custom `result_id` to tag the individual result with a unique identifier:**\n",
-    "\n",
-    "- This `result_id` can be appended to `test_id` with a `:` separator.\n",
-    "- The `balanced_raw_dataset` result identifier will correspond to the `balanced_raw_dataset` input, the dataset that still has the `Age` column."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation:balanced_raw_dataset\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_3__'></a>\n",
-    "\n",
-    "### Add test results to reporting\n",
-    "\n",
-    "With some test results logged, let's head to the model we connected to at the beginning of this notebook and learn how to insert a test result into our validation report ([Need more help?](https://docs.validmind.ai/guide/model-validation/assess-compliance.html#link-validator-evidence)).\n",
-    "\n",
-    "While the example below focuses on a specific test result, you can follow the same general procedure for your other results:\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
-    "\n",
-    "3. Locate the Data Preparation section and click on **2.2.1. Data Quality** to expand that section.\n",
-    "\n",
-    "4. Under the Class Imbalance Assessment section, locate Validator Evidence then click **Link Evidence to Report**:\n",
-    "\n",
-    "    <img src= \"link-validator-evidence.png\" alt=\"Screenshot showing the validation report with the link validator evidence to report option highlighted\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "5. Select the Class Imbalance test results we logged: **ValidMind Data Validation Class Imbalance** \n",
-    "\n",
-    "    <img src= \"selecting-class-imbalance-results.png\" alt=\"Screenshot showing the ClassImbalance test selected\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "6. Click **Update Linked Evidence** to add the test results to the validation report.\n",
-    "\n",
-    "    Confirm that the results for the Class Imbalance test have been correctly inserted into section **2.2.1. Data Quality** of the report:\n",
-    "\n",
-    "    <img src= \"inserted-class-imbalance-results.png\" alt=\"Screenshot showing the ClassImbalance test inserted into the validation report\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "7. Note that these test results are flagged as **Requires Attention** — as they include comparative results from our initial raw dataset.\n",
-    "\n",
-    "    Click **See evidence details** to review the LLM-generated description that summarizes the test results and confirms that our final preprocessed dataset actually passes our test:\n",
-    "\n",
-    "    <img src= \"class-imbalance-results-detail.png\" alt=\"Screenshot showing the ClassImbalance test generated description in the text editor\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>    Here in this text editor, you can make qualitative edits to the draft that ValidMind generated to finalize the test results.</b></span>\n",
-    "<br></br>\n",
-    "Learn more: <a href=\"https://docs.validmind.ai/guide/model-documentation/work-with-content-blocks.html\" style=\"color: #DE257E;\"><b>Work with content blocks</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Split the preprocessed dataset\n",
-    "\n",
-    "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing.\n",
-    "\n",
-    "To start, let's grab the first few rows from the `balanced_raw_no_age_df` dataset we initialized earlier:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "balanced_raw_no_age_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Before training the model, we need to encode the categorical features in the dataset:\n",
-    "\n",
-    "- Use the `get_dummies()` function from `pandas` to one-hot encode the categorical features.\n",
-    "- The categorical features in the dataset are `Geography` and `Gender`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "balanced_raw_no_age_df = pd.get_dummies(\n",
-    "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
-    ")\n",
-    "balanced_raw_no_age_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Splitting our dataset into training and testing is essential for proper validation testing, as this helps assess how well the model generalizes to unseen data:\n",
-    "\n",
-    "- We start by dividing our `balanced_raw_no_age_df` dataset into training and test subsets using `train_test_split`, with 80% of the data allocated to training (`train_df`) and 20% to testing (`test_df`).\n",
-    "- From each subset, we separate the features (all columns except \"Exited\") into `X_train` and `X_test`, and the target column (\"Exited\") into `y_train` and `y_test`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.model_selection import train_test_split\n",
-    "\n",
-    "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
-    "\n",
-    "X_train = train_df.drop(\"Exited\", axis=1)\n",
-    "y_train = train_df[\"Exited\"]\n",
-    "X_test = test_df.drop(\"Exited\", axis=1)\n",
-    "y_test = test_df[\"Exited\"]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Initialize the split datasets\n",
-    "\n",
-    "Next, let's initialize the training and testing datasets so they are available for use:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset_final\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset_final\",\n",
-    "    dataset=test_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this second notebook, you learned how to:\n",
-    "\n",
-    "- [x] Import a sample dataset\n",
-    "- [x] Identify which tests you might want to run with ValidMind\n",
-    "- [x] Initialize ValidMind datasets\n",
-    "- [x] Run individual tests\n",
-    "- [x] Utilize the output from tests you’ve run\n",
-    "- [x] Log test results as evidence to the ValidMind Platform\n",
-    "- [x] Insert test results into your validation report"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "<a id='toc8_1__'></a>\n",
-    "\n",
-    "### Develop potential challenger models\n",
-    "\n",
-    "Now that you're familiar with the basics of using the ValidMind Library, let's use it to develop a challenger model: **[3 — Developing a potential challenger model](3-developing_challenger_model.ipynb)**"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-a798ee72616640f5bead3af25e6e9434",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}
diff --git a/site/notebooks/tutorials/model_validation/3-developing_challenger_model.ipynb b/site/notebooks/tutorials/model_validation/3-developing_challenger_model.ipynb
deleted file mode 100644
index e86fde85de..0000000000
--- a/site/notebooks/tutorials/model_validation/3-developing_challenger_model.ipynb
+++ /dev/null
@@ -1,893 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# ValidMind for model validation 3 — Developing a potential challenger model\n",
-    "\n",
-    "Learn how to use ValidMind for your end-to-end model validation process with our series of four introductory notebooks. In this third notebook, develop a potential challenger model and then pass your model and its predictions to ValidMind.\n",
-    "\n",
-    "A *challenger model* is an alternate model that attempts to outperform the champion model, ensuring that the best performing fit-for-purpose model is always considered for deployment. Challenger models also help avoid over-reliance on a single model, and allow testing of new features, algorithms, or data sources without disrupting the production lifecycle.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
-    "<br></br>\n",
-    "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Prerequisites](#toc1_)    \n",
-    "- [Setting up](#toc2_)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_1_)    \n",
-    "  - [Import the sample dataset](#toc2_2_)    \n",
-    "    - [Preprocess the dataset](#toc2_2_1_)    \n",
-    "  - [Split the preprocessed dataset](#toc2_3_)    \n",
-    "- [Import the champion model](#toc3_)    \n",
-    "- [Training a potential challenger model](#toc4_)    \n",
-    "  - [Random forest classification model](#toc4_1_)    \n",
-    "- [Initializing the model objects](#toc5_)    \n",
-    "  - [Initialize the model objects](#toc5_1_)    \n",
-    "  - [Assign predictions](#toc5_2_)    \n",
-    "- [Running model evaluation tests](#toc6_)    \n",
-    "  - [Run model performance tests](#toc6_1_)    \n",
-    "    - [Evaluate performance of the champion model](#toc6_1_1_)    \n",
-    "    - [Log an artifact](#toc6_1_2_)    \n",
-    "    - [Evaluate performance of challenger model](#toc6_1_3_)    \n",
-    "  - [Run diagnostic tests](#toc6_2_)    \n",
-    "  - [Run feature importance tests](#toc6_3_)    \n",
-    "- [In summary](#toc7_)    \n",
-    "- [Next steps](#toc8_)    \n",
-    "  - [Finalize validation and reporting](#toc8_1_)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_'></a>\n",
-    "\n",
-    "## Prerequisites\n",
-    "\n",
-    "In order to develop potential challenger models with this notebook, you'll need to first have:\n",
-    "\n",
-    "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
-    "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
-    "- [x] Learned how to import and initialize datasets for use with ValidMind\n",
-    "- [x] Understood the basics of how to run and log tests with ValidMind\n",
-    "- [x] Run data quality tests on the datasets used to train the champion model, and logged the results of those tests to ValidMind\n",
-    "- [x] Inserted your logged test results into your validation report\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
-    "<br></br>\n",
-    "Refer to the first two notebooks in this series:\n",
-    "\n",
-    "- <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a>\n",
-    "- <a href=\"2-start_validation_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the model validation process</b></a>\n",
-    "\n",
-    "</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_'></a>\n",
-    "\n",
-    "## Setting up\n",
-    "\n",
-    "This section should be quite familiar to you — as we performed the same actions in the previous notebook, **[2 — Start the model validation process](2-start_validation_process.ipynb)**."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1_'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library\n",
-    "\n",
-    "As usual, let's first connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Make sure the ValidMind Library is installed\n",
-    "\n",
-    "%pip install -q validmind\n",
-    "\n",
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"validation-report\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_'></a>\n",
-    "\n",
-    "### Import the sample dataset\n",
-    "\n",
-    "Next, we'll load in the sample [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset used to develop the champion model that we will independently preprocess:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load the sample dataset\n",
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = demo_dataset.load_data()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1_'></a>\n",
-    "\n",
-    "#### Preprocess the dataset\n",
-    "\n",
-    "We’ll apply a simple rebalancing technique to the dataset before continuing:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
-    "\n",
-    "# Create a balanced dataset with the same number of exited and not exited customers\n",
-    "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
-    "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
-    "\n",
-    "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
-    "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let’s also quickly remove highly correlated features from the dataset using the output from a ValidMind test.\n",
-    "\n",
-    "As you know, before we can run tests you’ll need to initialize a ValidMind dataset object with the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
-    "vm_balanced_raw_dataset = vm.init_dataset(\n",
-    "    dataset=balanced_raw_df,\n",
-    "    input_id=\"balanced_raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "With our balanced dataset initialized, we can then run our test and utilize the output to help us identify the features we want to remove:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Run HighPearsonCorrelation test with our balanced dataset as input and return a result object\n",
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# From result object, extract table from `corr_result.tables`\n",
-    "features_df = corr_result.tables[0].data\n",
-    "features_df"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract list of features that failed the test\n",
-    "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract feature names from the list of strings\n",
-    "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "We can then re-initialize the dataset with a different `input_id` and the highly correlated features removed and re-run the test for confirmation:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Remove the highly correlated features from the dataset\n",
-    "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
-    "\n",
-    "# Re-initialize the dataset object\n",
-    "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
-    "    dataset=balanced_raw_no_age_df,\n",
-    "    input_id=\"raw_dataset_preprocessed\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Re-run the test with the reduced feature set\n",
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3_'></a>\n",
-    "\n",
-    "### Split the preprocessed dataset\n",
-    "\n",
-    "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Encode categorical features in the dataset\n",
-    "balanced_raw_no_age_df = pd.get_dummies(\n",
-    "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
-    ")\n",
-    "balanced_raw_no_age_df.head()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.model_selection import train_test_split\n",
-    "\n",
-    "# Split the dataset into train and test\n",
-    "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
-    "\n",
-    "X_train = train_df.drop(\"Exited\", axis=1)\n",
-    "y_train = train_df[\"Exited\"]\n",
-    "X_test = test_df.drop(\"Exited\", axis=1)\n",
-    "y_test = test_df[\"Exited\"]"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the split datasets\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset_final\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset_final\",\n",
-    "    dataset=test_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_'></a>\n",
-    "\n",
-    "## Import the champion model\n",
-    "\n",
-    "With our raw dataset assessed and preprocessed, let's go ahead and import the champion model submitted by the model development team in the format of a `.pkl` file: **[lr_model_champion.pkl](lr_model_champion.pkl)**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the champion model\n",
-    "import pickle as pkl\n",
-    "\n",
-    "with open(\"lr_model_champion.pkl\", \"rb\") as f:\n",
-    "    log_reg = pkl.load(f)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_'></a>\n",
-    "\n",
-    "## Training a potential challenger model\n",
-    "\n",
-    "We're curious how an alternate model compares to our champion model, so let's train a challenger model as a basis for our testing.\n",
-    "\n",
-    "Our champion *logistic regression model* is a simpler, parametric model that assumes a linear relationship between the independent variables and the log-odds of the outcome. While logistic regression may not capture complex patterns as effectively, it offers a high degree of interpretability and is easier to explain to stakeholders. However, model risk is not calculated in isolation from a single factor, but rather in consideration with trade-offs in predictive performance, ease of interpretability, and overall alignment with business objectives."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1_'></a>\n",
-    "\n",
-    "### Random forest classification model\n",
-    "\n",
-    "A *random forest classification model* is an ensemble machine learning algorithm that uses multiple decision trees to classify data. In ensemble learning, multiple models are combined to improve prediction accuracy and robustness.\n",
-    "\n",
-    "Random forest classification models generally have higher accuracy because they capture complex, non-linear relationships, but as a result they lack transparency in their predictions."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the Random Forest Classification model\n",
-    "from sklearn.ensemble import RandomForestClassifier\n",
-    "\n",
-    "# Create the model instance with 50 decision trees\n",
-    "rf_model = RandomForestClassifier(\n",
-    "    n_estimators=50,\n",
-    "    random_state=42,\n",
-    ")\n",
-    "\n",
-    "# Train the model\n",
-    "rf_model.fit(X_train, y_train)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_'></a>\n",
-    "\n",
-    "## Initializing the model objects"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1_'></a>\n",
-    "\n",
-    "### Initialize the model objects\n",
-    "\n",
-    "In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our two models.\n",
-    "\n",
-    "You simply initialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the champion logistic regression model\n",
-    "vm_log_model = vm.init_model(\n",
-    "    log_reg,\n",
-    "    input_id=\"log_model_champion\",\n",
-    ")\n",
-    "\n",
-    "# Initialize the challenger random forest classification model\n",
-    "vm_rf_model = vm.init_model(\n",
-    "    rf_model,\n",
-    "    input_id=\"rf_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2_'></a>\n",
-    "\n",
-    "### Assign predictions\n",
-    "\n",
-    "With our models registered, we'll move on to assigning both the predictive probabilities coming directly from each model's predictions, and the binary prediction after applying the cutoff threshold described in the Compute binary predictions step above.\n",
-    "\n",
-    "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
-    "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
-    "\n",
-    "If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Champion — Logistic regression model\n",
-    "vm_train_ds.assign_predictions(model=vm_log_model)\n",
-    "vm_test_ds.assign_predictions(model=vm_log_model)\n",
-    "\n",
-    "# Challenger — Random forest classification model\n",
-    "vm_train_ds.assign_predictions(model=vm_rf_model)\n",
-    "vm_test_ds.assign_predictions(model=vm_rf_model)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_'></a>\n",
-    "\n",
-    "## Running model evaluation tests\n",
-    "\n",
-    "With our setup complete, let's run the rest of our validation tests. Since we have already verified the data quality of the dataset used to train our champion model, we will now focus on comprehensive performance evaluations of both the champion and challenger models."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1_'></a>\n",
-    "\n",
-    "### Run model performance tests\n",
-    "\n",
-    "Let's run some performance tests, beginning with independent testing of our champion logistic regression model, then moving on to our potential challenger model.\n",
-    "\n",
-    "Use [`vm.tests.list_tests()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to identify all the model performance tests for classification:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "vm.tests.list_tests(tags=[\"model_performance\"], task=\"classification\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "We'll isolate the specific tests we want to run in `mpt`:\n",
-    "\n",
-    "- [`ClassifierPerformance`](https://docs.validmind.ai/tests/model_validation/sklearn/ClassifierPerformance.html)\n",
-    "- [`ConfusionMatrix`](https://docs.validmind.ai/tests/model_validation/sklearn/ConfusionMatrix.html)\n",
-    "- [`MinimumAccuracy`](https://docs.validmind.ai/tests/model_validation/sklearn/MinimumAccuracy.html)\n",
-    "- [`MinimumF1Score`](https://docs.validmind.ai/tests/model_validation/sklearn/MinimumF1Score.html)\n",
-    "- [`ROCCurve`](https://docs.validmind.ai/tests/model_validation/sklearn/ROCCurve.html)\n",
-    "\n",
-    "As we learned in the previous notebook [2 — Start the model validation process](2-start_validation_process.ipynb), you can use a custom `result_id` to tag the individual result with a unique identifier by appending this `result_id` to the `test_id` with a `:` separator. We'll append an identifier for our champion model here:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "mpt = [\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:logreg_champion\",\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix:logreg_champion\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy:logreg_champion\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score:logreg_champion\",\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve:logreg_champion\"\n",
-    "]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1_1_'></a>\n",
-    "\n",
-    "#### Evaluate performance of the champion model\n",
-    "\n",
-    "Now, let's run and log our batch of model performance tests using our testing dataset (`vm_test_ds`) for our champion model:\n",
-    "\n",
-    "- The test set serves as a proxy for real-world data, providing an unbiased estimate of model performance since it was not used during training or tuning.\n",
-    "- The test set also acts as protection against selection bias and model tweaking, giving a final, more unbiased checkpoint."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for test in mpt:\n",
-    "    vm.tests.run_test(\n",
-    "        test,\n",
-    "        inputs={\n",
-    "            \"dataset\": vm_test_ds, \"model\" : vm_log_model,\n",
-    "        },\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for some test IDs. </b></span>\n",
-    "<br></br>\n",
-    "That's expected, as when we run validation tests, the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1_2_'></a>\n",
-    "\n",
-    "#### Log an artifact\n",
-    "\n",
-    "As we can observe from the output above, our champion model doesn't pass the `MinimumAccuracy` test based on the default thresholds of the out-of-the-box test, so let's log an artifact (finding) in the ValidMind Platform ([Need more help?](https://docs.validmind.ai/guide/model-validation/add-manage-artifacts.html)):\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
-    "\n",
-    "3. Locate the Data Preparation section and click on **2.2.2. Model Performance** to expand that section.\n",
-    "\n",
-    "4. Under the Model Performance Metrics section, locate Artifacts then click **Link Artifact to Report**:\n",
-    "\n",
-    "    <img src=\"link-artifact.png\" alt=\"Screenshot showing the validation report with the link artifact option highlighted\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "5. Select **Validation Issue** as the type of artifact.\n",
-    "\n",
-    "6. Click **+ Add Validation Issue** to add a validation issue type artifact.\n",
-    "\n",
-    "7. Enter in the details for your validation issue, for example:\n",
-    "\n",
-    "    - **TITLE** — Champion Logistic Regression Model Fails Minimum Accuracy Threshold\n",
-    "    - **RISK AREA** — Model Performance\n",
-    "    - **DOCUMENTATION SECTION** — 3.2. Model Evaluation\n",
-    "    - **DESCRIPTION** — The logistic regression champion model was subjected to a Minimum Accuracy test to determine whether its predictive accuracy meets the predefined performance threshold of 0.7. The model achieved an accuracy score of 0.6136, which falls below the required minimum. As a result, the test produced a Fail outcome.\n",
-    "\n",
-    "8. Click **Save**.\n",
-    "\n",
-    "9. Select the validation issue you just added to link to your validation report and click **Update Linked Artifacts** to insert your validation issue.\n",
-    "\n",
-    "10. Click on the validation issue to expand the issue, where you can adjust details such as severity, owner, due date, status, etc. as well as include proposed remediation plans or supporting documentation as attachments."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1_3_'></a>\n",
-    "\n",
-    "#### Evaluate performance of challenger model\n",
-    "\n",
-    "We've now conducted similar tests as the model development team for our champion model, with the aim of verifying their test results.\n",
-    "\n",
-    "Next, let's see how our challenger model compares. We'll use the same batch of tests here as we did in `mpt`, but append a different `result_id` to indicate that these results should be associated with our challenger model:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "mpt_chall = [\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:champion_vs_challenger\",\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix:champion_vs_challenger\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy:champion_vs_challenger\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score:champion_vs_challenger\",\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve:champion_vs_challenger\"\n",
-    "]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "We'll run each test once for each model with the same `vm_test_ds` dataset to compare them:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for test in mpt_chall:\n",
-    "    vm.tests.run_test(\n",
-    "        test,\n",
-    "        input_grid={\n",
-    "            \"dataset\": [vm_test_ds], \"model\" : [vm_log_model,vm_rf_model]\n",
-    "        }\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Based on the performance metrics, our challenger random forest classification model passes the <code>MinimumAccuracy</code> where our champion did not.</b></span>\n",
-    "<br></br>\n",
-    "In your validation report, support your recommendation in your validation issue's <b>Proposed Remediation Plan</b> to investigate the usage of our challenger model by inserting the performance tests we logged with this notebook into the appropriate section.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_'></a>\n",
-    "\n",
-    "### Run diagnostic tests\n",
-    "\n",
-    "Next, we want to inspect the robustness and stability testing comparison between our champion and challenger model.\n",
-    "\n",
-    "Use `list_tests()` to list all available diagnosis tests applicable to classification tasks:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(tags=[\"model_diagnosis\"], task=\"classification\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let’s now assess the models for potential signs of *overfitting* and identify any sub-segments where performance may be inconsistent with the [`OverfitDiagnosis` test](https://docs.validmind.ai/tests/model_validation/sklearn/OverfitDiagnosis.html).\n",
-    "\n",
-    "Overfitting occurs when a model learns the training data too well, capturing not only the true pattern but also noise and random fluctuations, resulting in excellent performance on the training dataset but poor generalization to new, unseen data:\n",
-    "\n",
-    "- Since the training dataset (`vm_train_ds`) was used to fit the model, we use this set to establish a baseline performance for how well the model performs on data it has already seen.\n",
-    "- The testing dataset (`vm_test_ds`) was never seen during training, and here simulates real-world generalization, or how well the model performs on new, unseen data. "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.model_validation.sklearn.OverfitDiagnosis:champion_vs_challenger\",\n",
-    "    input_grid={\n",
-    "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
-    "        \"model\" : [vm_log_model,vm_rf_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let's also conduct *robustness* and *stability* testing of the two models with the [`RobustnessDiagnosis` test](https://docs.validmind.ai/tests/model_validation/sklearn/RobustnessDiagnosis.html). Robustness refers to a model's ability to maintain consistent performance, and stability refers to a model's ability to produce consistent outputs over time across different data subsets.\n",
-    "\n",
-    "Again, we'll use both the training and testing datasets to establish baseline performance and to simulate real-world generalization:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.model_validation.sklearn.RobustnessDiagnosis:Champion_vs_LogRegression\",\n",
-    "    input_grid={\n",
-    "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
-    "        \"model\" : [vm_log_model,vm_rf_model]\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3_'></a>\n",
-    "\n",
-    "### Run feature importance tests\n",
-    "\n",
-    "We also want to verify the relative influence of different input features on our models' predictions, as well as inspect the differences between our champion and challenger model to see if a certain model offers more understandable or logical importance scores for features.\n",
-    "\n",
-    "Use `list_tests()` to identify all the feature importance tests for classification:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Store the feature importance tests\n",
-    "FI = vm.tests.list_tests(tags=[\"feature_importance\"], task=\"classification\",pretty=False)\n",
-    "FI"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "We'll only use our testing dataset (`vm_test_ds`) here, to provide a realistic, unseen sample that mimics future or production data, as the training dataset has already influenced our model during learning:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Run and log our feature importance tests for both models for the testing dataset\n",
-    "for test in FI:\n",
-    "    vm.tests.run_test(\n",
-    "        \"\".join((test,':champion_vs_challenger')),\n",
-    "        input_grid={\n",
-    "            \"dataset\": [vm_test_ds], \"model\" : [vm_log_model,vm_rf_model]\n",
-    "        },\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this third notebook, you learned how to:\n",
-    "\n",
-    "- [x] Initialize ValidMind model objects\n",
-    "- [x] Assign predictions and probabilities to your ValidMind dataset objects\n",
-    "- [x] Use tests from ValidMind to evaluate the potential of models, including comparative tests between champion and challenger models\n",
-    "- [x] Log an artifact in the ValidMind Platform"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "<a id='toc8_1_'></a>\n",
-    "\n",
-    "### Finalize validation and reporting\n",
-    "\n",
-    "Now that you're familiar with the basics of using the ValidMind Library to run and log validation tests, let's learn how to implement some custom tests and wrap up our validation: **[4 — Finalize validation and reporting](4-finalize_validation_reporting.ipynb)**"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-0b98aebe3459409f848c2c03b413d181",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}
diff --git a/site/notebooks/tutorials/model_validation/4-finalize_validation_reporting.ipynb b/site/notebooks/tutorials/model_validation/4-finalize_validation_reporting.ipynb
deleted file mode 100644
index 854ccde766..0000000000
--- a/site/notebooks/tutorials/model_validation/4-finalize_validation_reporting.ipynb
+++ /dev/null
@@ -1,1233 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# ValidMind for model validation 4 — Finalize testing and reporting\n",
-    "\n",
-    "Learn how to use ValidMind for your end-to-end model validation process with our series of four introductory notebooks. In this last notebook, finalize the compliance assessment process and have a complete validation report ready for review.\n",
-    "\n",
-    "This notebook will walk you through how to supplement ValidMind tests with your own custom tests and include them as additional evidence in your validation report. A custom test is any function that takes a set of inputs and parameters as arguments and returns one or more outputs:\n",
-    "\n",
-    "- The function can be as simple or as complex as you need it to be — it can use external libraries, make API calls, or do anything else that you can do in Python.\n",
-    "- The only requirement is that the function signature and return values can be \"understood\" and handled by the ValidMind Library. As such, custom tests offer added flexibility by extending the default tests provided by ValidMind, enabling you to document any type of model or use case.\n",
-    "\n",
-    "**For a more in-depth introduction to custom tests,** refer to our [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb) notebook.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
-    "<br></br>\n",
-    "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [Prerequisites](#toc1__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_1__)    \n",
-    "  - [Import the sample dataset](#toc2_2__)    \n",
-    "  - [Split the preprocessed dataset](#toc2_3__)    \n",
-    "  - [Import the champion model](#toc2_4__)    \n",
-    "  - [Train potential challenger model](#toc2_5__)    \n",
-    "  - [Initialize the model objects](#toc2_6__)    \n",
-    "- [Implementing custom tests](#toc3__)    \n",
-    "  - [Implement a custom inline test](#toc3_1__)    \n",
-    "    - [Create a confusion matrix plot](#toc3_1_1__)    \n",
-    "    - [Add parameters to custom tests](#toc3_1_2__)    \n",
-    "    - [Pass parameters to custom tests](#toc3_1_3__)    \n",
-    "  - [Use external test providers](#toc3_2__)    \n",
-    "    - [Create custom tests folder](#toc3_2_1__)    \n",
-    "    - [Save an inline test](#toc3_2_2__)    \n",
-    "    - [Register a local test provider](#toc3_2_3__)    \n",
-    "- [Verify test runs](#toc4__)    \n",
-    "- [In summary](#toc5__)    \n",
-    "- [Next steps](#toc6__)    \n",
-    "  - [Work with your validation report](#toc6_1__)    \n",
-    "  - [Learn more](#toc6_2__)    \n",
-    "    - [Use cases](#toc6_2_1__)    \n",
-    "    - [Discover more learning resources](#toc6_2_2__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## Prerequisites\n",
-    "\n",
-    "In order to finalize validation and reporting, you'll need to first have:\n",
-    "\n",
-    "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
-    "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
-    "- [x] Learned how to import and initialize datasets and models for use with ValidMind\n",
-    "- [x] Understood the basics of how to identify and run validation tests\n",
-    "- [x] Run validation tests for your champion and challenger models, and logged the results of those tests to the ValidMind Platform\n",
-    "- [x] Inserted your logged test results into your validation report\n",
-    "- [x] Added some preliminary artifacts (findings) to your validation report\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
-    "<br></br>\n",
-    "Refer to the first three notebooks in this series:\n",
-    "\n",
-    "- <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a>\n",
-    "- <a href=\"2-start_validation_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the model validation process</b></a>\n",
-    "- <a href=\"3-developing_challenger_model.ipynb\" style=\"color: #DE257E;\"><b>3 — Developing a potential challenger model</b></a>\n",
-    "\n",
-    "</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up\n",
-    "\n",
-    "This section should be very familiar to you now — as we performed the same actions in the previous two notebooks in this series."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library\n",
-    "\n",
-    "As usual, let's first connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Make sure the ValidMind Library is installed\n",
-    "\n",
-    "%pip install -q validmind\n",
-    "\n",
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"validation-report\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Import the sample dataset\n",
-    "\n",
-    "Next, we'll load in the same sample [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset used to develop the champion model that we will independently preprocess:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load the sample dataset\n",
-    "from validmind.datasets.classification import customer_churn as demo_dataset\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
-    ")\n",
-    "\n",
-    "raw_df = demo_dataset.load_data()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the raw dataset for use in ValidMind tests\n",
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=raw_df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
-    "\n",
-    "# Create a balanced dataset with the same number of exited and not exited customers\n",
-    "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
-    "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
-    "\n",
-    "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
-    "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let’s also quickly remove highly correlated features from the dataset using the output from a ValidMind test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
-    "vm_balanced_raw_dataset = vm.init_dataset(\n",
-    "    dataset=balanced_raw_df,\n",
-    "    input_id=\"balanced_raw_dataset\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Run HighPearsonCorrelation test with our balanced dataset as input and return a result object\n",
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# From result object, extract table from `corr_result.tables`\n",
-    "features_df = corr_result.tables[0].data\n",
-    "features_df"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract list of features that failed the test\n",
-    "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract feature names from the list of strings\n",
-    "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
-    "high_correlation_features"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Remove the highly correlated features from the dataset\n",
-    "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
-    "\n",
-    "# Re-initialize the dataset object\n",
-    "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
-    "    dataset=balanced_raw_no_age_df,\n",
-    "    input_id=\"raw_dataset_preprocessed\",\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Re-run the test with the reduced feature set\n",
-    "corr_result = vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    params={\"max_threshold\": 0.3},\n",
-    "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Split the preprocessed dataset\n",
-    "\n",
-    "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Encode categorical features in the dataset\n",
-    "balanced_raw_no_age_df = pd.get_dummies(\n",
-    "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
-    ")\n",
-    "balanced_raw_no_age_df.head()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.model_selection import train_test_split\n",
-    "\n",
-    "# Split the dataset into train and test\n",
-    "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
-    "\n",
-    "X_train = train_df.drop(\"Exited\", axis=1)\n",
-    "y_train = train_df[\"Exited\"]\n",
-    "X_test = test_df.drop(\"Exited\", axis=1)\n",
-    "y_test = test_df[\"Exited\"]"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the split datasets\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_dataset_final\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_dataset_final\",\n",
-    "    dataset=test_df,\n",
-    "    target_column=\"Exited\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Import the champion model\n",
-    "\n",
-    "With our raw dataset assessed and preprocessed, let's go ahead and import the champion model submitted by the model development team in the format of a `.pkl` file: **[lr_model_champion.pkl](lr_model_champion.pkl)**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the champion model\n",
-    "import pickle as pkl\n",
-    "\n",
-    "with open(\"lr_model_champion.pkl\", \"rb\") as f:\n",
-    "    log_reg = pkl.load(f)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_5__'></a>\n",
-    "\n",
-    "### Train potential challenger model\n",
-    "\n",
-    "We'll also train our random forest classification challenger model to see how it compares:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the Random Forest Classification model\n",
-    "from sklearn.ensemble import RandomForestClassifier\n",
-    "\n",
-    "# Create the model instance with 50 decision trees\n",
-    "rf_model = RandomForestClassifier(\n",
-    "    n_estimators=50,\n",
-    "    random_state=42,\n",
-    ")\n",
-    "\n",
-    "# Train the model\n",
-    "rf_model.fit(X_train, y_train)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_6__'></a>\n",
-    "\n",
-    "### Initialize the model objects\n",
-    "\n",
-    "In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our two models:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the champion logistic regression model\n",
-    "vm_log_model = vm.init_model(\n",
-    "    log_reg,\n",
-    "    input_id=\"log_model_champion\",\n",
-    ")\n",
-    "\n",
-    "# Initialize the challenger random forest classification model\n",
-    "vm_rf_model = vm.init_model(\n",
-    "    rf_model,\n",
-    "    input_id=\"rf_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Assign predictions to Champion — Logistic regression model\n",
-    "vm_train_ds.assign_predictions(model=vm_log_model)\n",
-    "vm_test_ds.assign_predictions(model=vm_log_model)\n",
-    "\n",
-    "# Assign predictions to Challenger — Random forest classification model\n",
-    "vm_train_ds.assign_predictions(model=vm_rf_model)\n",
-    "vm_test_ds.assign_predictions(model=vm_rf_model)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Implementing custom tests\n",
-    "\n",
-    "Thanks to the model documentation ([Learn more ...](https://docs.validmind.ai/developer/validmind-library.html#for-model-development)), we know that the model development team implemented a custom test to further evaluate the performance of the champion model.\n",
-    "\n",
-    "In a usual model validation situation, you would load a saved custom test provided by the model development team. In the following section, we'll have you implement the same custom test and make it available for reuse, to familiarize you with the processes.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about custom tests?</b></span>\n",
-    "<br></br>\n",
-    "Refer to our in-depth introduction to custom tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/implement_custom_tests.html\" style=\"color: #DE257E;\"><b>Implement custom tests</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Implement a custom inline test\n",
-    "\n",
-    "Let's implement the same custom *inline test* that calculates the confusion matrix for a binary classification model that the model development team used in their performance evaluations.\n",
-    "\n",
-    "- An inline test refers to a test written and executed within the same environment as the code being tested — in this case, right in this Jupyter Notebook — without requiring a separate test file or framework.\n",
-    "- You'll note that the custom test function is just a regular Python function that can include and require any Python library as you see fit."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_1__'></a>\n",
-    "\n",
-    "#### Create a confusion matrix plot\n",
-    "\n",
-    "Let's first create a confusion matrix plot using the `confusion_matrix` function from the `sklearn.metrics` module:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import matplotlib.pyplot as plt\n",
-    "from sklearn import metrics\n",
-    "\n",
-    "# Get the predicted classes\n",
-    "y_pred = log_reg.predict(vm_test_ds.x)\n",
-    "\n",
-    "confusion_matrix = metrics.confusion_matrix(y_test, y_pred)\n",
-    "\n",
-    "cm_display = metrics.ConfusionMatrixDisplay(\n",
-    "    confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
-    ")\n",
-    "cm_display.plot()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Next, create a [`@vm.test` wrapper](https://docs.validmind.ai/validmind/validmind.html#test) that will allow you to create a reusable test. **Note the following changes in the code below:**\n",
-    "\n",
-    "- The function `confusion_matrix` takes two arguments, `dataset` and `model`, which are a `VMDataset` and a `VMModel` object, respectively.\n",
-    "  - `VMDataset` objects allow you to access the dataset's true (target) values by accessing the `.y` attribute.\n",
-    "  - `VMDataset` objects allow you to access the predictions for a given model by accessing the `.y_pred()` method.\n",
-    "- The function docstring provides a description of what the test does. This will be displayed along with the result in this notebook as well as in the ValidMind Platform.\n",
-    "- The function body calculates the confusion matrix using the `sklearn.metrics.confusion_matrix` function as we just did above.\n",
-    "- The function then returns the `ConfusionMatrixDisplay.figure_` object — this is important as the ValidMind Library expects the output of the custom test to be a plot or a table.\n",
-    "- The `@vm.test` decorator is doing the work of creating a wrapper around the function that will allow it to be run by the ValidMind Library. It also registers the test so it can be found by the ID `my_custom_tests.ConfusionMatrix`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
-    "def confusion_matrix(dataset, model):\n",
-    "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
-    "\n",
-    "    The confusion matrix is a 2x2 table that contains 4 values:\n",
-    "\n",
-    "    - True Positive (TP): the number of correct positive predictions\n",
-    "    - True Negative (TN): the number of correct negative predictions\n",
-    "    - False Positive (FP): the number of incorrect positive predictions\n",
-    "    - False Negative (FN): the number of incorrect negative predictions\n",
-    "\n",
-    "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
-    "    \"\"\"\n",
-    "    y_true = dataset.y\n",
-    "    y_pred = dataset.y_pred(model=model)\n",
-    "\n",
-    "    confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
-    "\n",
-    "    cm_display = metrics.ConfusionMatrixDisplay(\n",
-    "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
-    "    )\n",
-    "    cm_display.plot()\n",
-    "\n",
-    "    plt.close()  # close the plot to avoid displaying it\n",
-    "\n",
-    "    return cm_display.figure_  # return the figure object itself"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You can now run the newly created custom test on both the training and test datasets for both models using the [`run_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Champion train and test\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_custom_tests.ConfusionMatrix:champion\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds,vm_test_ds],\n",
-    "        \"model\" : [vm_log_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Challenger train and test\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_custom_tests.ConfusionMatrix:challenger\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds,vm_test_ds],\n",
-    "        \"model\" : [vm_rf_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for some test IDs. </b></span>\n",
-    "<br></br>\n",
-    "That's expected: when we run validation tests, the logged results need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_2__'></a>\n",
-    "\n",
-    "#### Add parameters to custom tests\n",
-    "\n",
-    "Custom tests can take parameters just like any other function. To demonstrate, let's modify the `confusion_matrix` function to take an additional parameter `normalize` that will allow you to normalize the confusion matrix:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
-    "def confusion_matrix(dataset, model, normalize=False):\n",
-    "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
-    "\n",
-    "    The confusion matrix is a 2x2 table that contains 4 values:\n",
-    "\n",
-    "    - True Positive (TP): the number of correct positive predictions\n",
-    "    - True Negative (TN): the number of correct negative predictions\n",
-    "    - False Positive (FP): the number of incorrect positive predictions\n",
-    "    - False Negative (FN): the number of incorrect negative predictions\n",
-    "\n",
-    "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
-    "    \"\"\"\n",
-    "    y_true = dataset.y\n",
-    "    y_pred = dataset.y_pred(model=model)\n",
-    "\n",
-    "    if normalize:\n",
-    "        confusion_matrix = metrics.confusion_matrix(y_true, y_pred, normalize=\"all\")\n",
-    "    else:\n",
-    "        confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
-    "\n",
-    "    cm_display = metrics.ConfusionMatrixDisplay(\n",
-    "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
-    "    )\n",
-    "    cm_display.plot()\n",
-    "\n",
-    "    plt.close()  # close the plot to avoid displaying it\n",
-    "\n",
-    "    return cm_display.figure_  # return the figure object itself"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_3__'></a>\n",
-    "\n",
-    "#### Pass parameters to custom tests\n",
-    "\n",
-    "You can pass parameters to custom tests by providing a dictionary of parameters to the `run_test()` function.\n",
-    "\n",
-    "- The parameters will override any default parameters set in the custom test definition. Note that `dataset` and `model` are still passed as `inputs`.\n",
-    "- Since these are `VMDataset` or `VMModel` inputs, they have a special meaning.\n",
-    "\n",
-    "Re-running and logging the custom confusion matrix with `normalize=True` for both models and our testing dataset looks like this:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Champion with test dataset and normalize=True\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_custom_tests.ConfusionMatrix:test_normalized_champion\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\" : [vm_log_model]\n",
-    "    },\n",
-    "    params={\"normalize\": True}\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Challenger with test dataset and normalize=True\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_custom_tests.ConfusionMatrix:test_normalized_challenger\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\" : [vm_rf_model]\n",
-    "    },\n",
-    "    params={\"normalize\": True}\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Use external test providers\n",
-    "\n",
-    "Sometimes you may want to reuse the same set of custom tests across multiple models and share them with others in your organization, like the model development team would have done with you in this example workflow featured in this series of notebooks. In this case, you can create an external custom *test provider* that will allow you to load custom tests from a local folder or a Git repository.\n",
-    "\n",
-    "In this section you will learn how to declare a local filesystem test provider that allows loading tests from a local folder following these high level steps:\n",
-    "\n",
-    "1. Create a folder of custom tests from existing inline tests (tests that exist in your active Jupyter Notebook)\n",
-    "2. Save an inline test to a file\n",
-    "3. Define and register a [`LocalTestProvider`](https://docs.validmind.ai/validmind/validmind/tests.html#LocalTestProvider) that points to that folder\n",
-    "4. Run test provider tests\n",
-    "5. Add the test results to your documentation"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_1__'></a>\n",
-    "\n",
-    "#### Create custom tests folder\n",
-    "\n",
-    "Let's start by creating a new folder that will contain reusable custom tests from your existing inline tests.\n",
-    "\n",
-    "The following code snippet will create a new `my_tests` directory in the current working directory if it doesn't exist:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "tests_folder = \"my_tests\"\n",
-    "\n",
-    "import os\n",
-    "\n",
-    "# create tests folder\n",
-    "os.makedirs(tests_folder, exist_ok=True)\n",
-    "\n",
-    "# remove existing tests\n",
-    "for f in os.listdir(tests_folder):\n",
-    "    # remove files and pycache\n",
-    "    if f.endswith(\".py\") or f == \"__pycache__\":\n",
-    "        os.system(f\"rm -rf {tests_folder}/{f}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "After running the command above, confirm that a new `my_tests` directory was created successfully. For example:\n",
-    "\n",
-    "```\n",
-    "~/notebooks/tutorials/model_validation/my_tests/\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_2__'></a>\n",
-    "\n",
-    "#### Save an inline test\n",
-    "\n",
-    "The `@vm.test` decorator we used in **Implement a custom inline test** above to register one-off custom tests also includes a convenience method on the function object that allows you to simply call `<func_name>.save()` to save the test to a Python file at a specified path.\n",
-    "\n",
-    "While `save()` will get you started by creating the file and saving the function code with the correct name, it won't automatically include any imports, or other functions or variables, outside of the functions that are needed for the test to run. To solve this, pass in an optional `imports` argument ensuring necessary imports are added to the file.\n",
-    "\n",
-    "The `confusion_matrix` test requires the following additional imports:\n",
-    "\n",
-    "```python\n",
-    "import matplotlib.pyplot as plt\n",
-    "from sklearn import metrics\n",
-    "```\n",
-    "\n",
-    "Let's pass these imports to the `save()` method to ensure they are included in the file with the following command:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "confusion_matrix.save(\n",
-    "    # Save it to the custom tests folder we created\n",
-    "    tests_folder,\n",
-    "    imports=[\"import matplotlib.pyplot as plt\", \"from sklearn import metrics\"],\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "- [x] Confirm that the `save()` method saved the `confusion_matrix` function to a file named `ConfusionMatrix.py` in the `my_tests` folder.\n",
-    "- [x] Note that the new file provides some context on the origin of the test, which is useful for traceability:\n",
-    "\n",
-    "    ```\n",
-    "    # Saved from __main__.confusion_matrix\n",
-    "    # Original Test ID: my_custom_tests.ConfusionMatrix\n",
-    "    # New Test ID: <test_provider_namespace>.ConfusionMatrix\n",
-    "    ```\n",
-    "\n",
-    "- [x] Additionally, the new test function has been stripped of its decorator, as it now resides in a file that will be loaded by the test provider:\n",
-    "\n",
-    "    ```python\n",
-    "    def ConfusionMatrix(dataset, model, normalize=False):\n",
-    "    ```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_3__'></a>\n",
-    "\n",
-    "#### Register a local test provider\n",
-    "\n",
-    "Now that your `my_tests` folder has a sample custom test, let's initialize a test provider that will tell the ValidMind Library where to find your custom tests:\n",
-    "\n",
-    "- ValidMind offers out-of-the-box test providers for local tests (tests in a folder) or a GitHub provider for tests in a GitHub repository.\n",
-    "- You can also create your own test provider by creating a class that has a [`load_test` method](https://docs.validmind.ai/validmind/validmind/tests.html#load_test) that takes a test ID and returns the test function matching that ID.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about test providers?</b></span>\n",
-    "<br></br>\n",
-    "An extended introduction to test providers can be found in: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/integrate_external_test_providers.html\" style=\"color: #DE257E;\"><b>Integrate external test providers</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "##### Initialize a local test provider\n",
-    "\n",
-    "For most use cases, using a `LocalTestProvider` that allows you to load custom tests from a designated directory should be sufficient.\n",
-    "\n",
-    "**The most important attribute for a test provider is its `namespace`.** This is a string that will be used to prefix test IDs in model documentation. This allows you to have multiple test providers with tests that can even share the same ID, but are distinguished by their namespace.\n",
-    "\n",
-    "Let's go ahead and load the custom tests from our `my_tests` directory:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.tests import LocalTestProvider\n",
-    "\n",
-    "# initialize the test provider with the tests folder we created earlier\n",
-    "my_test_provider = LocalTestProvider(tests_folder)\n",
-    "\n",
-    "vm.tests.register_test_provider(\n",
-    "    namespace=\"my_test_provider\",\n",
-    "    test_provider=my_test_provider,\n",
-    ")\n",
-    "# `my_test_provider.load_test()` will be called for any test ID that starts with `my_test_provider`\n",
-    "# e.g. `my_test_provider.ConfusionMatrix` will look for a function named `ConfusionMatrix` in `my_tests/ConfusionMatrix.py` file"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "##### Run test provider tests\n",
-    "\n",
-    "Now that we've set up the test provider, we can run any test that's located in the tests folder by using the `run_test()` method as with any other test:\n",
-    "\n",
-    "- For tests that reside in a test provider directory, the test ID will be the `namespace` specified when registering the provider, followed by the path to the test file relative to the tests folder.\n",
-    "- For example, the Confusion Matrix test we created earlier will have the test ID `my_test_provider.ConfusionMatrix`. You could organize the tests in subfolders, say `classification` and `regression`, and the test ID for the Confusion Matrix test would then be `my_test_provider.classification.ConfusionMatrix`.\n",
-    "\n",
-    "Let's go ahead and re-run the confusion matrix test with our testing dataset for our two models by using the test ID `my_test_provider.ConfusionMatrix`. This should load the test from the test provider and run it as before."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Champion with test dataset and test provider custom test\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_test_provider.ConfusionMatrix:champion\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\" : [vm_log_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Challenger with test dataset  and test provider custom test\n",
-    "vm.tests.run_test(\n",
-    "    test_id=\"my_test_provider.ConfusionMatrix:challenger\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\" : [vm_rf_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Verify test runs\n",
-    "\n",
-    "Our final task is to verify that all the tests provided by the model development team were run and reported accurately. Note the appended `result_ids` to delineate which dataset we ran the test with for the relevant tests.\n",
-    "\n",
-    "Here, we'll specify all the tests we'd like to independently rerun in a dictionary called `test_config`. **Note here that `inputs` and `input_grid` expect the `input_id` of the dataset or model as the value rather than the variable name we specified**:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test_config = {\n",
-    "    # Run with the raw dataset\n",
-    "    'validmind.data_validation.DatasetDescription:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.DescriptiveStatistics:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.MissingValues:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percentage_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.ClassImbalance:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percent_threshold': 10}\n",
-    "    },\n",
-    "    'validmind.data_validation.Duplicates:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.HighCardinality:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {\n",
-    "            'num_threshold': 100,\n",
-    "            'percent_threshold': 0.1,\n",
-    "            'threshold_type': 'percent'\n",
-    "        }\n",
-    "    },\n",
-    "    'validmind.data_validation.Skewness:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'max_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.UniqueRows:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percent_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TooManyZeroValues:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'max_percent_threshold': 0.03}\n",
-    "    },\n",
-    "    'validmind.data_validation.IQROutliersTable:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'threshold': 5}\n",
-    "    },\n",
-    "    # Run with the preprocessed dataset\n",
-    "    'validmind.data_validation.DescriptiveStatistics:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularDescriptionTables:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
-    "    },\n",
-    "    'validmind.data_validation.MissingValues:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'},\n",
-    "        'params': {'min_percentage_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularNumericalHistograms:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularCategoricalBarPlots:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TargetRateBarPlots:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset_preprocessed'},\n",
-    "        'params': {'default_column': 'loan_status'}\n",
-    "    },\n",
-    "    # Run with the training and test datasets\n",
-    "    'validmind.data_validation.DescriptiveStatistics:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularDescriptionTables:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
-    "    },\n",
-    "    'validmind.data_validation.ClassImbalance:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
-    "        'params': {'min_percent_threshold': 10}\n",
-    "    },\n",
-    "    'validmind.data_validation.UniqueRows:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
-    "        'params': {'min_percent_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularNumericalHistograms:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
-    "    },\n",
-    "    'validmind.data_validation.MutualInformation:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
-    "        'params': {'min_threshold': 0.01}\n",
-    "    },\n",
-    "    'validmind.data_validation.PearsonCorrelationMatrix:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
-    "    },\n",
-    "    'validmind.data_validation.HighPearsonCorrelation:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
-    "        'params': {'max_threshold': 0.3, 'top_n_correlations': 10}\n",
-    "    },\n",
-    "    'validmind.model_validation.ModelMetadata': {\n",
-    "        'input_grid': {'model': ['log_model_champion', 'rf_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ModelParameters': {\n",
-    "        'input_grid': {'model': ['log_model_champion', 'rf_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ROCCurve': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final'], 'model': ['log_model_champion']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.MinimumROCAUCScore': {\n",
-    "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final'], 'model': ['log_model_champion']},\n",
-    "        'params': {'min_threshold': 0.5}\n",
-    "    }\n",
-    "}"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Then batch run and log our tests in `test_config`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for t in test_config:\n",
-    "    print(t)\n",
-    "    try:\n",
-    "        # Check if test has input_grid\n",
-    "        if 'input_grid' in test_config[t]:\n",
-    "            # For tests with input_grid, pass the input_grid configuration\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
-    "        else:\n",
-    "            # Original logic for regular inputs\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
-    "    except Exception as e:\n",
-    "        print(f\"Error running test {t}: {str(e)}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## In summary\n",
-    "\n",
-    "In this final notebook, you learned how to:\n",
-    "\n",
-    "- [x] Implement a custom inline test\n",
-    "- [x] Run and log your custom inline tests\n",
-    "- [x] Use external custom test providers\n",
-    "- [x] Run and log tests from your custom test providers\n",
-    "- [x] Re-run tests provided by your model development team to verify that they were run and reported accurately\n",
-    "\n",
-    "With our ValidMind for model validation series of notebooks, you learned how to validate a model end-to-end with the ValidMind Library by running through some common scenarios in a typical model validation setting:\n",
-    "\n",
-    "- Verifying the data quality steps performed by the model development team\n",
-    "- Independently replicating the champion model's results and conducting additional tests to assess performance, stability, and robustness\n",
-    "- Setting up test inputs and a challenger model for comparative analysis\n",
-    "- Running validation tests, analyzing results, and logging artifacts to ValidMind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Next steps"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Work with your validation report\n",
-    "\n",
-    "Now that you've logged all your test results and verified the work done by the model development team, head to the ValidMind Platform to wrap up your validation report. Continue to work on your validation report by:\n",
-    "\n",
-    "- **Inserting additional test results:** Click **Link Evidence to Report** under any section of 2. Validation in your validation report. (Learn more: [Link evidence to reports](https://docs.validmind.ai/guide/model-validation/assess-compliance.html#link-evidence-to-reports))\n",
-    "\n",
-    "- **Making qualitative edits to your test descriptions:** Expand any linked evidence under Validator Evidence and click **See evidence details** to review and edit the ValidMind-generated test descriptions for quality and accuracy. (Learn more: [Preparing validation reports](https://docs.validmind.ai/guide/model-validation/preparing-validation-reports.html#get-started))\n",
-    "\n",
-    "- **Adding more findings:** Click **Link Finding to Report** in any validation report section, then click **+ Create New Finding**. (Learn more: [Add and manage model findings](https://docs.validmind.ai/guide/model-validation/add-manage-model-findings.html))\n",
-    "\n",
-    "- **Adding risk assessment notes:** Click under **Risk Assessment Notes** in any validation report section to access the text editor and content editing toolbar, including an option to generate a draft with AI. Once generated, edit your ValidMind-generated test descriptions to adhere to your organization's requirements. (Learn more: [Work with content blocks](https://docs.validmind.ai/guide/model-documentation/work-with-content-blocks.html#content-editing-toolbar))\n",
-    "\n",
-    "- **Assessing compliance:** Under the Guideline for any validation report section, click **ASSESSMENT** and select the compliance status from the drop-down menu. (Learn more: [Provide compliance assessments](https://docs.validmind.ai/guide/model-validation/assess-compliance.html#provide-compliance-assessments))\n",
-    "\n",
-    "- **Collaborate with other stakeholders:** Use the ValidMind Platform's real-time collaborative features to work seamlessly together with the rest of your organization, including model developers. Propose suggested changes in the model documentation, work with versioned history, and use comments to discuss specific portions of the model documentation. (Learn more: [Collaborate with others](https://docs.validmind.ai/guide/model-documentation/collaborate-with-others.html))\n",
-    "\n",
-    "When your validation report is complete and ready for review, submit it for approval from the same ValidMind Platform where you made your edits and collaborated with the rest of your organization, ensuring transparency and a thorough model validation history. (Learn more: [Submit for approval](https://docs.validmind.ai/guide/model-documentation/submit-for-approval.html))"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Learn more\n",
-    "\n",
-    "Now that you're familiar with the basics, you can explore the following notebooks to get a deeper understanding on how the ValidMind Library assists you in streamlining model validation:"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_1__'></a>\n",
-    "\n",
-    "#### Use cases\n",
-    "\n",
-    "- [Validate an application scorecard model](../../use_cases/model_validation/validate_application_scorecard.ipynb)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_2__'></a>\n",
-    "\n",
-    "#### Discover more learning resources\n",
-    "\n",
-    "Learn more about the ValidMind Library tools we used in this notebook:\n",
-    "\n",
-    "- [Explore tests](../../how_to/tests/explore_tests/explore_tests.ipynb)\n",
-    "- [Run dataset-based tests](../../how_to/tests/run_tests/1_run_dataset_based_tests.ipynb)\n",
-    "- [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb)\n",
-    "- [Integrate external test providers](../../how_to/tests/custom_tests/integrate_external_test_providers.ipynb)\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-8028ef6a3da9409a8eab5aa0cf246c57",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}
diff --git a/site/notebooks/tutorials/model_validation/inserted-class-imbalance-results.png b/site/notebooks/tutorials/model_validation/inserted-class-imbalance-results.png
deleted file mode 100644
index 2efea1a09b..0000000000
Binary files a/site/notebooks/tutorials/model_validation/inserted-class-imbalance-results.png and /dev/null differ
diff --git a/site/notebooks/tutorials/model_validation/link-artifact.png b/site/notebooks/tutorials/model_validation/link-artifact.png
deleted file mode 100644
index 23edc1c9eb..0000000000
Binary files a/site/notebooks/tutorials/model_validation/link-artifact.png and /dev/null differ
diff --git a/site/notebooks/tutorials/model_validation/link-validator-evidence.png b/site/notebooks/tutorials/model_validation/link-validator-evidence.png
deleted file mode 100644
index 660a19cfab..0000000000
Binary files a/site/notebooks/tutorials/model_validation/link-validator-evidence.png and /dev/null differ
diff --git a/site/notebooks/tutorials/validation/1-set_up_validmind_for_validation.ipynb b/site/notebooks/tutorials/validation/1-set_up_validmind_for_validation.ipynb
new file mode 100644
index 0000000000..feda59a354
--- /dev/null
+++ b/site/notebooks/tutorials/validation/1-set_up_validmind_for_validation.ipynb
@@ -0,0 +1,533 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# ValidMind for validation 1 — Set up the ValidMind Library for validation\n",
+        "\n",
+        "Learn how to use ValidMind for your end-to-end validation process based on common scenarios with our series of four introductory notebooks. In this first notebook, set up the ValidMind Library in preparation for validating a champion.\n",
+        "\n",
+        "These notebooks use a binary classification model as an example, but the same principles shown here apply to other record (model) types.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
+        "<br></br>\n",
+        "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
+      ],
+      "id": "821a881e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Introduction](#toc1__)    \n",
+        "- [About ValidMind](#toc2__)    \n",
+        "  - [Before you begin](#toc2_1__)    \n",
+        "  - [New to ValidMind?](#toc2_2__)    \n",
+        "  - [Key concepts](#toc2_3__)    \n",
+        "- [Setting up](#toc3__)    \n",
+        "  - [Register a sample model](#toc3_1__)    \n",
+        "    - [Assign validator credentials](#toc3_1_1__)    \n",
+        "    - [Apply documentation template](#toc3_1_2__)    \n",
+        "    - [Apply validation report template](#toc3_1_3__)    \n",
+        "  - [Install the ValidMind Library](#toc3_2__)    \n",
+        "  - [Initialize the ValidMind Library](#toc3_3__)    \n",
+        "    - [Get your code snippet](#toc3_3_1__)    \n",
+        "- [Getting to know ValidMind](#toc4__)    \n",
+        "  - [Preview the validation report template](#toc4_1__)    \n",
+        "    - [View validation report in the ValidMind Platform](#toc4_1_1__)    \n",
+        "  - [Explore available tests](#toc4_2__)    \n",
+        "- [Upgrade ValidMind](#toc5__)    \n",
+        "- [In summary](#toc6__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Start the validation process](#toc7_1__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "19ea797c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Introduction\n",
+        "\n",
+        "Validation aims to independently assess the compliance of *champions* created by developers with regulatory guidance by conducting thorough testing and analysis, potentially including the use of challengers to benchmark performance. Assessments, presented in the form of a validation report, typically include *artifacts (findings)* and recommendations to address those issues.\n",
+        "\n",
+        "A *binary classification model* is a type of predictive model used in churn analysis to identify customers who are likely to leave a service or subscription by analyzing various behavioral, transactional, and demographic factors.\n",
+        "\n",
+        "- This model helps businesses take proactive measures to retain at-risk customers by offering personalized incentives, improving customer service, or adjusting pricing strategies.\n",
+        "- Effective validation of a churn prediction model ensures that businesses can accurately identify potential churners, optimize retention efforts, and enhance overall customer satisfaction while minimizing revenue loss."
+      ],
+      "id": "d624f88d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate comparison and other validation tests, and then use the ValidMind Platform to submit compliance assessments of champions via comprehensive validation reports. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and developers."
+      ],
+      "id": "4fb1ef5a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ],
+      "id": "594f9fd4"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ],
+      "id": "262ed111"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**validation report**: A validation report is a comprehensive and structured review evaluating a record's accuracy, performance, and suitability for its intended purpose. A report follows established validation guidelines to ensure consistency and adherence to internal and regulatory standards — encompassing the process of risk assessment, identifying areas of potential error or risk within the record's components, supporting transparency, regulatory compliance, and informed decision-making by documenting the validator’s independent review and conclusions.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**validation report template**: A default ValidMind document template that serves as a standardized framework for conducting and documenting validation, including sections designated for attaching test results, evidence, or artifacts (findings). By outlining required documentation, recommended analyses, and expected validation tests, validation report templates ensure consistency and completeness across validation reports and help guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.\n",
+        "\n",
+        "**artifacts (findings)**: Observations or issues identified during validation, including any deviations from expected performance or standards. Artifacts are organized by type — default types provided by ValidMind include Validation Issue, Policy Exception, and Limitation. Custom artifact types can be created to track other categories relevant to your organization.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "0eb67fe9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "e0e1cf3d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Register a sample model\n",
+        "\n",
+        "In a usual lifecycle, a champion will have been independently registered in your inventory and submitted to you for validation by your development team as part of the effective challenge process. (**Learn more:** [Submit documents](https://docs.validmind.ai/guide/documentation/submit-documents.html))\n",
+        "\n",
+        "For this notebook, we'll have you register a dummy record (model) in the ValidMind Platform inventory and assign yourself as the validator to familiarize you with the ValidMind interface and circumvent the need for an existing model:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down — don’t worry, we’ll adjust these permissions next for validation.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ],
+      "id": "609fe59b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_1__'></a>\n",
+        "\n",
+        "#### Assign validator credentials\n",
+        "\n",
+        "In order to log tests as a validator instead of as a developer, on the details page that appears after you've successfully registered your sample model:\n",
+        "\n",
+        "1. Remove yourself as an owner:\n",
+        "\n",
+        "    - Click on the **OWNERS** tile.\n",
+        "    - Click the **x** next to your name to remove yourself from that model's role.\n",
+        "    - Click **Save** to apply your changes to that role.\n",
+        "\n",
+        "2. Remove yourself as a developer:\n",
+        "\n",
+        "    - Click on the **DEVELOPERS** tile.\n",
+        "    - Click the **x** next to your name to remove yourself from that model's role.\n",
+        "    - Click **Save** to apply your changes to that role.\n",
+        "\n",
+        "3. Add yourself as a validator:\n",
+        "\n",
+        "    - Click on the **VALIDATORS** tile.\n",
+        "    - Select your name from the drop-down menu.\n",
+        "    - Click **Save** to apply your changes to that role."
+      ],
+      "id": "58e552bb"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier for developers.\n",
+        "\n",
+        "We'll need this documentation template later for reference as we draft our validation report:\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Documentation**.\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Binary classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "84251589"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_3__'></a>\n",
+        "\n",
+        "#### Apply validation report template\n",
+        "\n",
+        "Next, let's select a validation report template. A template predefines sections for your report and provides a general outline to follow, making the validation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Validation**.\n",
+        "\n",
+        "    If you cannot locate your Validation document, make sure Validation type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Generic Validation Report`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "fdfb5dc5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ],
+      "id": "f656d0d6"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "931d8f7f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ],
+      "id": "1435fd5b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3_1__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "b375b341"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"validation-report\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "d5d87e2d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Getting to know ValidMind"
+      ],
+      "id": "331e1c07"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Preview the validation report template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will attach evidence to this template in the form of risk assessment notes, artifacts, and test results later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library:"
+      ],
+      "id": "f6331a98"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "13d34bbb"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1_1__'></a>\n",
+        "\n",
+        "#### View validation report in the ValidMind Platform\n",
+        "\n",
+        "Next, let's head to the ValidMind Platform to see the template in action:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, navigate to **Inventory** and select the model you registered for this \"ValidMind for validation\" series of notebooks.\n",
+        "\n",
+        "3. Click **Validation** under Documents for your model and note:\n",
+        "\n",
+        "    - [x] The risk assessment compliance summary at the top of the report (screenshot below)\n",
+        "    - [x] How the structure of the validation report reflects the previewed template\n",
+        "\n",
+        "    <img src= \"compliance-summary.png\" alt=\"Screenshot showing the risk assessment compliance summary\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
+        "    <br><br>"
+      ],
+      "id": "20717133"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Explore available tests\n",
+        "\n",
+        "Next, let's explore the list of all available tests in the ValidMind Library with [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) — we'll later narrow down the tests we want to run from this list when we learn to run tests."
+      ],
+      "id": "f5d0aaab"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "de6abc2a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ],
+      "id": "dce47e40"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "10272aa9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ],
+      "id": "7a0c3cc2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for changes to be applied."
+      ],
+      "id": "2dac11d5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this first notebook, you learned how to:\n",
+        "\n",
+        "- [x] Register a record (model) within the ValidMind Platform and assign yourself as the validator\n",
+        "- [x] Install and initialize the ValidMind Library\n",
+        "- [x] Preview the validation report template for your model\n",
+        "- [x] Explore the available tests offered by the ValidMind Library"
+      ],
+      "id": "174d2c8d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Start the validation process\n",
+        "\n",
+        "Now that the ValidMind Library is connected to your model in the ValidMind Platform with the correct template applied, we can go ahead and start the validation process: **[2 — Start the validation process](2-start_validation_process.ipynb)**"
+      ],
+      "id": "d8ffdcf7"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-5d7a1c159e4840fca79011d1c0380725"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
+}
diff --git a/site/notebooks/tutorials/validation/2-start_validation_process.ipynb b/site/notebooks/tutorials/validation/2-start_validation_process.ipynb
new file mode 100644
index 0000000000..a0d4440e6c
--- /dev/null
+++ b/site/notebooks/tutorials/validation/2-start_validation_process.ipynb
@@ -0,0 +1,896 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# ValidMind for validation 2 — Start the validation process\n",
+        "\n",
+        "Learn how to use ValidMind for your end-to-end validation process with our series of four introductory notebooks. In this second notebook, independently verify the data quality tests performed on the dataset used to train the champion.\n",
+        "\n",
+        "You'll learn how to run relevant validation tests with ValidMind, log the results of those tests to the ValidMind Platform, and insert your logged test results as evidence into your validation report. You'll become familiar with the tests available in ValidMind, as well as how to run them. Running tests during validation is crucial to the effective challenge process, as we want to independently evaluate the evidence and assessments provided by the development team.\n",
+        "\n",
+        "While running our tests in this notebook, we'll focus on:\n",
+        "\n",
+        "- Ensuring that data used for training and testing the champion is of appropriate data quality\n",
+        "- Ensuring that the raw data has been preprocessed appropriately and that the resulting final datasets reflect this\n",
+        "\n",
+        "**For a full list of out-of-the-box tests and descriptions,** use the interactive [ValidMind test sandbox](https://docs.validmind.ai/developer/how-to/test-sandbox.html).\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
+        "<br></br>\n",
+        "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Prerequisites](#toc1__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_1__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "- [Verifying data quality adjustments](#toc4__)    \n",
+        "  - [Identify qualitative tests](#toc4_1__)    \n",
+        "  - [Initialize the ValidMind dataset](#toc4_2__)    \n",
+        "  - [Run data quality tests](#toc4_3__)    \n",
+        "    - [Run tabular data tests](#toc4_3_1__)    \n",
+        "  - [Remove highly correlated features](#toc4_4__)    \n",
+        "- [Documenting test results](#toc5__)    \n",
+        "  - [Configure and run comparison tests](#toc5_1__)    \n",
+        "  - [Log tests with unique identifiers](#toc5_2__)    \n",
+        "  - [Add test results to reporting](#toc5_3__)    \n",
+        "- [Preparing the preprocessed dataset](#toc6__)    \n",
+        "  - [Split the preprocessed dataset](#toc6_1__)    \n",
+        "  - [Initialize the split datasets](#toc6_2__)    \n",
+        "- [In summary](#toc7__)    \n",
+        "- [Next steps](#toc8__)    \n",
+        "  - [Develop potential challenger models](#toc8_1__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Prerequisites\n",
+        "\n",
+        "In order to independently assess the quality of your datasets with this notebook, you'll need to first have:\n",
+        "\n",
+        "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
+        "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
+        "<br></br>\n",
+        "Refer to the first notebook in this series: <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library\n",
+        "\n",
+        "First, let's connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Make sure the ValidMind Library is installed\n",
+        "\n",
+        "%pip install -q validmind\n",
+        "\n",
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"validation-report\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "Let's first import the public [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset from Kaggle, which was used to develop the dummy champion.\n",
+        "\n",
+        "We'll use this dataset to review steps that should have been conducted during the initial development and documentation of the champion to ensure that the model was built correctly. By independently performing steps taken by the development team, we can confirm whether the model was built using appropriate and properly processed data.\n",
+        "\n",
+        "In our below example, note that:\n",
+        "\n",
+        "- The target column, `Exited`, has a value of `1` when a customer has churned and `0` otherwise.\n",
+        "- The ValidMind Library provides a wrapper to automatically load the dataset as a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html) object. A Pandas DataFrame is a two-dimensional tabular data structure that makes use of rows and columns."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = demo_dataset.load_data()\n",
+        "raw_df.head()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Verifying data quality adjustments\n",
+        "\n",
+        "Let's say that thanks to the documentation submitted by the development team (**Learn more:** [ValidMind for development](https://docs.validmind.ai/developer/validmind-library.html#development)), we know that the sample dataset was first modified before being used to train the champion. After performing some data quality assessments on the raw dataset, it was determined that the dataset required rebalancing, and highly correlated features were also removed."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Identify qualitative tests\n",
+        "\n",
+        "During validation, we use the same data processing logic and training procedure to confirm that the model's results can be reproduced independently, so let's start by doing some data quality assessments by running a few individual tests just like the development team did.\n",
+        "\n",
+        "Use the [`vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) introduced by the first notebook in this series in combination with [`vm.tests.list_tags()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tags) and [`vm.tests.list_tasks()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks) to find which prebuilt tests are relevant for data quality assessment:\n",
+        "\n",
+        "- **`tasks`** represent the kind of modeling task associated with a test. Here we'll focus on `classification` tasks.\n",
+        "- **`tags`** are free-form descriptions providing more details about the test, for example, what category the test falls into. Here we'll focus on the `data_quality` tag."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Get the list of available task types\n",
+        "sorted(vm.tests.list_tasks())"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Get the list of available tags\n",
+        "sorted(vm.tests.list_tags())"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You can pass `tags` and `task` as parameters to the `vm.tests.list_tests()` function to filter the tests based on the tags and task types.\n",
+        "\n",
+        "For example, to find tests related to tabular data quality for classification models, you can call `list_tests()` like this:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.tests.list_tests(task=\"classification\", tags=[\"tabular_data\", \"data_quality\"])"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about navigating ValidMind tests?</b></span>\n",
+        "<br></br>\n",
+        "Refer to our notebook outlining the utilities available for viewing and understanding available ValidMind tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind dataset\n",
+        "\n",
+        "With the individual tests we want to run identified, the next step is to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
+        "\n",
+        "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
+        "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# vm_raw_dataset is now a VMDataset object that you can pass to any ValidMind test\n",
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=raw_df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Run data quality tests\n",
+        "\n",
+        "Now that we know how to initialize a ValidMind `dataset` object, we're ready to run some tests!\n",
+        "\n",
+        "You run individual tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module. For the examples below, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`test_id`** — The ID of the test to run, as seen in the `ID` column when you run `list_tests`. \n",
+        "- **`params`** — A dictionary of parameters for the test. These will override any `default_params` set in the test definition. "
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3_1__'></a>\n",
+        "\n",
+        "#### Run tabular data tests\n",
+        "\n",
+        "The inputs expected by a test can also be found in the test definition — let's take `validmind.data_validation.DescriptiveStatistics` as an example.\n",
+        "\n",
+        "Note that the output of the [`describe_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#describe_test) below shows that this test expects a `dataset` as input:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.tests.describe_test(\"validmind.data_validation.DescriptiveStatistics\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now, let's run a few tests to assess the quality of the dataset:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "result2 = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.ClassImbalance\",\n",
+        "    inputs={\"dataset\": vm_raw_dataset},\n",
+        "    params={\"min_percent_threshold\": 30},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "The output above shows that the `validmind.data_validation.ClassImbalance` test did not pass according to the value we set for `min_percent_threshold` — great, this matches what was reported by the development team.\n",
+        "\n",
+        "To address this issue, we'll re-run the test on some processed data. In this case let's apply a very simple rebalancing technique to the dataset:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
+        "\n",
+        "# Create a balanced dataset with the same number of exited and not exited customers\n",
+        "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
+        "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
+        "\n",
+        "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
+        "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "With this new balanced dataset, you can re-run the individual test to see if it now passes the class imbalance test requirement.\n",
+        "\n",
+        "As this is technically a different dataset, **remember to first initialize a new ValidMind `Dataset` object** to pass in as input as required by `run_test()`:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
+        "vm_balanced_raw_dataset = vm.init_dataset(\n",
+        "    dataset=balanced_raw_df,\n",
+        "    input_id=\"balanced_raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Pass the initialized `balanced_raw_dataset` as input into the test run\n",
+        "result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.ClassImbalance\",\n",
+        "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
+        "    params={\"min_percent_threshold\": 30},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4__'></a>\n",
+        "\n",
+        "### Remove highly correlated features\n",
+        "\n",
+        "Next, let's also remove highly correlated features from our dataset as outlined by the development team. Removing highly correlated features helps make the model simpler, more stable, and easier to understand.\n",
+        "\n",
+        "You can utilize the output from a ValidMind test for further use — in this below example, to retrieve the list of features with the highest correlation coefficients and use them to reduce the final list of features for modeling.\n",
+        "\n",
+        "First, we'll run `validmind.data_validation.HighPearsonCorrelation` with the `balanced_raw_dataset` we initialized previously as input, unchanged, for comparison with later runs:\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "The output above shows that the test did not pass according to the value we set for `max_threshold` — as reported and expected.\n",
+        "\n",
+        "`corr_result` is an object of type `TestResult`. We can inspect the result object to see what the test has produced:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "print(type(corr_result))\n",
+        "print(\"Result ID: \", corr_result.result_id)\n",
+        "print(\"Params: \", corr_result.params)\n",
+        "print(\"Passed: \", corr_result.passed)\n",
+        "print(\"Tables: \", corr_result.tables)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's remove the highly correlated features and create a new VM `dataset` object.\n",
+        "\n",
+        "We'll begin by checking out the table in the result and extracting a list of features that failed the test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract table from `corr_result.tables`\n",
+        "features_df = corr_result.tables[0].data\n",
+        "features_df"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract list of features that failed the test\n",
+        "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Next, extract the feature names from the list of strings (example: `(Age, Exited)` > `Age`):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now, it's time to re-initialize the dataset with the highly correlated features removed.\n",
+        "\n",
+        "**Note the use of a different `input_id`.** This allows tracking the inputs used when running each individual test."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Remove the highly correlated features from the dataset\n",
+        "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
+        "\n",
+        "# Re-initialize the dataset object\n",
+        "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
+        "    dataset=balanced_raw_no_age_df,\n",
+        "    input_id=\"raw_dataset_preprocessed\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Re-running the test with the reduced feature set should pass the test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You can also plot the correlation matrix to visualize the new correlation between features:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.PearsonCorrelationMatrix\",\n",
+        "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Documenting test results\n",
+        "\n",
+        "Now that we've done some analysis on two different datasets, we can use ValidMind to easily document why certain things were done to our raw data with testing to support it. Every test result returned by the `run_test()` function has a `.log()` method that can be used to send the test results to the ValidMind Platform.\n",
+        "\n",
+        "When logging validation test results to the platform, you'll need to manually add those results to the desired section of the validation report. To demonstrate how to add test results to your validation report, we'll log our data quality tests and insert the results via the ValidMind Platform."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Configure and run comparison tests\n",
+        "\n",
+        "Below, we'll perform comparison tests between the original raw dataset (`raw_dataset`) and the final preprocessed (`raw_dataset_preprocessed`) dataset, again logging the results to the ValidMind Platform. \n",
+        "\n",
+        "We can specify all the tests we'd like to run in a dictionary called `test_config`, and we'll pass in the following arguments for each test:\n",
+        "\n",
+        "  - **`params`:** Individual test parameters.\n",
+        "  - **`input_grid`:** Individual test inputs to compare. In this case, we'll input our two datasets for comparison.\n",
+        "\n",
+        "**Note here that the `input_grid` expects the `input_id` of the dataset as the value rather than the variable name we specified:**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Individual test config with inputs specified\n",
+        "test_config = {\n",
+        "    \"validmind.data_validation.ClassImbalance\": {\n",
+        "        \"input_grid\": {\"dataset\": [\"raw_dataset\", \"raw_dataset_preprocessed\"]},\n",
+        "        \"params\": {\"min_percent_threshold\": 30}\n",
+        "    },\n",
+        "    \"validmind.data_validation.HighPearsonCorrelation\": {\n",
+        "        \"input_grid\": {\"dataset\": [\"raw_dataset\", \"raw_dataset_preprocessed\"]},\n",
+        "        \"params\": {\"max_threshold\": 0.3}\n",
+        "    },\n",
+        "}"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Then batch run and log our tests in `test_config`:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "for t in test_config:\n",
+        "    print(t)\n",
+        "    try:\n",
+        "        # Check if test has input_grid\n",
+        "        if 'input_grid' in test_config[t]:\n",
+        "            # For tests with input_grid, pass the input_grid configuration\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
+        "        else:\n",
+        "            # Original logic for regular inputs\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
+        "    except Exception as e:\n",
+        "        print(f\"Error running test {t}: {str(e)}\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for some test IDs. </b></span>\n",
+        "<br></br>\n",
+        "That's expected, as when we run validation tests the logged results need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Log tests with unique identifiers\n",
+        "\n",
+        "Next, we'll use the previously initialized `vm_balanced_raw_dataset` (that still has a highly correlated `Age` column) as input to run an individual test, then log the result to the ValidMind Platform.\n",
+        "\n",
+        "When running individual tests, **you can use a custom `result_id` to tag the individual result with a unique identifier:**\n",
+        "\n",
+        "- This `result_id` can be appended to `test_id` with a `:` separator.\n",
+        "- The `balanced_raw_dataset` result identifier will correspond to the `balanced_raw_dataset` input, the dataset that still has the `Age` column."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation:balanced_raw_dataset\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
+        ")\n",
+        "result.log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_3__'></a>\n",
+        "\n",
+        "### Add test results to reporting\n",
+        "\n",
+        "With some test results logged, let's head to the model we connected to at the beginning of this notebook and learn how to insert a test result into our validation report. (**Learn more:** [Assess compliance](https://docs.validmind.ai/guide/validation/assess-compliance.html#link-validator-evidence))\n",
+        "\n",
+        "While the example below focuses on a specific test result, you can follow the same general procedure for your other results:\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
+        "\n",
+        "3. Click on **2.2.1. Data Quality** to expand that section.\n",
+        "\n",
+        "4. Under the Class Imbalance Assessment guideline, click **Evidence** to expand the evidence panel.\n",
+        "\n",
+        "5. Click **Link Evidence**, then select **Validator Evidence**.\n",
+        "\n",
+        "6. Select the Class Imbalance test results we logged: **ValidMind Data Validation Class Imbalance**\n",
+        "\n",
+        "    <img src= \"selecting-class-imbalance-results.png\" alt=\"Screenshot showing the ClassImbalance test selected\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
+        "    <br><br>\n",
+        "\n",
+        "7. Click **Update Linked Evidence** to add the test results to the validation report.\n",
+        "\n",
+        "8. Confirm that the results for the Class Imbalance test you inserted have been correctly inserted into section **2.2.1. Data Quality** of the report.\n",
+        "\n",
+        "    - Note that these test results are flagged as **Requires Attention** — as they include comparative results from our initial raw dataset.\n",
+        "    - Click **See evidence details** to review the LLM-generated description that summarizes the test results, which confirm that our final preprocessed dataset actually passes our test:\n",
+        "\n",
+        "    <img src= \"class-imbalance-results-detail.png\" alt=\"Screenshot showing the ClassImbalance test generated description in the text editor\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
+        "    <br><br>\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>    Here in this text editor, you can make qualitative edits to the draft that ValidMind generated to finalize the test results.</b></span>\n",
+        "<br></br>\n",
+        "Learn more: <a href=\"https://docs.validmind.ai/guide/documentation/work-with-content-blocks.html\" style=\"color: #DE257E;\"><b>Work with content blocks</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Preparing the preprocessed dataset"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Split the preprocessed dataset\n",
+        "\n",
+        "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing.\n",
+        "\n",
+        "To start, let's grab the first few rows from the `balanced_raw_no_age_df` dataset we initialized earlier:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "balanced_raw_no_age_df.head()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Before training the model, we need to encode the categorical features in the dataset:\n",
+        "\n",
+        "- Use the `get_dummies()` function from `pandas` to one-hot encode the categorical features.\n",
+        "- The categorical features in the dataset are `Geography` and `Gender`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "balanced_raw_no_age_df = pd.get_dummies(\n",
+        "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
+        ")\n",
+        "balanced_raw_no_age_df.head()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Splitting our dataset into training and testing is essential for proper validation testing, as this helps assess how well the model generalizes to unseen data:\n",
+        "\n",
+        "- We start by dividing our `balanced_raw_no_age_df` dataset into training and test subsets using `train_test_split`, with 80% of the data allocated to training (`train_df`) and 20% to testing (`test_df`).\n",
+        "- From each subset, we separate the features (all columns except \"Exited\") into `X_train` and `X_test`, and the target column (\"Exited\") into `y_train` and `y_test`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from sklearn.model_selection import train_test_split\n",
+        "\n",
+        "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
+        "\n",
+        "X_train = train_df.drop(\"Exited\", axis=1)\n",
+        "y_train = train_df[\"Exited\"]\n",
+        "X_test = test_df.drop(\"Exited\", axis=1)\n",
+        "y_test = test_df[\"Exited\"]"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Initialize the split datasets\n",
+        "\n",
+        "Next, let's initialize the training and testing datasets so they are available for use:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset_final\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset_final\",\n",
+        "    dataset=test_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this second notebook, you learned how to:\n",
+        "\n",
+        "- [x] Import a sample dataset\n",
+        "- [x] Identify which tests you might want to run with ValidMind\n",
+        "- [x] Initialize ValidMind datasets\n",
+        "- [x] Run individual tests\n",
+        "- [x] Utilize the output from tests you’ve run\n",
+        "- [x] Log test results as evidence to the ValidMind Platform\n",
+        "- [x] Insert test results into your validation report"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "<a id='toc8_1__'></a>\n",
+        "\n",
+        "### Develop potential challenger models\n",
+        "\n",
+        "Now that you're familiar with the basics of using the ValidMind Library, let's use it to develop a challenger model: **[3 — Developing a potential challenger](3-developing_potential_challenger.ipynb)**"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-5715327492f24f8fadeab186aecb10ba",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
+}
diff --git a/site/notebooks/tutorials/validation/3-developing_potential_challenger.ipynb b/site/notebooks/tutorials/validation/3-developing_potential_challenger.ipynb
new file mode 100644
index 0000000000..2ed29a195f
--- /dev/null
+++ b/site/notebooks/tutorials/validation/3-developing_potential_challenger.ipynb
@@ -0,0 +1,889 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# ValidMind for validation 3 — Developing a potential challenger\n",
+        "\n",
+        "Learn how to use ValidMind for your end-to-end validation process with our series of four introductory notebooks. In this third notebook, develop a potential challenger and then pass your challenger and its predictions to ValidMind.\n",
+        "\n",
+        "A *challenger* is an alternate record (model) that attempts to outperform the champion, ensuring that the best performing fit-for-purpose record is always considered for deployment. Challengers also help avoid over-reliance on a single record, and allow testing of new features, algorithms, or data sources without disrupting the production lifecycle.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
+        "<br></br>\n",
+        "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Prerequisites](#toc1__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_1__)    \n",
+        "  - [Import the sample dataset](#toc2_2__)    \n",
+        "    - [Preprocess the dataset](#toc2_2_1__)    \n",
+        "  - [Split the preprocessed dataset](#toc2_3__)    \n",
+        "- [Import the champion model](#toc3__)    \n",
+        "- [Training a potential challenger model](#toc4__)    \n",
+        "  - [Random forest classification model](#toc4_1__)    \n",
+        "  - [Initialize the ValidMind models](#toc4_2__)    \n",
+        "  - [Assign predictions](#toc4_3__)    \n",
+        "- [Running model evaluation tests](#toc5__)    \n",
+        "  - [Run model performance tests](#toc5_1__)    \n",
+        "    - [Evaluate performance of the champion model](#toc5_1_1__)    \n",
+        "    - [Log an artifact](#toc5_1_2__)    \n",
+        "    - [Evaluate performance of challenger model](#toc5_1_3__)    \n",
+        "  - [Run diagnostic tests](#toc5_2__)    \n",
+        "  - [Run feature importance tests](#toc5_3__)    \n",
+        "- [In summary](#toc6__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Finalize validation and reporting](#toc7_1__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Prerequisites\n",
+        "\n",
+        "In order to develop potential challengers with this notebook, you'll need to first have:\n",
+        "\n",
+        "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
+        "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
+        "- [x] Learned how to import and initialize datasets for use with ValidMind\n",
+        "- [x] Understood the basics of how to run and log tests with ValidMind\n",
+        "- [x] Run data quality tests on the datasets used to train the champion, and logged the results of those tests to ValidMind\n",
+        "- [x] Inserted your logged test results into your validation report\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
+        "<br></br>\n",
+        "Refer to the first two notebooks in this series:\n",
+        "\n",
+        "- <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a>\n",
+        "- <a href=\"2-start_validation_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the validation process</b></a>\n",
+        "\n",
+        "</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up\n",
+        "\n",
+        "This section should be quite familiar to you — as we performed the same actions in the previous notebook, **[2 — Start the validation process](2-start_validation_process.ipynb)**."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library\n",
+        "\n",
+        "As usual, let's first connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Make sure the ValidMind Library is installed\n",
+        "\n",
+        "%pip install -q validmind\n",
+        "\n",
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"validation-report\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Import the sample dataset\n",
+        "\n",
+        "Next, we'll load in the sample [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset used to develop the champion that we will independently preprocess:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Load the sample dataset\n",
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = demo_dataset.load_data()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Preprocess the dataset\n",
+        "\n",
+        "We’ll apply a simple rebalancing technique to the dataset before continuing:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
+        "\n",
+        "# Create a balanced dataset with the same number of exited and not exited customers\n",
+        "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
+        "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
+        "\n",
+        "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
+        "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let’s also quickly remove highly correlated features from the dataset using the output from a ValidMind test.\n",
+        "\n",
+        "As you know, before we can run tests you’ll need to initialize a ValidMind dataset object with the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
+        "vm_balanced_raw_dataset = vm.init_dataset(\n",
+        "    dataset=balanced_raw_df,\n",
+        "    input_id=\"balanced_raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "With our balanced dataset initialized, we can then run our test and utilize the output to help us identify the features we want to remove:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Run HighPearsonCorrelation test with our balanced dataset as input and return a result object\n",
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# From result object, extract table from `corr_result.tables`\n",
+        "features_df = corr_result.tables[0].data\n",
+        "features_df"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract list of features that failed the test\n",
+        "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract feature names from the list of strings\n",
+        "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We can then re-initialize the dataset with a different `input_id` and the highly correlated features removed and re-run the test for confirmation:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Remove the highly correlated features from the dataset\n",
+        "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
+        "\n",
+        "# Re-initialize the dataset object\n",
+        "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
+        "    dataset=balanced_raw_no_age_df,\n",
+        "    input_id=\"raw_dataset_preprocessed\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Re-run the test with the reduced feature set\n",
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Split the preprocessed dataset\n",
+        "\n",
+        "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Encode categorical features in the dataset\n",
+        "balanced_raw_no_age_df = pd.get_dummies(\n",
+        "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
+        ")\n",
+        "balanced_raw_no_age_df.head()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from sklearn.model_selection import train_test_split\n",
+        "\n",
+        "# Split the dataset into train and test\n",
+        "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
+        "\n",
+        "X_train = train_df.drop(\"Exited\", axis=1)\n",
+        "y_train = train_df[\"Exited\"]\n",
+        "X_test = test_df.drop(\"Exited\", axis=1)\n",
+        "y_test = test_df[\"Exited\"]"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the split datasets\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset_final\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset_final\",\n",
+        "    dataset=test_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Import the champion model\n",
+        "\n",
+        "With our raw dataset assessed and preprocessed, let's go ahead and import the champion submitted by the development team in the format of a `.pkl` file: **[lr_model_champion.pkl](lr_model_champion.pkl)**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Import the champion model\n",
+        "import pickle as pkl\n",
+        "\n",
+        "with open(\"lr_model_champion.pkl\", \"rb\") as f:\n",
+        "    log_reg = pkl.load(f)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Training a potential challenger model\n",
+        "\n",
+        "We're curious how an alternate model compares to our champion, so let's train a challenger as a basis for our testing.\n",
+        "\n",
+        "Our champion *logistic regression model* is a simpler, parametric model that assumes a linear relationship between the independent variables and the log-odds of the outcome. While logistic regression may not capture complex patterns as effectively, it offers a high degree of interpretability and is easier to explain to stakeholders. However, risk is not calculated in isolation from a single factor, but rather in consideration with trade-offs in predictive performance, ease of interpretability, and overall alignment with business objectives."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Random forest classification model\n",
+        "\n",
+        "A *random forest classification model* is an ensemble machine learning algorithm that uses multiple decision trees to classify data. In ensemble learning, multiple models are combined to improve prediction accuracy and robustness.\n",
+        "\n",
+        "Random forest classification models generally have higher accuracy because they capture complex, non-linear relationships, but as a result they lack transparency in their predictions."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Import the Random Forest Classification model\n",
+        "from sklearn.ensemble import RandomForestClassifier\n",
+        "\n",
+        "# Create the model instance with 50 decision trees\n",
+        "rf_model = RandomForestClassifier(\n",
+        "    n_estimators=50,\n",
+        "    random_state=42,\n",
+        ")\n",
+        "\n",
+        "# Train the model\n",
+        "rf_model.fit(X_train, y_train)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind models\n",
+        "\n",
+        "In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our two models.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model objects with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the champion logistic regression model\n",
+        "vm_log_model = vm.init_model(\n",
+        "    log_reg,\n",
+        "    input_id=\"log_model_champion\",\n",
+        ")\n",
+        "\n",
+        "# Initialize the challenger random forest classification model\n",
+        "vm_rf_model = vm.init_model(\n",
+        "    rf_model,\n",
+        "    input_id=\"rf_model\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Assign predictions\n",
+        "\n",
+        "With our models registered, we'll move on to assigning both the predictive probabilities coming directly from each model's predictions, and the binary prediction after applying the cutoff threshold described in the Compute binary predictions step above.\n",
+        "\n",
+        "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
+        "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets.\n",
+        "\n",
+        "If no prediction values are passed, the method will compute predictions automatically:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Champion — Logistic regression model\n",
+        "vm_train_ds.assign_predictions(model=vm_log_model)\n",
+        "vm_test_ds.assign_predictions(model=vm_log_model)\n",
+        "\n",
+        "# Challenger — Random forest classification model\n",
+        "vm_train_ds.assign_predictions(model=vm_rf_model)\n",
+        "vm_test_ds.assign_predictions(model=vm_rf_model)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Running model evaluation tests\n",
+        "\n",
+        "With our setup complete, let's run the rest of our validation tests. Since we have already verified the data quality of the dataset used to train our champion, we will now focus on comprehensive performance evaluations of both the champion and challenger models."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Run model performance tests\n",
+        "\n",
+        "Let's run some performance tests, beginning with independent testing of our champion logistic regression model, then moving on to our potential challenger model.\n",
+        "\n",
+        "Use [`vm.tests.list_tests()`](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to identify all the model performance tests for classification:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "\n",
+        "vm.tests.list_tests(tags=[\"model_performance\"], task=\"classification\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We'll isolate the specific tests we want to run in `mpt`:\n",
+        "\n",
+        "- `model_validation.sklearn.ClassifierPerformance`\n",
+        "- `model_validation.sklearn.ConfusionMatrix`\n",
+        "- `model_validation.sklearn.MinimumAccuracy`\n",
+        "- `model_validation.sklearn.MinimumF1Score`\n",
+        "- `model_validation.sklearn.ROCCurve`\n",
+        "\n",
+        "As we learned in the previous notebook [2 — Start the model validation process](2-start_validation_process.ipynb), you can use a custom `result_id` to tag the individual result with a unique identifier by appending this `result_id` to the `test_id` with a `:` separator. We'll append an identifier for our champion model here:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "mpt = [\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:logreg_champion\",\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix:logreg_champion\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy:logreg_champion\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score:logreg_champion\",\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve:logreg_champion\"\n",
+        "]"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_1__'></a>\n",
+        "\n",
+        "#### Evaluate performance of the champion model\n",
+        "\n",
+        "Now, let's run and log our batch of model performance tests using our testing dataset (`vm_test_ds`) for our champion model:\n",
+        "\n",
+        "- The test set serves as a proxy for real-world data, providing an unbiased estimate of model performance since it was not used during training or tuning.\n",
+        "- The test set also acts as protection against selection bias and model tweaking, giving a final, more unbiased checkpoint."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "for test in mpt:\n",
+        "    vm.tests.run_test(\n",
+        "        test,\n",
+        "        inputs={\n",
+        "            \"dataset\": vm_test_ds, \"model\" : vm_log_model,\n",
+        "        },\n",
+        "    ).log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for some test IDs. </b></span>\n",
+        "<br></br>\n",
+        "That's expected, as when we run validation tests, the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_2__'></a>\n",
+        "\n",
+        "#### Log an artifact\n",
+        "\n",
+        "As we can observe from the output above, our champion doesn't pass the `MinimumAccuracy` test based on its default out-of-the-box thresholds, so let's log an artifact (finding) in the ValidMind Platform (**Learn more:** [Add and manage artifacts](https://docs.validmind.ai/guide/validation/add-manage-artifacts.html)):\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
+        "\n",
+        "3. Click on **2.2.2. Model Performance** to expand that section.\n",
+        "\n",
+        "4. Under the Model Performance Metrics guideline, click to expand the **Artifacts** panel.\n",
+        "\n",
+        "5. Click **Link Artifact** and select **Validation Issue** as the type of artifact.\n",
+        "\n",
+        "6. Click **+ Add Validation Issue** and enter in the details for your validation issue, for example:\n",
+        "\n",
+        "    - **TITLE** — Champion Logistic Regression Model Fails Minimum Accuracy Threshold\n",
+        "    - **RISK AREA** — Model Performance\n",
+        "    - **DOCUMENTATION SECTION** — 3.2. Model Evaluation\n",
+        "    - **DESCRIPTION** — The logistic regression champion model was subjected to a Minimum Accuracy test to determine whether its predictive accuracy meets the predefined performance threshold of 0.7. The model achieved an accuracy score of 0.6136, which falls below the required minimum. As a result, the test produced a Fail outcome.\n",
+        "\n",
+        "7. Click **Add Validation Issue** to submit the validation issue.\n",
+        "\n",
+        "8. Select the validation issue you just added to link to your validation report.\n",
+        "\n",
+        "9. Click **Update Linked Artifacts** to insert your validation issue.\n",
+        "\n",
+        "10. Confirm that the validation issue you inserted has been correctly inserted into section 2.2.2. Model Performance of the report.\n",
+        "\n",
+        "11. Click on the validation issue to expand the issue, where you can adjust details such as severity, owner, due date, status, etc. as well as include proposed remediation plans or supporting documentation as attachments."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1_3__'></a>\n",
+        "\n",
+        "#### Evaluate performance of challenger model\n",
+        "\n",
+        "We've now conducted similar tests as the development team for our champion, with the aim of verifying their test results.\n",
+        "\n",
+        "Next, let's see how our challenger compares. We'll use the same batch of tests here as we did in `mpt`, but append a different `result_id` to indicate that these results should be associated with our challenger:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "mpt_chall = [\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:champion_vs_challenger\",\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix:champion_vs_challenger\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy:champion_vs_challenger\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score:champion_vs_challenger\",\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve:champion_vs_challenger\"\n",
+        "]"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We'll run each test once for each model with the same `vm_test_ds` dataset to compare them:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "for test in mpt_chall:\n",
+        "    vm.tests.run_test(\n",
+        "        test,\n",
+        "        input_grid={\n",
+        "            \"dataset\": [vm_test_ds], \"model\" : [vm_log_model,vm_rf_model]\n",
+        "        }\n",
+        "    ).log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Based on the performance metrics, our challenger random forest classification model passes the <code>MinimumAccuracy</code> where our champion did not.</b></span>\n",
+        "<br></br>\n",
+        "In your validation report, support your recommendation in your validation issue's <b>Proposed Remediation Plan</b> to investigate the usage of our challenger by inserting the performance tests we logged with this notebook into the appropriate section.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Run diagnostic tests\n",
+        "\n",
+        "Next, we want to inspect the robustness and stability testing comparison between our champion and challenger.\n",
+        "\n",
+        "Use `list_tests()` to list all available diagnosis tests applicable to classification tasks:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.tests.list_tests(tags=[\"model_diagnosis\"], task=\"classification\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's now assess the models for potential signs of *overfitting* and identify any sub-segments where performance may be inconsistent with the `model_validation.sklearn.OverfitDiagnosis` test.\n",
+        "\n",
+        "Overfitting occurs when a model learns the training data too well, capturing not only the true pattern but also noise and random fluctuations, resulting in excellent performance on the training dataset but poor generalization to new, unseen data:\n",
+        "\n",
+        "- Since the training dataset (`vm_train_ds`) was used to fit the model, we use this set to establish a baseline performance for how well the model performs on data it has already seen.\n",
+        "- The testing dataset (`vm_test_ds`) was never seen during training, and here simulates real-world generalization, or how well the model performs on new, unseen data. "
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.model_validation.sklearn.OverfitDiagnosis:champion_vs_challenger\",\n",
+        "    input_grid={\n",
+        "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
+        "        \"model\" : [vm_log_model,vm_rf_model]\n",
+        "    }\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's also conduct *robustness* and *stability* testing of the two models with the `model_validation.sklearn.RobustnessDiagnosis` test.\n",
+        "\n",
+        "Robustness refers to a model's ability to maintain consistent performance, and stability refers to a model's ability to produce consistent outputs over time across different data subsets.\n",
+        "\n",
+        "Again, we'll use both the training and testing datasets to establish baseline performance and to simulate real-world generalization:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.model_validation.sklearn.RobustnessDiagnosis:Champion_vs_LogRegression\",\n",
+        "    input_grid={\n",
+        "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
+        "        \"model\" : [vm_log_model,vm_rf_model]\n",
+        "    },\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_3__'></a>\n",
+        "\n",
+        "### Run feature importance tests\n",
+        "\n",
+        "We also want to verify the relative influence of different input features on our models' predictions, as well as inspect the differences between our champion and challenger to see if a certain model offers more understandable or logical importance scores for features.\n",
+        "\n",
+        "Use `list_tests()` to identify all the feature importance tests for classification:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Store the feature importance tests\n",
+        "FI = vm.tests.list_tests(tags=[\"feature_importance\"], task=\"classification\",pretty=False)\n",
+        "FI"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "We'll only use our testing dataset (`vm_test_ds`) here, to provide a realistic, unseen sample that mimics future or production data, as the training dataset has already influenced our model during learning:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Run and log our feature importance tests for both models for the testing dataset\n",
+        "for test in FI:\n",
+        "    vm.tests.run_test(\n",
+        "        \"\".join((test,':champion_vs_challenger')),\n",
+        "        input_grid={\n",
+        "            \"dataset\": [vm_test_ds], \"model\" : [vm_log_model,vm_rf_model]\n",
+        "        },\n",
+        "    ).log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this third notebook, you learned how to:\n",
+        "\n",
+        "- [x] Initialize ValidMind model objects\n",
+        "- [x] Assign predictions and probabilities to your ValidMind model objects\n",
+        "- [x] Use tests from ValidMind to evaluate the potential of models, including comparative tests between champion and challengers\n",
+        "- [x] Log an artifact in the ValidMind Platform"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Finalize validation and reporting\n",
+        "\n",
+        "Now that you're familiar with the basics of using the ValidMind Library to run and log validation tests, let's learn how to implement some custom tests and wrap up our validation: **[4 — Finalize validation and reporting](4-finalize_validation_reporting.ipynb)**"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-910d55973ae44bb1a1cd609d39ae5ca8",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
+}
diff --git a/site/notebooks/tutorials/validation/4-finalize_validation_reporting.ipynb b/site/notebooks/tutorials/validation/4-finalize_validation_reporting.ipynb
new file mode 100644
index 0000000000..32d46c6e2d
--- /dev/null
+++ b/site/notebooks/tutorials/validation/4-finalize_validation_reporting.ipynb
@@ -0,0 +1,1235 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# ValidMind for validation 4 — Finalize testing and reporting\n",
+        "\n",
+        "Learn how to use ValidMind for your end-to-end validation process with our series of four introductory notebooks. In this last notebook, finalize the compliance assessment process and have a complete validation report ready for review.\n",
+        "\n",
+        "This notebook will walk you through how to supplement ValidMind tests with your own custom tests and include them as additional evidence in your validation report. A custom test is any function that takes a set of inputs and parameters as arguments and returns one or more outputs:\n",
+        "\n",
+        "- The function can be as simple or as complex as you need it to be — it can use external libraries, make API calls, or do anything else that you can do in Python.\n",
+        "- The only requirement is that the function signature and return values can be \"understood\" and handled by the ValidMind Library. As such, custom tests offer added flexibility by extending the default tests provided by ValidMind, enabling you to document any type of record (model) or use case.\n",
+        "\n",
+        "**For a more in-depth introduction to custom tests,** refer to our [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb) notebook.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Learn by doing</b></span>\n",
+        "<br></br>\n",
+        "Our course tailor-made for validators new to ValidMind combines this series of notebooks with a more in-depth introduction to the ValidMind Platform — <a href=\"https://docs.validmind.ai/training/validator-fundamentals/validator-fundamentals-register.html\" style=\"color: #DE257E;\"><b>Validator Fundamentals</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [Prerequisites](#toc1__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_1__)    \n",
+        "  - [Import the sample dataset](#toc2_2__)    \n",
+        "  - [Split the preprocessed dataset](#toc2_3__)    \n",
+        "  - [Import the champion model](#toc2_4__)    \n",
+        "  - [Train potential challenger model](#toc2_5__)    \n",
+        "  - [Initialize the ValidMind models](#toc2_6__)    \n",
+        "- [Implementing custom tests](#toc3__)    \n",
+        "  - [Implement a custom inline test](#toc3_1__)    \n",
+        "    - [Create a confusion matrix plot](#toc3_1_1__)    \n",
+        "    - [Add parameters to custom tests](#toc3_1_2__)    \n",
+        "    - [Pass parameters to custom tests](#toc3_1_3__)    \n",
+        "  - [Use external test providers](#toc3_2__)    \n",
+        "    - [Create custom tests folder](#toc3_2_1__)    \n",
+        "    - [Save an inline test](#toc3_2_2__)    \n",
+        "    - [Register a local test provider](#toc3_2_3__)    \n",
+        "- [Verify test runs](#toc4__)    \n",
+        "- [In summary](#toc5__)    \n",
+        "- [Next steps](#toc6__)    \n",
+        "  - [Work with your validation report](#toc6_1__)    \n",
+        "  - [Learn more](#toc6_2__)    \n",
+        "    - [Use cases](#toc6_2_1__)    \n",
+        "    - [Discover more learning resources](#toc6_2_2__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## Prerequisites\n",
+        "\n",
+        "In order to finalize validation and reporting, you'll need to first have:\n",
+        "\n",
+        "- [x] Registered a model within the ValidMind Platform and granted yourself access to the model as a validator\n",
+        "- [x] Installed the ValidMind Library in your local environment, allowing you to access all its features\n",
+        "- [x] Learned how to import and initialize datasets and models for use with ValidMind\n",
+        "- [x] Understood the basics of how to identify and run validation tests\n",
+        "- [x] Run validation tests for your champion and challengers, and logged the results of those tests to the ValidMind Platform\n",
+        "- [x] Inserted your logged test results into your validation report\n",
+        "- [x] Added some preliminary artifacts (findings) to your validation report\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Need help with the above steps?</b></span>\n",
+        "<br></br>\n",
+        "Refer to the first three notebooks in this series:\n",
+        "\n",
+        "- <a href=\"1-set_up_validmind_for_validation.ipynb\" style=\"color: #DE257E;\"><b>1 — Set up the ValidMind Library for validation</b></a>\n",
+        "- <a href=\"2-start_validation_process.ipynb\" style=\"color: #DE257E;\"><b>2 — Start the validation process</b></a>\n",
+        "- <a href=\"3-developing_potential_challenger.ipynb\" style=\"color: #DE257E;\"><b>3 — Developing a potential challenger</b></a>\n",
+        "\n",
+        "</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up\n",
+        "\n",
+        "This section should be very familiar to you now — as we performed the same actions in the previous two notebooks in this series."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library\n",
+        "\n",
+        "As usual, let's first connect up the ValidMind Library to our model we previously registered in the ValidMind Platform:\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Make sure the ValidMind Library is installed\n",
+        "\n",
+        "%pip install -q validmind\n",
+        "\n",
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"validation-report\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Import the sample dataset\n",
+        "\n",
+        "Next, we'll load in the same sample [Bank Customer Churn Prediction](https://www.kaggle.com/datasets/shantanudhakadd/bank-customer-churn-prediction) dataset used to develop the champion that we will independently preprocess:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Load the sample dataset\n",
+        "from validmind.datasets.classification import customer_churn as demo_dataset\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{demo_dataset.target_column}' \\n\\t• Class labels: {demo_dataset.class_labels}\"\n",
+        ")\n",
+        "\n",
+        "raw_df = demo_dataset.load_data()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the raw dataset for use in ValidMind tests\n",
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=raw_df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "raw_copy_df = raw_df.sample(frac=1)  # Create a copy of the raw dataset\n",
+        "\n",
+        "# Create a balanced dataset with the same number of exited and not exited customers\n",
+        "exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 1]\n",
+        "not_exited_df = raw_copy_df.loc[raw_copy_df[\"Exited\"] == 0].sample(n=exited_df.shape[0])\n",
+        "\n",
+        "balanced_raw_df = pd.concat([exited_df, not_exited_df])\n",
+        "balanced_raw_df = balanced_raw_df.sample(frac=1, random_state=42)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let’s also quickly remove highly correlated features from the dataset using the output from a ValidMind test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Register new data and now 'balanced_raw_dataset' is the new dataset object of interest\n",
+        "vm_balanced_raw_dataset = vm.init_dataset(\n",
+        "    dataset=balanced_raw_df,\n",
+        "    input_id=\"balanced_raw_dataset\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Run HighPearsonCorrelation test with our balanced dataset as input and return a result object\n",
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_balanced_raw_dataset},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# From result object, extract table from `corr_result.tables`\n",
+        "features_df = corr_result.tables[0].data\n",
+        "features_df"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract list of features that failed the test\n",
+        "high_correlation_features = features_df[features_df[\"Pass/Fail\"] == \"Fail\"][\"Columns\"].tolist()\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Extract feature names from the list of strings\n",
+        "high_correlation_features = [feature.split(\",\")[0].strip(\"()\") for feature in high_correlation_features]\n",
+        "high_correlation_features"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Remove the highly correlated features from the dataset\n",
+        "balanced_raw_no_age_df = balanced_raw_df.drop(columns=high_correlation_features)\n",
+        "\n",
+        "# Re-initialize the dataset object\n",
+        "vm_raw_dataset_preprocessed = vm.init_dataset(\n",
+        "    dataset=balanced_raw_no_age_df,\n",
+        "    input_id=\"raw_dataset_preprocessed\",\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Re-run the test with the reduced feature set\n",
+        "corr_result = vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    params={\"max_threshold\": 0.3},\n",
+        "    inputs={\"dataset\": vm_raw_dataset_preprocessed},\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Split the preprocessed dataset\n",
+        "\n",
+        "With our raw dataset rebalanced with highly correlated features removed, let's now **split our dataset into train and test** in preparation for model evaluation testing:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Encode categorical features in the dataset\n",
+        "balanced_raw_no_age_df = pd.get_dummies(\n",
+        "    balanced_raw_no_age_df, columns=[\"Geography\", \"Gender\"], drop_first=True\n",
+        ")\n",
+        "balanced_raw_no_age_df.head()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from sklearn.model_selection import train_test_split\n",
+        "\n",
+        "# Split the dataset into train and test\n",
+        "train_df, test_df = train_test_split(balanced_raw_no_age_df, test_size=0.20)\n",
+        "\n",
+        "X_train = train_df.drop(\"Exited\", axis=1)\n",
+        "y_train = train_df[\"Exited\"]\n",
+        "X_test = test_df.drop(\"Exited\", axis=1)\n",
+        "y_test = test_df[\"Exited\"]"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the split datasets\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_dataset_final\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_dataset_final\",\n",
+        "    dataset=test_df,\n",
+        "    target_column=\"Exited\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Import the champion model\n",
+        "\n",
+        "With our raw dataset assessed and preprocessed, let's go ahead and import the champion submitted by the development team in the format of a `.pkl` file: **[lr_model_champion.pkl](lr_model_champion.pkl)**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Import the champion model\n",
+        "import pickle as pkl\n",
+        "\n",
+        "with open(\"lr_model_champion.pkl\", \"rb\") as f:\n",
+        "    log_reg = pkl.load(f)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_5__'></a>\n",
+        "\n",
+        "### Train potential challenger model\n",
+        "\n",
+        "We'll also train our random forest classification challenger to see how it compares:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Import the Random Forest Classification model\n",
+        "from sklearn.ensemble import RandomForestClassifier\n",
+        "\n",
+        "# Create the model instance with 50 decision trees\n",
+        "rf_model = RandomForestClassifier(\n",
+        "    n_estimators=50,\n",
+        "    random_state=42,\n",
+        ")\n",
+        "\n",
+        "# Train the model\n",
+        "rf_model.fit(X_train, y_train)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_6__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind models\n",
+        "\n",
+        "In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our two models:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Initialize the champion logistic regression model\n",
+        "vm_log_model = vm.init_model(\n",
+        "    log_reg,\n",
+        "    input_id=\"log_model_champion\",\n",
+        ")\n",
+        "\n",
+        "# Initialize the challenger random forest classification model\n",
+        "vm_rf_model = vm.init_model(\n",
+        "    rf_model,\n",
+        "    input_id=\"rf_model\",\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Assign predictions to Champion — Logistic regression model\n",
+        "vm_train_ds.assign_predictions(model=vm_log_model)\n",
+        "vm_test_ds.assign_predictions(model=vm_log_model)\n",
+        "\n",
+        "# Assign predictions to Challenger — Random forest classification model\n",
+        "vm_train_ds.assign_predictions(model=vm_rf_model)\n",
+        "vm_test_ds.assign_predictions(model=vm_rf_model)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Implementing custom tests\n",
+        "\n",
+        "Thanks to the documentation (**Learn more:** [ValidMind for development](https://docs.validmind.ai/developer/validmind-library.html#development)), we know that the development team implemented a custom test to further evaluate the performance of the champion.\n",
+        "\n",
+        "In a usual validation situation, you would load a saved custom test provided by the development team. In the following section, we'll have you implement the same custom test and make it available for reuse, to familiarize you with the processes.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about custom tests?</b></span>\n",
+        "<br></br>\n",
+        "Refer to our in-depth introduction to custom tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/implement_custom_tests.html\" style=\"color: #DE257E;\"><b>Implement custom tests</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Implement a custom inline test\n",
+        "\n",
+        "Let's implement the same custom *inline test* that calculates the confusion matrix for a binary classification model that the development team used in their performance evaluations.\n",
+        "\n",
+        "- An inline test refers to a test written and executed within the same environment as the code being tested — in this case, right in this Jupyter Notebook — without requiring a separate test file or framework.\n",
+        "- You'll note that the custom test function is just a regular Python function that can include and require any Python library as you see fit."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_1__'></a>\n",
+        "\n",
+        "#### Create a confusion matrix plot\n",
+        "\n",
+        "Let's first create a confusion matrix plot using the `confusion_matrix` function from the `sklearn.metrics` module:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "import matplotlib.pyplot as plt\n",
+        "from sklearn import metrics\n",
+        "\n",
+        "# Get the predicted classes\n",
+        "y_pred = log_reg.predict(vm_test_ds.x)\n",
+        "\n",
+        "confusion_matrix = metrics.confusion_matrix(y_test, y_pred)\n",
+        "\n",
+        "cm_display = metrics.ConfusionMatrixDisplay(\n",
+        "    confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
+        ")\n",
+        "cm_display.plot()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Next, create a [`@vm.test` wrapper](https://docs.validmind.ai/validmind/validmind.html#test) that will allow you to create a reusable test. **Note the following changes in the code below:**\n",
+        "\n",
+        "- The function `confusion_matrix` takes two arguments, `dataset` and `model`. These are a `VMDataset` and a `VMModel` object, respectively.\n",
+        "  - `VMDataset` objects allow you to access the dataset's true (target) values by accessing the `.y` attribute.\n",
+        "  - `VMDataset` objects allow you to access the predictions for a given record (model) by calling the `.y_pred()` method.\n",
+        "- The function docstring provides a description of what the test does. This will be displayed along with the result in this notebook as well as in the ValidMind Platform.\n",
+        "- The function body calculates the confusion matrix using the `sklearn.metrics.confusion_matrix` function as we just did above.\n",
+        "- The function then returns the `ConfusionMatrixDisplay.figure_` object — this is important as the ValidMind Library expects the output of the custom test to be a plot or a table.\n",
+        "- The `@vm.test` decorator is doing the work of creating a wrapper around the function that will allow it to be run by the ValidMind Library. It also registers the test so it can be found by the ID `my_custom_tests.ConfusionMatrix`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
+        "def confusion_matrix(dataset, model):\n",
+        "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
+        "\n",
+        "    The confusion matrix is a 2x2 table that contains 4 values:\n",
+        "\n",
+        "    - True Positive (TP): the number of correct positive predictions\n",
+        "    - True Negative (TN): the number of correct negative predictions\n",
+        "    - False Positive (FP): the number of incorrect positive predictions\n",
+        "    - False Negative (FN): the number of incorrect negative predictions\n",
+        "\n",
+        "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
+        "    \"\"\"\n",
+        "    y_true = dataset.y\n",
+        "    y_pred = dataset.y_pred(model=model)\n",
+        "\n",
+        "    confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
+        "\n",
+        "    cm_display = metrics.ConfusionMatrixDisplay(\n",
+        "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
+        "    )\n",
+        "    cm_display.plot()\n",
+        "\n",
+        "    plt.close()  # close the plot to avoid displaying it\n",
+        "\n",
+        "    return cm_display.figure_  # return the figure object itself"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You can now run the newly created custom test on both the training and test datasets for both models using the [`run_test()` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Champion train and test\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_custom_tests.ConfusionMatrix:champion\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds,vm_test_ds],\n",
+        "        \"model\" : [vm_log_model]\n",
+        "    }\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Challenger train and test\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_custom_tests.ConfusionMatrix:challenger\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds,vm_test_ds],\n",
+        "        \"model\" : [vm_rf_model]\n",
+        "    }\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for some test IDs. </b></span>\n",
+        "<br></br>\n",
+        "That's expected, as when we run validation tests the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_2__'></a>\n",
+        "\n",
+        "#### Add parameters to custom tests\n",
+        "\n",
+        "Custom tests can take parameters just like any other function. To demonstrate, let's modify the `confusion_matrix` function to take an additional parameter `normalize` that will allow you to normalize the confusion matrix:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "@vm.test(\"my_custom_tests.ConfusionMatrix\")\n",
+        "def confusion_matrix(dataset, model, normalize=False):\n",
+        "    \"\"\"The confusion matrix is a table that is often used to describe the performance of a classification model on a set of data for which the true values are known.\n",
+        "\n",
+        "    The confusion matrix is a 2x2 table that contains 4 values:\n",
+        "\n",
+        "    - True Positive (TP): the number of correct positive predictions\n",
+        "    - True Negative (TN): the number of correct negative predictions\n",
+        "    - False Positive (FP): the number of incorrect positive predictions\n",
+        "    - False Negative (FN): the number of incorrect negative predictions\n",
+        "\n",
+        "    The confusion matrix can be used to assess the holistic performance of a classification model by showing the accuracy, precision, recall, and F1 score of the model on a single figure.\n",
+        "    \"\"\"\n",
+        "    y_true = dataset.y\n",
+        "    y_pred = dataset.y_pred(model=model)\n",
+        "\n",
+        "    if normalize:\n",
+        "        confusion_matrix = metrics.confusion_matrix(y_true, y_pred, normalize=\"all\")\n",
+        "    else:\n",
+        "        confusion_matrix = metrics.confusion_matrix(y_true, y_pred)\n",
+        "\n",
+        "    cm_display = metrics.ConfusionMatrixDisplay(\n",
+        "        confusion_matrix=confusion_matrix, display_labels=[False, True]\n",
+        "    )\n",
+        "    cm_display.plot()\n",
+        "\n",
+        "    plt.close()  # close the plot to avoid displaying it\n",
+        "\n",
+        "    return cm_display.figure_  # return the figure object itself"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_3__'></a>\n",
+        "\n",
+        "#### Pass parameters to custom tests\n",
+        "\n",
+        "You can pass parameters to custom tests by providing a dictionary of parameters to the `run_test()` function.\n",
+        "\n",
+        "- The parameters will override any default parameters set in the custom test definition. Note that `dataset` and `model` are still passed as `inputs`.\n",
+        "- Since these are `VMDataset` or `VMModel` inputs, they have a special meaning.\n",
+        "\n",
+        "Re-running and logging the custom confusion matrix with `normalize=True` for both models and our testing dataset looks like this:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Champion with test dataset and normalize=True\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_custom_tests.ConfusionMatrix:test_normalized_champion\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\" : [vm_log_model]\n",
+        "    },\n",
+        "    params={\"normalize\": True}\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Challenger with test dataset and normalize=True\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_custom_tests.ConfusionMatrix:test_normalized_challenger\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\" : [vm_rf_model]\n",
+        "    },\n",
+        "    params={\"normalize\": True}\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Use external test providers\n",
+        "\n",
+        "Sometimes you may want to reuse the same set of custom tests across multiple records (models) and share them with others in your organization, like the development team would have done with you in this example workflow featured in this series of notebooks. In this case, you can create an external custom *test provider* that will allow you to load custom tests from a local folder or a Git repository.\n",
+        "\n",
+        "In this section you will learn how to declare a local filesystem test provider that allows loading tests from a local folder following these high level steps:\n",
+        "\n",
+        "1. Create a folder of custom tests from existing inline tests (tests that exist in your active Jupyter Notebook)\n",
+        "2. Save an inline test to a file\n",
+        "3. Define and register a [`LocalTestProvider`](https://docs.validmind.ai/validmind/validmind/tests.html#LocalTestProvider) that points to that folder\n",
+        "4. Run test provider tests\n",
+        "5. Add the test results to your documentation"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_1__'></a>\n",
+        "\n",
+        "#### Create custom tests folder\n",
+        "\n",
+        "Let's start by creating a new folder that will contain reusable custom tests from your existing inline tests.\n",
+        "\n",
+        "The following code snippet will create a new `my_tests` directory in the current working directory if it doesn't exist:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "tests_folder = \"my_tests\"\n",
+        "\n",
+        "import os\n",
+        "\n",
+        "# create tests folder\n",
+        "os.makedirs(tests_folder, exist_ok=True)\n",
+        "\n",
+        "# remove existing tests\n",
+        "for f in os.listdir(tests_folder):\n",
+        "    # remove files and pycache\n",
+        "    if f.endswith(\".py\") or f == \"__pycache__\":\n",
+        "        os.system(f\"rm -rf {tests_folder}/{f}\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "After running the command above, confirm that a new `my_tests` directory was created successfully. For example:\n",
+        "\n",
+        "```\n",
+        "~/notebooks/tutorials/validation/my_tests/\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_2__'></a>\n",
+        "\n",
+        "#### Save an inline test\n",
+        "\n",
+        "The `@vm.test` decorator we used in **Implement a custom inline test** above to register one-off custom tests also includes a convenience method on the function object that allows you to simply call `<func_name>.save()` to save the test to a Python file at a specified path.\n",
+        "\n",
+        "While `save()` will get you started by creating the file and saving the function code with the correct name, it won't automatically include any imports, helper functions, or variables defined outside of the test function that are needed for the test to run. To solve this, pass in an optional `imports` argument to ensure the necessary imports are added to the file.\n",
+        "\n",
+        "The `confusion_matrix` test requires the following additional imports:\n",
+        "\n",
+        "```python\n",
+        "import matplotlib.pyplot as plt\n",
+        "from sklearn import metrics\n",
+        "```\n",
+        "\n",
+        "Let's pass these imports to the `save()` method to ensure they are included in the file with the following command:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "confusion_matrix.save(\n",
+        "    # Save it to the custom tests folder we created\n",
+        "    tests_folder,\n",
+        "    imports=[\"import matplotlib.pyplot as plt\", \"from sklearn import metrics\"],\n",
+        ")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "- [x] Confirm that the `save()` method saved the `confusion_matrix` function to a file named `ConfusionMatrix.py` in the `my_tests` folder.\n",
+        "- [x] Note that the new file provides some context on the origin of the test, which is useful for traceability:\n",
+        "\n",
+        "    ```\n",
+        "    # Saved from __main__.confusion_matrix\n",
+        "    # Original Test ID: my_custom_tests.ConfusionMatrix\n",
+        "    # New Test ID: <test_provider_namespace>.ConfusionMatrix\n",
+        "    ```\n",
+        "\n",
+        "- [x] Additionally, the new test function has been stripped of its decorator, as it now resides in a file that will be loaded by the test provider:\n",
+        "\n",
+        "    ```python\n",
+        "    def ConfusionMatrix(dataset, model, normalize=False):\n",
+        "    ```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_3__'></a>\n",
+        "\n",
+        "#### Register a local test provider\n",
+        "\n",
+        "Now that your `my_tests` folder has a sample custom test, let's initialize a test provider that will tell the ValidMind Library where to find your custom tests:\n",
+        "\n",
+        "- ValidMind offers out-of-the-box test providers for local tests (tests in a folder) or a GitHub provider for tests in a GitHub repository.\n",
+        "- You can also create your own test provider by creating a class that has a [`load_test` method](https://docs.validmind.ai/validmind/validmind/tests.html#load_test) that takes a test ID and returns the test function matching that ID.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about test providers?</b></span>\n",
+        "<br></br>\n",
+        "An extended introduction to test providers can be found in: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/integrate_external_test_providers.html\" style=\"color: #DE257E;\"><b>Integrate external test providers</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Initialize a local test provider\n",
+        "\n",
+        "For most use cases, using a `LocalTestProvider` that allows you to load custom tests from a designated directory should be sufficient.\n",
+        "\n",
+        "**The most important attribute for a test provider is its `namespace`.** This is a string that will be used to prefix test IDs in documentation. This allows you to have multiple test providers with tests that can even share the same ID, but are distinguished by their namespace.\n",
+        "\n",
+        "Let's go ahead and load the custom tests from our `my_tests` directory:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "from validmind.tests import LocalTestProvider\n",
+        "\n",
+        "# initialize the test provider with the tests folder we created earlier\n",
+        "my_test_provider = LocalTestProvider(tests_folder)\n",
+        "\n",
+        "vm.tests.register_test_provider(\n",
+        "    namespace=\"my_test_provider\",\n",
+        "    test_provider=my_test_provider,\n",
+        ")\n",
+        "# `my_test_provider.load_test()` will be called for any test ID that starts with `my_test_provider`\n",
+        "# e.g. `my_test_provider.ConfusionMatrix` will look for a function named `ConfusionMatrix` in `my_tests/ConfusionMatrix.py` file"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Run test provider tests\n",
+        "\n",
+        "Now that we've set up the test provider, we can run any test that's located in the tests folder by using the `run_test()` method as with any other test:\n",
+        "\n",
+        "- For tests that reside in a test provider directory, the test ID will be the `namespace` specified when registering the provider, followed by the path to the test file relative to the tests folder.\n",
+        "- For example, the Confusion Matrix test we created earlier will have the test ID `my_test_provider.ConfusionMatrix`. You could organize the tests in subfolders, say `classification` and `regression`, and the test ID for the Confusion Matrix test would then be `my_test_provider.classification.ConfusionMatrix`.\n",
+        "\n",
+        "Let's go ahead and re-run the confusion matrix test with our testing dataset for our two models by using the test ID `my_test_provider.ConfusionMatrix`. This should load the test from the test provider and run it as before."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Champion with test dataset and test provider custom test\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_test_provider.ConfusionMatrix:champion\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\" : [vm_log_model]\n",
+        "    }\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "# Challenger with test dataset and test provider custom test\n",
+        "vm.tests.run_test(\n",
+        "    test_id=\"my_test_provider.ConfusionMatrix:challenger\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\" : [vm_rf_model]\n",
+        "    }\n",
+        ").log()"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Verify test runs\n",
+        "\n",
+        "Our final task is to verify that all the tests provided by the development team were run and reported accurately. Note the appended `result_ids` to delineate which dataset we ran the test with for the relevant tests.\n",
+        "\n",
+        "Here, we'll specify all the tests we'd like to independently rerun in a dictionary called `test_config`. **Note here that `inputs` and `input_grid` expect the `input_id` of the dataset or model as the value rather than the variable name we specified**:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "test_config = {\n",
+        "    # Run with the raw dataset\n",
+        "    'validmind.data_validation.DatasetDescription:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.DescriptiveStatistics:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.MissingValues:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percentage_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.ClassImbalance:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percent_threshold': 10}\n",
+        "    },\n",
+        "    'validmind.data_validation.Duplicates:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.HighCardinality:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {\n",
+        "            'num_threshold': 100,\n",
+        "            'percent_threshold': 0.1,\n",
+        "            'threshold_type': 'percent'\n",
+        "        }\n",
+        "    },\n",
+        "    'validmind.data_validation.Skewness:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'max_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.UniqueRows:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percent_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TooManyZeroValues:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'max_percent_threshold': 0.03}\n",
+        "    },\n",
+        "    'validmind.data_validation.IQROutliersTable:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'threshold': 5}\n",
+        "    },\n",
+        "    # Run with the preprocessed dataset\n",
+        "    'validmind.data_validation.DescriptiveStatistics:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularDescriptionTables:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
+        "    },\n",
+        "    'validmind.data_validation.MissingValues:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'},\n",
+        "        'params': {'min_percentage_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularNumericalHistograms:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularCategoricalBarPlots:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TargetRateBarPlots:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset_preprocessed'},\n",
+        "        'params': {'default_column': 'loan_status'}\n",
+        "    },\n",
+        "    # Run with the training and test datasets\n",
+        "    'validmind.data_validation.DescriptiveStatistics:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularDescriptionTables:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
+        "    },\n",
+        "    'validmind.data_validation.ClassImbalance:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
+        "        'params': {'min_percent_threshold': 10}\n",
+        "    },\n",
+        "    'validmind.data_validation.UniqueRows:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
+        "        'params': {'min_percent_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularNumericalHistograms:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
+        "    },\n",
+        "    'validmind.data_validation.MutualInformation:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
+        "        'params': {'min_threshold': 0.01}\n",
+        "    },\n",
+        "    'validmind.data_validation.PearsonCorrelationMatrix:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']}\n",
+        "    },\n",
+        "    'validmind.data_validation.HighPearsonCorrelation:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final']},\n",
+        "        'params': {'max_threshold': 0.3, 'top_n_correlations': 10}\n",
+        "    },\n",
+        "    'validmind.model_validation.ModelMetadata': {\n",
+        "        'input_grid': {'model': ['log_model_champion', 'rf_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ModelParameters': {\n",
+        "        'input_grid': {'model': ['log_model_champion', 'rf_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ROCCurve': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final'], 'model': ['log_model_champion']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.MinimumROCAUCScore': {\n",
+        "        'input_grid': {'dataset': ['train_dataset_final', 'test_dataset_final'], 'model': ['log_model_champion']},\n",
+        "        'params': {'min_threshold': 0.5}\n",
+        "    }\n",
+        "}"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Then batch run and log our tests in `test_config`:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "execution_count": null,
+      "metadata": {},
+      "outputs": [],
+      "source": [
+        "for t in test_config:\n",
+        "    print(t)\n",
+        "    try:\n",
+        "        # Check if test has input_grid\n",
+        "        if 'input_grid' in test_config[t]:\n",
+        "            # For tests with input_grid, pass the input_grid configuration\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
+        "        else:\n",
+        "            # Original logic for regular inputs\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
+        "    except Exception as e:\n",
+        "        print(f\"Error running test {t}: {str(e)}\")"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## In summary\n",
+        "\n",
+        "In this final notebook, you learned how to:\n",
+        "\n",
+        "- [x] Implement a custom inline test\n",
+        "- [x] Run and log your custom inline tests\n",
+        "- [x] Use external custom test providers\n",
+        "- [x] Run and log tests from your custom test providers\n",
+        "- [x] Re-run tests provided by your development team to verify that they were run and reported accurately\n",
+        "\n",
+        "With our ValidMind for validation series of notebooks, you learned how to validate a record (model) end-to-end with the ValidMind Library by running through some common scenarios in a typical validation setting:\n",
+        "\n",
+        "- Verifying the data quality steps performed by the development team\n",
+        "- Independently replicating the champion's results and conducting additional tests to assess performance, stability, and robustness\n",
+        "- Setting up test inputs and a challenger for comparative analysis\n",
+        "- Running validation tests, analyzing results, and logging artifacts to ValidMind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Next steps"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Work with your validation report\n",
+        "\n",
+        "Now that you've logged all your test results and verified the work done by the development team, head to the ValidMind Platform to wrap up your validation report. Continue to work on your validation report by:\n",
+        "\n",
+        "- **Inserting additional test results:** Click **Link Evidence** under any Evidence panel of 2. Validation in your validation report. (Learn more: [Link evidence to reports](https://docs.validmind.ai/guide/validation/assess-compliance.html#link-evidence-to-reports))\n",
+        "\n",
+        "- **Making qualitative edits to your test descriptions:** Expand any linked evidence under Validator Evidence and click **See evidence details** to review and edit the ValidMind-generated test descriptions for quality and accuracy. (Learn more: [Preparing validation reports](https://docs.validmind.ai/guide/validation/preparing-validation-reports.html#validation-overview))\n",
+        "\n",
+        "- **Adding more findings:** Click **Link Finding to Report** in any validation report section, then click **+ Create New Finding**. (Learn more: [Add and manage artifacts](https://docs.validmind.ai/guide/validation/add-manage-artifacts.html))\n",
+        "\n",
+        "- **Adding risk assessment notes:** Click under **Risk Assessment Notes** in any validation report section to access the text editor and content editing toolbar, including an option to generate a draft with AI. Once generated, edit your ValidMind-generated test descriptions to adhere to your organization's requirements. (Learn more: [Work with content blocks](https://docs.validmind.ai/guide/documentation/work-with-content-blocks.html#content-editing-toolbar))\n",
+        "\n",
+        "- **Assessing compliance:** Under the Guideline for any validation report section, click **ASSESSMENT** and select the compliance status from the drop-down menu. (Learn more: [Assign compliance assessments](https://docs.validmind.ai/guide/validation/assess-compliance.html#assign-compliance-assessments))\n",
+        "\n",
+        "- **Collaborating with other stakeholders:** Use the ValidMind Platform's real-time collaborative features to work seamlessly together with the rest of your organization, including developers. Propose suggested changes in the documentation, work with versioned history, and use comments to discuss specific portions of the documentation. (Learn more: [Collaborate with others](https://docs.validmind.ai/guide/documentation/collaborate-with-others.html))\n",
+        "\n",
+        "When your validation report is complete and ready for review, submit it for approval from the same ValidMind Platform where you made your edits and collaborated with the rest of your organization, ensuring transparency and a thorough validation history. (Learn more: [Submit documents](https://docs.validmind.ai/guide/documentation/submit-documents.html))"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Learn more\n",
+        "\n",
+        "Now that you're familiar with the basics, you can explore the following notebooks to get a deeper understanding of how the ValidMind Library assists you in streamlining validation:"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2_1__'></a>\n",
+        "\n",
+        "#### Use cases\n",
+        "\n",
+        "- [Validate an application scorecard model](../../use_cases/validation/validate_application_scorecard.ipynb)"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2_2__'></a>\n",
+        "\n",
+        "#### Discover more learning resources\n",
+        "\n",
+        "Learn more about the ValidMind Library tools we used in this notebook:\n",
+        "\n",
+        "- [Explore tests](../../how_to/tests/explore_tests/explore_tests.ipynb)\n",
+        "- [Run dataset-based tests](../../how_to/tests/run_tests/1-run_dataset-based_tests.ipynb)\n",
+        "- [Implement custom tests](../../how_to/tests/custom_tests/implement_custom_tests.ipynb)\n",
+        "- [Integrate external test providers](../../how_to/tests/custom_tests/integrate_external_test_providers.ipynb)\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "id": "copyright-0f5cad51d1144e528b343ccbd8f66d06",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ]
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
+}
diff --git a/site/notebooks/tutorials/model_validation/class-imbalance-results-detail.png b/site/notebooks/tutorials/validation/class-imbalance-results-detail.png
similarity index 100%
rename from site/notebooks/tutorials/model_validation/class-imbalance-results-detail.png
rename to site/notebooks/tutorials/validation/class-imbalance-results-detail.png
diff --git a/site/notebooks/tutorials/model_validation/compliance-summary.png b/site/notebooks/tutorials/validation/compliance-summary.png
similarity index 100%
rename from site/notebooks/tutorials/model_validation/compliance-summary.png
rename to site/notebooks/tutorials/validation/compliance-summary.png
diff --git a/site/notebooks/tutorials/model_validation/inserted-minimum-f1-scores.png b/site/notebooks/tutorials/validation/inserted-minimum-f1-scores.png
similarity index 100%
rename from site/notebooks/tutorials/model_validation/inserted-minimum-f1-scores.png
rename to site/notebooks/tutorials/validation/inserted-minimum-f1-scores.png
diff --git a/site/notebooks/tutorials/model_validation/lr_model_champion.pkl b/site/notebooks/tutorials/validation/lr_model_champion.pkl
similarity index 100%
rename from site/notebooks/tutorials/model_validation/lr_model_champion.pkl
rename to site/notebooks/tutorials/validation/lr_model_champion.pkl
diff --git a/site/notebooks/tutorials/model_validation/selecting-class-imbalance-results.png b/site/notebooks/tutorials/validation/selecting-class-imbalance-results.png
similarity index 100%
rename from site/notebooks/tutorials/model_validation/selecting-class-imbalance-results.png
rename to site/notebooks/tutorials/validation/selecting-class-imbalance-results.png
diff --git a/site/notebooks/tutorials/model_validation/selecting-minimum-f1-scores.png b/site/notebooks/tutorials/validation/selecting-minimum-f1-scores.png
similarity index 100%
rename from site/notebooks/tutorials/model_validation/selecting-minimum-f1-scores.png
rename to site/notebooks/tutorials/validation/selecting-minimum-f1-scores.png
diff --git a/site/notebooks/use_cases/agents/document_agentic_ai.ipynb b/site/notebooks/use_cases/agents/document_agentic_ai.ipynb
index 2516a13bd2..621fe8b171 100644
--- a/site/notebooks/use_cases/agents/document_agentic_ai.ipynb
+++ b/site/notebooks/use_cases/agents/document_agentic_ai.ipynb
@@ -1,2187 +1,2194 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "eee6b64c",
-   "metadata": {},
-   "source": [
-    "# Document an agentic AI system\n",
-    "\n",
-    "Build and document an agentic AI system with the ValidMind Library. Construct a LangGraph-based banking agent, assign AI evaluation metric scores to your agent, and run accuracy, RAGAS, and safety tests, then log those test results to the ValidMind Platform.\n",
-    "\n",
-    "An _AI agent_ is an autonomous system that interprets inputs, selects from available tools or actions, and executes multi-step behaviors to achieve defined goals. In this notebook, the agent acts as a banking assistant that analyzes user requests and automatically selects and invokes the appropriate specialized banking tool to deliver accurate, compliant, and actionable responses.\n",
-    "\n",
-    "- This agent enables financial institutions to automate complex banking workflows where different customer requests require different specialized tools and knowledge bases.\n",
-    "- Effective validation of agentic AI systems reduces the risks of agents misinterpreting inputs, failing to extract required parameters, or producing incorrect assessments or actions — such as selecting the wrong tool.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For the LLM components in this notebook to function properly, you'll need access to OpenAI.</b></span>\n",
-    "<br></br>\n",
-    "Before you continue, ensure that a valid <code>OPENAI_API_KEY</code> is set in your <code>.env</code> file.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "30927b2b",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "    - [Preview the documentation template](#toc2_2_4__)    \n",
-    "  - [Verify OpenAI API access](#toc2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_4__)    \n",
-    "- [Building the LangGraph agent](#toc3__)    \n",
-    "  - [Test available banking tools](#toc3_1__)    \n",
-    "  - [Create LangGraph banking agent](#toc3_2__)    \n",
-    "    - [Define system prompt](#toc3_2_1__)    \n",
-    "    - [Initialize the LLM](#toc3_2_2__)    \n",
-    "    - [Define agent state structure](#toc3_2_3__)    \n",
-    "    - [Create agent workflow function](#toc3_2_4__)    \n",
-    "    - [Instantiate the banking agent](#toc3_2_5__)    \n",
-    "  - [Integrate agent with ValidMind](#toc3_3__)    \n",
-    "    - [Import ValidMind components](#toc3_3_1__)    \n",
-    "    - [Create agent wrapper function](#toc3_3_2__)    \n",
-    "    - [Initialize the ValidMind model object](#toc3_3_3__)    \n",
-    "    - [Store the agent reference](#toc3_3_4__)    \n",
-    "    - [Verify integration](#toc3_3_5__)    \n",
-    "  - [Validate the system prompt](#toc3_4__)    \n",
-    "- [Initializing the ValidMind dataset](#toc4__)    \n",
-    "  - [Assign predictions](#toc4_1__)    \n",
-    "- [Running accuracy tests](#toc5__)    \n",
-    "  - [Response accuracy test](#toc5_1__)    \n",
-    "  - [Tool selection accuracy test](#toc5_2__)    \n",
-    "- [Assigning AI evaluation metric scores](#toc6__)    \n",
-    "  - [Identify relevant DeepEval scorers](#toc6_1__)    \n",
-    "  - [Assign reasoning scores](#toc6_2__)    \n",
-    "    - [Plan quality score](#toc6_2_1__)    \n",
-    "    - [Plan adherence score](#toc6_2_2__)    \n",
-    "  - [Assign action scores](#toc6_3__)    \n",
-    "    - [Tool correctness score](#toc6_3_1__)    \n",
-    "    - [Argument correctness score](#toc6_3_2__)    \n",
-    "  - [Assign execution score](#toc6_4__)    \n",
-    "    - [Task completion score](#toc6_4_1__)    \n",
-    "- [Running RAGAS tests](#toc7__)    \n",
-    "  - [Identify relevant RAGAS tests](#toc7_1__)    \n",
-    "    - [Faithfulness](#toc7_1_1__)    \n",
-    "    - [Response Relevancy](#toc7_1_2__)    \n",
-    "    - [Context Recall](#toc7_1_3__)    \n",
-    "- [Running safety tests](#toc8__)    \n",
-    "    - [AspectCritic](#toc8_1_1__)    \n",
-    "    - [Bias](#toc8_1_2__)    \n",
-    "- [Next steps](#toc9__)    \n",
-    "  - [Work with your model documentation](#toc9_1__)    \n",
-    "  - [Customize the banking agent for your use case](#toc9_2__)    \n",
-    "  - [Discover more learning resources](#toc9_3__)    \n",
-    "- [Upgrade ValidMind](#toc10__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b58139db",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models. \n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7e30d36b",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1cba586e",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5c46f003",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "11a2d7a5",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "fbab0edf",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.9 <= x <= 3.14</div>\n",
-    "\n",
-    "Let's begin by installing the ValidMind Library with large language model (LLM) support:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "1982a118",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q \"validmind[llm]\" \"langgraph==0.3.21\""
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "14578e26",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "83d47d89",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook.\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "bb2c5670",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Agentic AI`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "98e475c1",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Can't select this template?</b></span>\n",
-    "<br></br>\n",
-    "Your organization administrators may need to add it to your template library:\n",
-    "<ul>\n",
-    "<li><a href=\"agentic_ai_template.yaml\" style=\"color: #DE257E;\"><b>Download Template YAML</b></a></li>\n",
-    "<li><a href=\"https://docs.validmind.ai/guide/templates/customize-document-templates.html\" style=\"color: #DE257E;\"><b>Customize Document Templates</b></a></li>\n",
-    "</ul>\n",
-    "</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0d1a13ca",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d6ccbefc",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3605df4f",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_4__'></a>\n",
-    "\n",
-    "#### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "dffdaa6f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d467c1d2",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Verify OpenAI API access\n",
-    "\n",
-    "Verify that a valid `OPENAI_API_KEY` is set in your `.env` file:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "22cc39cb",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load environment variables if using .env file\n",
-    "try:\n",
-    "    from dotenv import load_dotenv\n",
-    "    load_dotenv()\n",
-    "except ImportError:\n",
-    "    print(\"dotenv not installed. Make sure OPENAI_API_KEY is set in your environment.\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b56c3f39",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Let's import all the necessary libraries to prepare for building our banking LangGraph agentic system:\n",
-    "\n",
-    "- **Standard libraries** for data handling and environment management.\n",
-    "- **pandas**, a Python library for data manipulation and analytics, imported under the alias `pd`. We'll also configure pandas to show all columns and all rows at full width for easier debugging and inspection.\n",
-    "- **LangChain** components for LLM integration and tool management.\n",
-    "- **LangGraph** for building stateful, multi-step agent workflows.\n",
-    "- **Banking tools** for specialized financial services as defined in [banking_tools.py](banking_tools.py)."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "2058d1ac",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from typing import TypedDict, Annotated, Sequence\n",
-    "\n",
-    "from langchain_core.messages import BaseMessage, HumanMessage, SystemMessage\n",
-    "from langchain_openai import ChatOpenAI\n",
-    "from langgraph.checkpoint.memory import MemorySaver\n",
-    "from langgraph.graph import StateGraph, END, START\n",
-    "from langgraph.graph.message import add_messages\n",
-    "from langgraph.prebuilt import ToolNode\n",
-    "\n",
-    "# LOCAL IMPORTS FROM banking_tools.py\n",
-    "from banking_tools import AVAILABLE_TOOLS\n",
-    "\n",
-    "import pandas as pd\n",
-    "# Configure pandas to show all columns and all rows at full width\n",
-    "pd.set_option('display.max_columns', None)\n",
-    "pd.set_option('display.max_colwidth', None)\n",
-    "pd.set_option('display.width', None)\n",
-    "pd.set_option('display.max_rows', None)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "cc1d3265",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Building the LangGraph agent"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a3c421c4",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Test available banking tools\n",
-    "\n",
-    "We'll use the demo banking tools defined in `banking_tools.py`, which cover common financial services use cases:\n",
-    "\n",
-    "- **Credit Risk Analyzer** - Loan applications and credit decisions\n",
-    "- **Customer Account Manager** - Account services and customer support\n",
-    "- **Fraud Detection System** - Security and fraud prevention"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "1e0a120c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(f\"Available tools: {len(AVAILABLE_TOOLS)}\")\n",
-    "print(\"\\nTool Details:\")\n",
-    "for i, tool in enumerate(AVAILABLE_TOOLS, 1):\n",
-    "    print(f\"   - {tool.name}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "53906630",
-   "metadata": {},
-   "source": [
-    "Let's test each banking tool individually to ensure they're working correctly before integrating them into our agent:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "dc0caff2",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Test 1: Credit Risk Analyzer\n",
-    "print(\"TEST 1: Credit Risk Analyzer\")\n",
-    "print(\"-\" * 40)\n",
-    "try:\n",
-    "    # Access the underlying function using .func\n",
-    "    credit_result = AVAILABLE_TOOLS[0].func(\n",
-    "        customer_income=75000,\n",
-    "        customer_debt=1200,\n",
-    "        credit_score=720,\n",
-    "        loan_amount=50000,\n",
-    "        loan_type=\"personal\"\n",
-    "    )\n",
-    "    print(credit_result)\n",
-    "    print(\"Credit Risk Analyzer test PASSED\")\n",
-    "except Exception as e:\n",
-    "    print(f\"Credit Risk Analyzer test FAILED: {e}\")\n",
-    "\n",
-    "print(\"\" + \"=\" * 60)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b6b227db",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "# Test 2: Customer Account Manager\n",
-    "print(\"TEST 2: Customer Account Manager\")\n",
-    "print(\"-\" * 40)\n",
-    "try:\n",
-    "    # Test checking balance\n",
-    "    account_result = AVAILABLE_TOOLS[1].func(\n",
-    "        account_type=\"checking\",\n",
-    "        customer_id=\"12345\",\n",
-    "        action=\"check_balance\"\n",
-    "    )\n",
-    "    print(account_result)\n",
-    "\n",
-    "    # Test getting account info\n",
-    "    info_result = AVAILABLE_TOOLS[1].func(\n",
-    "        account_type=\"all\",\n",
-    "        customer_id=\"12345\", \n",
-    "        action=\"get_info\"\n",
-    "    )\n",
-    "    print(info_result)\n",
-    "    print(\"Customer Account Manager test PASSED\")\n",
-    "except Exception as e:\n",
-    "    print(f\"Customer Account Manager test FAILED: {e}\")\n",
-    "\n",
-    "print(\"\" + \"=\" * 60)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "a983b30d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "# Test 3: Fraud Detection System\n",
-    "print(\"TEST 3: Fraud Detection System\")\n",
-    "print(\"-\" * 40)\n",
-    "try:\n",
-    "    fraud_result = AVAILABLE_TOOLS[2].func(\n",
-    "        transaction_id=\"TX123\",\n",
-    "        customer_id=\"12345\",\n",
-    "        transaction_amount=500.00,\n",
-    "        transaction_type=\"withdrawal\",\n",
-    "        location=\"Miami, FL\",\n",
-    "        device_id=\"DEVICE_001\"\n",
-    "    )\n",
-    "    print(fraud_result)\n",
-    "    print(\"Fraud Detection System test PASSED\")\n",
-    "except Exception as e:\n",
-    "    print(f\"Fraud Detection System test FAILED: {e}\")\n",
-    "\n",
-    "print(\"\" + \"=\" * 60)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1424baed",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Create LangGraph banking agent\n",
-    "\n",
-    "With our tools ready to go, we'll create our intelligent banking agent with LangGraph that automatically selects and uses the appropriate banking tool based on a user request."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3469d656",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_1__'></a>\n",
-    "\n",
-    "#### Define system prompt\n",
-    "\n",
-    "We'll begin by defining our system prompt, which provides the LLM with context about its role as a banking assistant and guidance on when to use each available tool:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "7971c427",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "# Enhanced banking system prompt with tool selection guidance\n",
-    "system_context = \"\"\"You are a professional banking AI assistant with access to specialized banking tools.\n",
-    "            Analyze the user's banking request and directly use the most appropriate tools to help them.\n",
-    "            \n",
-    "            AVAILABLE BANKING TOOLS:\n",
-    "            \n",
-    "            credit_risk_analyzer - Analyze credit risk for loan applications and credit decisions\n",
-    "            - Use for: loan applications, credit assessments, risk analysis, mortgage eligibility\n",
-    "            - Examples: \"Analyze credit risk for $50k personal loan\", \"Assess mortgage eligibility for $300k home purchase\"\n",
-    "            - Parameters: customer_income, customer_debt, credit_score, loan_amount, loan_type\n",
-    "\n",
-    "            customer_account_manager - Manage customer accounts and provide banking services\n",
-    "            - Use for: account information, transaction processing, product recommendations, customer service\n",
-    "            - Examples: \"Check balance for checking account 12345\", \"Recommend products for customer with high balance\"\n",
-    "            - Parameters: account_type, customer_id, action, amount, account_details\n",
-    "\n",
-    "            fraud_detection_system - Analyze transactions for potential fraud and security risks\n",
-    "            - Use for: transaction monitoring, fraud prevention, risk assessment, security alerts\n",
-    "            - Examples: \"Analyze fraud risk for $500 ATM withdrawal in Miami\", \"Check security for $2000 online purchase\"\n",
-    "            - Parameters: transaction_id, customer_id, transaction_amount, transaction_type, location, device_id\n",
-    "\n",
-    "            BANKING INSTRUCTIONS:\n",
-    "            - Analyze the user's banking request carefully and identify the primary need\n",
-    "            - If they need credit analysis → use credit_risk_analyzer\n",
-    "            - If they need financial calculations → use financial_calculator\n",
-    "            - If they need account services → use customer_account_manager\n",
-    "            - If they need security analysis → use fraud_detection_system\n",
-    "            - Extract relevant parameters from the user's request\n",
-    "            - Provide helpful, accurate banking responses based on tool outputs\n",
-    "            - Always consider banking regulations, risk management, and best practices\n",
-    "            - Be professional and thorough in your analysis\n",
-    "\n",
-    "            Choose and use tools wisely to provide the most helpful banking assistance.\n",
-    "            Describe the response in user friendly manner with details describing the tool output. \n",
-    "            Provide the response in at least 500 words.\n",
-    "            Generate a concise execution plan for the banking request.\n",
-    "        \"\"\""
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b66c1ac4",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_2__'></a>\n",
-    "\n",
-    "#### Initialize the LLM\n",
-    "\n",
-    "Let's initialize the LLM that will power our banking agent:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "866066e7",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the main LLM for banking responses\n",
-    "main_llm = ChatOpenAI(\n",
-    "    model=\"gpt-5-mini\",\n",
-    "    reasoning={\n",
-    "        \"effort\": \"low\",\n",
-    "        \"summary\": \"auto\"\n",
-    "    }\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8220afd6",
-   "metadata": {},
-   "source": [
-    "Then bind the available banking tools to the LLM, enabling the model to automatically recognize and invoke each tool when appropriate based on request input and the system prompt we defined above:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "906d8132",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Bind all banking tools to the main LLM\n",
-    "llm_with_tools = main_llm.bind_tools(AVAILABLE_TOOLS)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "43f56651",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_3__'></a>\n",
-    "\n",
-    "#### Define agent state structure\n",
-    "\n",
-    "The agent state defines the data structure that flows through the LangGraph workflow. It includes:\n",
-    "\n",
-    "- **messages** — The conversation history between the user and agent\n",
-    "- **user_input** — The current user request\n",
-    "- **session_id** — A unique identifier for the conversation session\n",
-    "- **context** — Additional context that can be passed between nodes\n",
-    "\n",
-    "Defining this state structure keeps the data consistent throughout the agent's execution and allows for multi-turn conversations with memory:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "6b926ddf",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Banking Agent State Definition\n",
-    "class BankingAgentState(TypedDict):\n",
-    "    messages: Annotated[Sequence[BaseMessage], add_messages]\n",
-    "    user_input: str\n",
-    "    session_id: str\n",
-    "    context: dict"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "387ba780",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_4__'></a>\n",
-    "\n",
-    "#### Create agent workflow function\n",
-    "\n",
-    "We'll build the LangGraph agent workflow with two main components:\n",
-    "\n",
-    "1. **LLM node** — Processes user requests, applies the system prompt, and decides whether to use tools.\n",
-    "2. **Tools node** — Executes the selected banking tools when the LLM determines they're needed.\n",
-    "\n",
-    "The workflow begins with the LLM analyzing the request. If tools are needed, the tools node runs them and control returns to the LLM to generate the final response; otherwise, the workflow ends."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "2c9bf585",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def create_banking_langgraph_agent():\n",
-    "    \"\"\"Create a comprehensive LangGraph banking agent with intelligent tool selection.\"\"\"\n",
-    "    def llm_node(state: BankingAgentState) -> BankingAgentState:\n",
-    "        \"\"\"Main LLM node that processes banking requests and selects appropriate tools.\"\"\"\n",
-    "        messages = state[\"messages\"]\n",
-    "        # Add system context to messages\n",
-    "        enhanced_messages = [SystemMessage(content=system_context)] + list(messages)\n",
-    "        # Get LLM response with tool selection\n",
-    "        response = llm_with_tools.invoke(enhanced_messages)\n",
-    "        return {\n",
-    "            **state,\n",
-    "            \"messages\": messages + [response]\n",
-    "        }\n",
-    "    \n",
-    "    def should_continue(state: BankingAgentState) -> str:\n",
-    "        \"\"\"Decide whether to use tools or end the conversation.\"\"\"\n",
-    "        last_message = state[\"messages\"][-1]\n",
-    "        # Check if the LLM wants to use tools\n",
-    "        if hasattr(last_message, 'tool_calls') and last_message.tool_calls:\n",
-    "            return \"tools\"\n",
-    "        return END\n",
-    "        \n",
-    "    # Create the banking state graph\n",
-    "    workflow = StateGraph(BankingAgentState)\n",
-    "    # Add nodes\n",
-    "    workflow.add_node(\"llm\", llm_node)\n",
-    "    workflow.add_node(\"tools\", ToolNode(AVAILABLE_TOOLS))\n",
-    "    # Simplified entry point - go directly to LLM\n",
-    "    workflow.add_edge(START, \"llm\")\n",
-    "    # From LLM, decide whether to use tools or end\n",
-    "    workflow.add_conditional_edges(\n",
-    "        \"llm\",\n",
-    "        should_continue,\n",
-    "        {\"tools\": \"tools\", END: END}\n",
-    "    )\n",
-    "    # Tool execution flows back to LLM for final response\n",
-    "    workflow.add_edge(\"tools\", \"llm\")\n",
-    "    # Set up memory\n",
-    "    memory = MemorySaver()\n",
-    "    # Compile the graph\n",
-    "    agent = workflow.compile(checkpointer=memory)\n",
-    "    return agent"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "765242e9",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_5__'></a>\n",
-    "\n",
-    "#### Instantiate the banking agent\n",
-    "\n",
-    "Now, we'll create an instance of the banking agent by calling the workflow creation function.\n",
-    "\n",
-    "This compiled agent is ready to process banking requests and will automatically select and use the appropriate tools based on user queries:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "455b8ee4",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Create the banking intelligent agent\n",
-    "banking_agent = create_banking_langgraph_agent()\n",
-    "\n",
-    "print(\"Banking LangGraph Agent Created Successfully!\")\n",
-    "print(\"\\nFeatures:\")\n",
-    "print(\"   - Intelligent banking tool selection\")\n",
-    "print(\"   - Comprehensive banking system prompt\")\n",
-    "print(\"   - Streamlined workflow: LLM → Tools → Response\")\n",
-    "print(\"   - Automatic tool parameter extraction\")\n",
-    "print(\"   - Professional banking assistance\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e00dac77",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3__'></a>\n",
-    "\n",
-    "### Integrate agent with ValidMind\n",
-    "\n",
-    "To integrate our LangGraph banking agent with ValidMind, we need to create a wrapper function that ValidMind can use to invoke the agent and extract the necessary information for testing and documentation, allowing ValidMind to run validation tests on the agent's behavior, tool usage, and responses."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a124857e",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3_1__'></a>\n",
-    "\n",
-    "#### Import ValidMind components\n",
-    "\n",
-    "We'll start with importing the necessary ValidMind components for integrating our agent:\n",
-    "\n",
-    "- `Prompt` from `validmind.models` for handling prompt-based model inputs\n",
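-    "- `extract_tool_calls_from_agent_output` and `_convert_to_tool_call_list` from `validmind.scorers.llm.deepeval` for extracting and converting tool calls from agent outputs\n",
-    "- `observe` and `update_current_span` from `deepeval.tracing`, and `LLMTestCase` from `deepeval.test_case`, for passing trace data to DeepEval metrics that require tracing"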
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "9aeb8969",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.models import Prompt\n",
-    "from validmind.scorers.llm.deepeval import extract_tool_calls_from_agent_output, _convert_to_tool_call_list\n",
-    "from deepeval.tracing import observe, update_current_span\n",
-    "from deepeval.test_case import LLMTestCase"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ed72903f",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3_2__'></a>\n",
-    "\n",
-    "#### Create agent wrapper function\n",
-    "\n",
-    "We'll then create a wrapper function that:\n",
-    "\n",
-    "- Accepts input in ValidMind's expected format (with `input` and `session_id` fields)\n",
-    "- Invokes the banking agent with the proper state initialization\n",
-    "- Captures tool outputs and tool calls for evaluation\n",
-    "- Returns a standardized response format that includes the prediction, full output, tool messages, and tool call information\n",
-    "- Handles errors gracefully with fallback responses"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0e4d5a82",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@observe(type=\"agent\")\n",
-    "def banking_agent_fn(input):\n",
-    "    \"\"\"\n",
-    "    Invoke the banking agent with the given input.\n",
-    "    \"\"\"\n",
-    "    try:\n",
-    "        # Initial state for banking agent\n",
-    "        initial_state = {\n",
-    "            \"user_input\": input[\"input\"],\n",
-    "            \"messages\": [HumanMessage(content=input[\"input\"])],\n",
-    "            \"session_id\": input[\"session_id\"],\n",
-    "            \"context\": {}\n",
-    "        }\n",
-    "        session_config = {\"configurable\": {\"thread_id\": input[\"session_id\"]}}\n",
-    "        result = banking_agent.invoke(initial_state, config=session_config)\n",
-    "\n",
-    "        from utils import capture_tool_output_messages\n",
-    "\n",
-    "        # Capture all tool outputs and metadata\n",
-    "        captured_data = capture_tool_output_messages(result)\n",
-    "    \n",
-    "        # Access specific tool outputs, this will be used for RAGAS tests\n",
-    "        tool_message = \"\"\n",
-    "        for output in captured_data[\"tool_outputs\"]:\n",
-    "            tool_message += output['content']\n",
-    "        \n",
-    "        tool_calls_found = []\n",
-    "        messages = result['messages']\n",
-    "        for message in messages:\n",
-    "            if hasattr(message, 'tool_calls') and message.tool_calls:\n",
-    "                for tool_call in message.tool_calls:\n",
-    "                    # Handle both dictionary and object formats\n",
-    "                    if isinstance(tool_call, dict):\n",
-    "                        tool_calls_found.append(tool_call['name'])\n",
-    "                    else:\n",
-    "                        # ToolCall object - use attribute access\n",
-    "                        tool_calls_found.append(tool_call.name)\n",
-    "\n",
-    "        prediction_text = result['messages'][-1].content[0]['text']\n",
-    "        tools_called_value = _convert_to_tool_call_list(extract_tool_calls_from_agent_output(result))\n",
-    "        expected_tools_value = _convert_to_tool_call_list(input.get(\"expected_tools\", []))\n",
-    "\n",
-    "        # Feed trace data for DeepEval metrics (e.g. PlanQuality) that require tracing\n",
-    "        update_current_span(\n",
-    "            test_case=LLMTestCase(\n",
-    "                input=input[\"input\"],\n",
-    "                actual_output=prediction_text,\n",
-    "                tools_called=tools_called_value,\n",
-    "                expected_tools=expected_tools_value\n",
-    "            )\n",
-    "        )\n",
-    "\n",
-    "        return {\n",
-    "            \"prediction\": prediction_text,\n",
-    "            \"output\": result,\n",
-    "            \"tool_messages\": [tool_message],\n",
-    "            # \"tool_calls\": tool_calls_found,\n",
-    "            \"tool_called\": tools_called_value\n",
-    "        }\n",
-    "    except Exception as e:\n",
-    "        # Return a fallback response if the agent fails\n",
-    "        error_message = f\"\"\"I apologize, but I encountered an error while processing your banking request: {str(e)}.\n",
-    "        Please try rephrasing your question or contact support if the issue persists.\"\"\"\n",
-    "        return {\n",
-    "            \"prediction\": error_message, \n",
-    "            \"output\": {\n",
-    "                \"messages\": [HumanMessage(content=input[\"input\"]), SystemMessage(content=error_message)],\n",
-    "                \"error\": str(e)\n",
-    "            }\n",
-    "        }"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "fda87401",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3_3__'></a>\n",
-    "\n",
-    "#### Initialize the ValidMind model object\n",
-    "\n",
-    "We'll also need to register the banking agent as a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data.\n",
-    "\n",
-    "You simply initialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model) that:\n",
-    "\n",
-    "- Associates the wrapper function with the model for prediction\n",
-    "- Stores the system prompt template for documentation\n",
-    "- Provides a unique `input_id` for tracking and identification\n",
-    "- Enables the agent to be used with ValidMind's testing and documentation features"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "60a2ce7a",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the agent as a model\n",
-    "vm_banking_model = vm.init_model(\n",
-    "    input_id=\"banking_agent_model\",\n",
-    "    predict_fn=banking_agent_fn,\n",
-    "    prompt=Prompt(template=system_context)\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "949bcf53",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3_4__'></a>\n",
-    "\n",
-    "#### Store the agent reference\n",
-    "\n",
-    "We'll also store a reference to the original banking agent object in the ValidMind model. This allows us to access the full agent functionality directly if needed, while still maintaining the wrapper function interface for ValidMind's testing framework."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "2c653471",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Add the banking agent to the vm model\n",
-    "vm_banking_model.model = banking_agent"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d8d0c1c1",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3_5__'></a>\n",
-    "\n",
-    "#### Verify integration\n",
-    "\n",
-    "Let's confirm that the banking agent has been successfully integrated with ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "8e101b0f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "print(\"Banking Agent Successfully Integrated with ValidMind!\")\n",
-    "print(f\"Model ID: {vm_banking_model.input_id}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2a5f874e",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_4__'></a>\n",
-    "\n",
-    "### Validate the system prompt\n",
-    "\n",
-    "Let's get an initial sense of how well our defined system prompt meets a few best practices for prompt engineering by running a few tests — we'll run evaluation tests later on our agent's performance.\n",
-    "\n",
-    "You run individual tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module. Passing in our agentic model as an input, the tests below rate the prompt on a scale of 1-10 against the following criteria:\n",
-    "\n",
-    "- **[Clarity](https://docs.validmind.ai/tests/prompt_validation/Clarity.html)** — How clearly the prompt states the task.\n",
-    "- **[Conciseness](https://docs.validmind.ai/tests/prompt_validation/Conciseness.html)** — How succinctly the prompt states the task.\n",
-    "- **[Delimitation](https://docs.validmind.ai/tests/prompt_validation/Delimitation.html)** — When using complex prompts containing examples, contextual information, or other elements, is the prompt formatted in such a way that each element is clearly separated?\n",
-    "- **[NegativeInstruction](https://docs.validmind.ai/tests/prompt_validation/NegativeInstruction.html)** — Whether the prompt contains negative instructions.\n",
-    "- **[Specificity](https://docs.validmind.ai/tests/prompt_validation/Specificity.html)** — How specifically the prompt defines the task."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "f52dceb1",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.prompt_validation.Clarity\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_banking_model,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "70d52333",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.prompt_validation.Conciseness\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_banking_model,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "5aa89976",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.prompt_validation.Delimitation\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_banking_model,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "8630197e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.prompt_validation.NegativeInstruction\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_banking_model,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "bba99915",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.prompt_validation.Specificity\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_banking_model,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "51d61141",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Initializing the ValidMind dataset\n",
-    "\n",
-    "After validating our system prompt, let's import our sample dataset ([banking_test_dataset.py](banking_test_dataset.py)), which we'll use in the next section to evaluate our agent's performance across different banking scenarios:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0c70ca2c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from banking_test_dataset import banking_test_dataset"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "442ab66d",
-   "metadata": {},
-   "source": [
-    "The next step is to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
-    "\n",
-    "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
-    "- **`text_column`** — The name of the column containing the text input data.\n",
-    "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "a7e9d158",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_test_dataset = vm.init_dataset(\n",
-    "    input_id=\"banking_test_dataset\",\n",
-    "    dataset=banking_test_dataset,\n",
-    "    text_column=\"input\",\n",
-    "    target_column=\"possible_outputs\",\n",
-    ")\n",
-    "\n",
-    "print(\"Banking Test Dataset Initialized in ValidMind!\")\n",
-    "print(f\"Dataset ID: {vm_test_dataset.input_id}\")\n",
-    "print(f\"Dataset columns: {vm_test_dataset._df.columns}\")\n",
-    "vm_test_dataset._df"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7b01021c",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Assign predictions\n",
-    "\n",
-    "Now that both the model object and the datasets have been registered, we'll assign predictions to capture the banking agent's responses for evaluation:\n",
-    "\n",
-    "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
-    "- Here, this method links the banking agent's prediction values to our `vm_test_dataset` dataset.\n",
-    "\n",
-    "If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "1d462663",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_test_dataset.assign_predictions(vm_banking_model)\n",
-    "\n",
-    "print(\"Banking Agent Predictions Generated Successfully!\")\n",
-    "print(f\"Predictions assigned to {len(vm_test_dataset._df)} test cases\")\n",
-    "vm_test_dataset._df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4e56f556",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Running accuracy tests\n",
-    "\n",
-    "Using [`@vm.test`](https://docs.validmind.ai/validmind/validmind.html#test), let's implement some reusable custom *inline tests* to assess the accuracy of our banking agent:\n",
-    "\n",
-    "- An inline test refers to a test written and executed within the same environment as the code being tested — in this case, right in this Jupyter Notebook —  without requiring a separate test file or framework.\n",
-    "- You'll note that the custom test functions are just regular Python functions that can include and require any Python library as you see fit."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1bce9258",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Response accuracy test\n",
-    "\n",
-    "We'll create a custom test that evaluates the banking agent's ability to provide accurate responses by:\n",
-    "\n",
-    "- Testing against a dataset of predefined banking questions and expected answers.\n",
-    "- Checking if responses contain expected keywords and banking terminology.\n",
-    "- Providing detailed test results including pass/fail status.\n",
-    "- Helping identify any gaps in the agent's banking knowledge or response quality."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "90232066",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "@vm.test(\"my_custom_tests.banking_accuracy_test\")\n",
-    "def banking_accuracy_test(model, dataset, list_of_columns):\n",
-    "    \"\"\"\n",
-    "    The Banking Accuracy Test evaluates whether the agent’s responses include \n",
-    "    critical domain-specific keywords and phrases that indicate accurate, compliant,\n",
-    "    and contextually appropriate banking information. This test ensures that the agent\n",
-    "    provides responses containing the expected banking terminology, risk classifications,\n",
-    "    account details, or other domain-relevant information required for regulatory compliance,\n",
-    "    customer safety, and operational accuracy.\n",
-    "    \"\"\"\n",
-    "    df = dataset._df\n",
-    "    \n",
-    "    # Pre-compute responses for all tests\n",
-    "    y_true = dataset.y.tolist()\n",
-    "    y_pred = dataset.y_pred(model).tolist()\n",
-    "\n",
-    "    # Vectorized test results\n",
-    "    test_results = []\n",
-    "    for response, keywords in zip(y_pred, y_true):\n",
-    "        # Convert keywords to list if not already a list\n",
-    "        if not isinstance(keywords, list):\n",
-    "            keywords = [keywords]\n",
-    "        test_results.append(any(str(keyword).lower() in str(response).lower() for keyword in keywords))\n",
-    "        \n",
-    "    results = pd.DataFrame()\n",
-    "    column_names = [col + \"_details\" for col in list_of_columns]\n",
-    "    results[column_names] = df[list_of_columns]\n",
-    "    results[\"actual\"] = y_pred\n",
-    "    results[\"expected\"] = y_true\n",
-    "    results[\"passed\"] = test_results\n",
-    "    results[\"error\"] = None if test_results else f'Response did not contain any expected keywords: {y_true}'\n",
-    "    \n",
-    "    return results"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2a7f71f8",
-   "metadata": {},
-   "source": [
-    "Now that we've defined our custom response accuracy test, we can run it with the same `run_test()` function we used earlier to validate the system prompt — this time passing in our sample dataset and agentic model as inputs — and log the test results to the ValidMind Platform with the [`log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#log):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e68884d5",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.tests.run_test(\n",
-    "    \"my_custom_tests.banking_accuracy_test\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_dataset,\n",
-    "        \"model\": vm_banking_model\n",
-    "    },\n",
-    "    params={\n",
-    "        \"list_of_columns\": [\"input\"]\n",
-    "    }\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "94a717e7",
-   "metadata": {},
-   "source": [
-    "Let's review the first five rows of the test dataset to see how well the banking agent performed. Each column in the output serves a specific purpose in evaluating agent performance:\n",
-    "\n",
-    "| Column header | Description | Importance |\n",
-    "|--------------|-------------|------------|\n",
-    "| **`input`** | Original user query or request | Essential for understanding the context of each test case and tracing which inputs led to specific agent behaviors. |\n",
-    "| **`expected_tools`** | Banking tools that should be invoked for this request | Enables validation of correct tool selection, which is critical for agentic AI systems where choosing the right tool is a key success metric. |\n",
-    "| **`expected_output`** | Expected output or keywords that should appear in the response | Defines the success criteria for each test case, enabling objective evaluation of whether the agent produced the correct result. |\n",
-    "| **`session_id`** | Unique identifier for each test session | Allows tracking and correlation of related test runs, debugging specific sessions, and maintaining audit trails. |\n",
-    "| **`category`** | Classification of the request type | Helps organize test results by domain and identify performance patterns across different banking use cases. |\n",
-    "| **`banking_agent_model_output`** | Complete agent response including all messages and reasoning | Allows you to examine the full output to assess response quality, completeness, and correctness beyond just keyword matching. |\n",
-    "| **`banking_agent_model_tool_messages`** | Messages exchanged with the banking tools | Critical for understanding how the agent interacted with tools, what parameters were passed, and what tool outputs were received. |\n",
-    "| **`banking_agent_model_tool_called`** | Specific tool that was invoked | Enables validation that the agent selected the correct tool for each request, which is fundamental to agentic AI validation. |\n",
-    "| **`possible_outputs`** | Alternative valid outputs or keywords that could appear in the response | Provides flexibility in evaluation by accounting for multiple acceptable response formats or variations. |"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "78f7edb1",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_test_dataset.df.head(5)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1cb3e8bd",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Tool selection accuracy test\n",
-    "\n",
-    "We'll also create a custom test that evaluates the banking agent's ability to select the correct tools for different requests by:\n",
-    "\n",
-    "- Testing against a dataset of predefined banking queries with expected tool selections.\n",
-    "- Comparing the tools actually invoked by the agent against the expected tools for each request.\n",
-    "- Providing quantitative accuracy scores that measure the proportion of expected tools correctly selected.\n",
-    "- Helping identify gaps in the agent's understanding of user needs and tool selection logic."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "69263d62",
-   "metadata": {},
-   "source": [
-    "First, we'll define a helper function that extracts tool calls from the agent's messages and compares them against the expected tools. This function handles different message formats (dictionary or object) and calculates accuracy scores:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e68798be",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def validate_tool_calls_simple(messages, expected_tools):\n",
-    "    \"\"\"Simple validation of tool calls without RAGAS dependency issues.\"\"\"\n",
-    "    \n",
-    "    tool_calls_found = []\n",
-    "    \n",
-    "    for message in messages:\n",
-    "        if hasattr(message, 'tool_calls') and message.tool_calls:\n",
-    "            for tool_call in message.tool_calls:\n",
-    "                # Handle both dictionary and object formats\n",
-    "                if isinstance(tool_call, dict):\n",
-    "                    tool_calls_found.append(tool_call['name'])\n",
-    "                else:\n",
-    "                    # ToolCall object - use attribute access\n",
-    "                    tool_calls_found.append(tool_call.name)\n",
-    "    \n",
-    "    # Check if expected tools were called\n",
-    "    accuracy = 0.0\n",
-    "    matches = 0\n",
-    "    if expected_tools:\n",
-    "        matches = sum(1 for tool in expected_tools if tool in tool_calls_found)\n",
-    "        accuracy = matches / len(expected_tools)\n",
-    "    \n",
-    "    return {\n",
-    "        'expected_tools': expected_tools,\n",
-    "        'found_tools': tool_calls_found,\n",
-    "        'matches': matches,\n",
-    "        'total_expected': len(expected_tools) if expected_tools else 0,\n",
-    "        'accuracy': accuracy,\n",
-    "    }"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8f494fd3",
-   "metadata": {},
-   "source": [
-    "Now we'll define the main test function that uses the helper function to evaluate tool selection accuracy across all test cases in the dataset:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "604d7313",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.BankingToolCallAccuracy\")\n",
-    "def BankingToolCallAccuracy(dataset, agent_output_column, expected_tools_column):\n",
-    "    \"\"\"\n",
-    "    Evaluates the tool selection accuracy of a LangGraph-powered banking agent.\n",
-    "\n",
-    "    This test measures whether the agent correctly identifies and invokes the required banking tools\n",
-    "    for each user query scenario.\n",
-    "    For each case, the outputs generated by the agent (including its tool calls) are compared against an\n",
-    "    expected set of tools. The test considers both coverage and exactness: it computes the proportion of\n",
-    "    expected tools correctly called by the agent for each instance.\n",
-    "\n",
-    "    Parameters:\n",
-    "        dataset (VMDataset): The dataset containing user queries, agent outputs, and ground-truth tool expectations.\n",
-    "        agent_output_column (str): Dataset column name containing agent outputs (should include tool call details in 'messages').\n",
-    "        expected_tools_column (str): Dataset column specifying the true expected tools (as lists).\n",
-    "\n",
-    "    Returns:\n",
-    "        List[dict]: Per-row dictionaries with details: expected tools, found tools, match count, total expected, and accuracy score.\n",
-    "\n",
-    "    Purpose:\n",
-    "        Provides diagnostic evidence of the banking agent's core reasoning ability—specifically, its capacity to\n",
-    "        interpret user needs and select the correct banking actions. Useful for diagnosing gaps in tool coverage,\n",
-    "        misclassifications, or breakdowns in agent logic.\n",
-    "\n",
-    "    Interpretation:\n",
-    "        - An accuracy of 1.0 signals perfect tool selection for that example.\n",
-    "        - Lower scores may indicate partial or complete failures to invoke required tools.\n",
-    "        - Review 'found_tools' vs. 'expected_tools' to understand the source of discrepancies.\n",
-    "\n",
-    "    Strengths:\n",
-    "        - Directly tests a core capability of compositional tool-use agents.\n",
-    "        - Framework-agnostic; robust to tool call output format (object or dict).\n",
-    "        - Supports batch validation and result logging for systematic documentation.\n",
-    "\n",
-    "    Limitations:\n",
-    "        - Does not penalize extra, unnecessary tool calls.\n",
-    "        - Does not assess result quality—only correct invocation.\n",
-    "\n",
-    "    \"\"\"\n",
-    "    df = dataset._df\n",
-    "    \n",
-    "    results = []\n",
-    "    for i, row in df.iterrows():\n",
-    "        result = validate_tool_calls_simple(row[agent_output_column]['messages'], row[expected_tools_column])\n",
-    "        results.append(result)\n",
-    "         \n",
-    "    return results"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "57ab606b",
-   "metadata": {},
-   "source": [
-    "Finally, we can call our function with `run_test()` and log the test results to the ValidMind Platform:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "dd14115e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.tests.run_test(\n",
-    "    \"my_custom_tests.BankingToolCallAccuracy\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_dataset,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"agent_output_column\": \"banking_agent_model_output\",\n",
-    "        \"expected_tools_column\": \"expected_tools\"\n",
-    "    }\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "be8d5270",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Assigning AI evaluation metric scores\n",
-    "\n",
-    "*AI agent evaluation metrics* are specialized measurements designed to assess how well autonomous LLM-based agents reason, plan, select and execute tools, and ultimately complete user tasks by analyzing the *full execution trace* — including reasoning steps, tool calls, intermediate decisions, and outcomes, rather than just single input–output pairs. These metrics are essential because agent failures often occur in ways traditional LLM metrics miss — for example, choosing the right tool with wrong arguments, creating a good plan but not following it, or completing a task inefficiently.\n",
-    "\n",
-    "In this section, we'll evaluate our banking agent's outputs and add scoring to our sample dataset against metrics defined in [DeepEval’s AI agent evaluation framework](https://deepeval.com/guides/guides-ai-agent-evaluation-metrics) which breaks down AI agent evaluation into three layers with corresponding subcategories: **reasoning**, **action**, and **execution**.\n",
-    "\n",
-    "Together, these three metrics enable granular diagnosis of agent behavior, help pinpoint where failures occur (reasoning, action, or execution), and support both development benchmarking and production monitoring."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "25828bef",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Identify relevant DeepEval scorers\n",
-    "\n",
-    "*Scorers* are evaluation metrics that analyze model outputs and store their results in the dataset:\n",
-    "\n",
-    "- Each scorer adds a new column to the dataset with format: `{scorer_name}_{metric_name}`\n",
-    "- The column contains the numeric score (typically `0`-`1`) for each example\n",
-    "- Multiple scorers can be run on the same dataset, each adding their own column\n",
-    "- Scores are persisted in the dataset for later analysis and visualization\n",
-    "- Common scorer patterns include:\n",
-    "  - Model performance metrics (accuracy, F1, etc.)\n",
-    "  - Output quality metrics (relevance, faithfulness)\n",
-    "  - Task-specific metrics (completion, correctness)\n",
-    "\n",
-    "Use `list_scorers()` from [`validmind.scorers`](https://docs.validmind.ai/validmind/validmind/tests.html#scorer) to discover all available scoring methods and their IDs that can be used with `assign_scores()`. We'll filter these results to return only DeepEval scorers for our desired three metrics in a formatted table with descriptions:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "730c70ec",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load all DeepEval scorers\n",
-    "llm_scorers_dict = vm.tests.load._load_tests([s for s in vm.scorer.list_scorers() if \"deepeval\" in s.lower()])\n",
-    "\n",
-    "# Categorize scorers by metric layer\n",
-    "reasoning_scorers = {}\n",
-    "action_scorers = {}\n",
-    "execution_scorers = {}\n",
-    "\n",
-    "for scorer_id, scorer_func in llm_scorers_dict.items():\n",
-    "    tags = getattr(scorer_func, \"__tags__\", [])\n",
-    "    scorer_name = scorer_id.split(\".\")[-1]\n",
-    "\n",
-    "    if \"reasoning_layer\" in tags:\n",
-    "        reasoning_scorers[scorer_id] = scorer_func\n",
-    "    elif \"action_layer\" in tags:\n",
-    "        action_scorers[scorer_id] = scorer_func\n",
-    "    elif \"TaskCompletion\" in scorer_name:\n",
-    "        execution_scorers[scorer_id] = scorer_func\n",
-    "\n",
-    "# Display scorers by category\n",
-    "print(\"=\" * 80)\n",
-    "print(\"REASONING LAYER\")\n",
-    "print(\"=\" * 80)\n",
-    "if reasoning_scorers:\n",
-    "    reasoning_df = vm.tests.load._pretty_list_tests(reasoning_scorers, truncate=True)\n",
-    "    display(reasoning_df)\n",
-    "else:\n",
-    "    print(\"No reasoning layer scorers found.\")\n",
-    "\n",
-    "print(\"\\n\" + \"=\" * 80)\n",
-    "print(\"ACTION LAYER\")\n",
-    "print(\"=\" * 80)\n",
-    "if action_scorers:\n",
-    "    action_df = vm.tests.load._pretty_list_tests(action_scorers, truncate=True)\n",
-    "    display(action_df)\n",
-    "else:\n",
-    "    print(\"No action layer scorers found.\")\n",
-    "\n",
-    "print(\"\\n\" + \"=\" * 80)\n",
-    "print(\"EXECUTION LAYER\")\n",
-    "print(\"=\" * 80)\n",
-    "if execution_scorers:\n",
-    "    execution_df = vm.tests.load._pretty_list_tests(execution_scorers, truncate=True)\n",
-    "    display(execution_df)\n",
-    "else:\n",
-    "    print(\"No execution layer scorers found.\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e5fb739b",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Assign reasoning scores\n",
-    "\n",
-    "*Reasoning* evaluates planning and strategy generation:\n",
-    "\n",
-    "- **Plan quality** – How logical, complete, and efficient the agent’s plan is.\n",
-    "- **Plan adherence** – Whether the agent follows its own plan during execution."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "fde94d01",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_1__'></a>\n",
-    "\n",
-    "#### Plan quality score\n",
-    "\n",
-    "Let's measure how well our banking agent generates a plan before acting. A high score means the plan is logical, complete, and efficient."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "52f362ba",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_test_dataset.assign_scores(\n",
-    "    metrics = \"validmind.scorers.llm.deepeval.PlanQuality\",\n",
-    "    model = vm_banking_model,\n",
-    "    input_column = \"input\",\n",
-    ")\n",
-    "vm_test_dataset._df[['banking_agent_model_PlanQuality_score','banking_agent_model_PlanQuality_reason']]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d631fd12",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2_2__'></a>\n",
-    "\n",
-    "#### Plan adherence score\n",
-    "\n",
-    "Let's check whether our banking agent follows the plan it created. Deviations lower this score and indicate gaps between reasoning and execution."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "4124a7c2",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_test_dataset.assign_scores(\n",
-    "    metrics = \"validmind.scorers.llm.deepeval.PlanAdherence\",\n",
-    "    input_column = \"input\",\n",
-    "    model = vm_banking_model,\n",
-    ")\n",
-    "vm_test_dataset._df[['banking_agent_model_PlanAdherence_score','banking_agent_model_PlanAdherence_reason']]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "82e5e6f1",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3__'></a>\n",
-    "\n",
-    "### Assign action scores\n",
-    "\n",
-    "*Action* assesses tool usage and argument generation:\n",
-    "\n",
-    "- **Tool correctness** – Whether the agent selects and calls the right tools.\n",
-    "- **Argument correctness** – Whether the agent generates correct tool arguments."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e641c9f2",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3_1__'></a>\n",
-    "\n",
-    "#### Tool correctness score\n",
-    "\n",
-    "Let's evaluate if our banking agent selects the appropriate tool for the task. Choosing the wrong tool reduces performance even if reasoning was correct."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "8d2e8a25",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_test_dataset.assign_scores(\n",
-    "    metrics = \"validmind.scorers.llm.deepeval.ToolCorrectness\",\n",
-    "    input_column = \"input\",\n",
-    "    model = vm_banking_model,\n",
-    "    expected_tools_called_column = \"expected_tools\",\n",
-    "    actual_tools_called_column = \"banking_agent_model_tool_called\",\n",
-    ")\n",
-    "vm_test_dataset._df[['banking_agent_model_ToolCorrectness_score','banking_agent_model_ToolCorrectness_reason']]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "dd758ba5",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3_2__'></a>\n",
-    "\n",
-    "#### Argument correctness score\n",
-    "\n",
-    "Let's assesses whether our banking agent provides correct inputs or arguments to the selected tool. Incorrect arguments can lead to failed or unexpected results."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "04f90489",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_test_dataset.assign_scores(\n",
-    "    metrics = \"validmind.scorers.llm.deepeval.ArgumentCorrectness\",\n",
-    "    input_column = \"input\",\n",
-    "    model = vm_banking_model,\n",
-    "    actual_tools_called_column = \"banking_agent_model_tool_called\",\n",
-    ")\n",
-    "vm_test_dataset._df[['banking_agent_model_ArgumentCorrectness_score','banking_agent_model_ArgumentCorrectness_reason']]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1aeec2f5",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4__'></a>\n",
-    "\n",
-    "### Assign execution score\n",
-    "\n",
-    "*Execution* measures end-to-end performance:\n",
-    "\n",
-    "- **Task completion** – Whether the agent successfully completes the intended task."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "eb9ab8de",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4_1__'></a>\n",
-    "\n",
-    "#### Task completion score\n",
-    "\n",
-    "Let's evaluate whether our banking agent successfully completes the requested tasks. Incomplete task execution can lead to user dissatisfaction and failed banking operations."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "05024f1f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_test_dataset.assign_scores(\n",
-    "    metrics = \"validmind.scorers.llm.deepeval.TaskCompletion\",\n",
-    "    input_column = \"input\",\n",
-    "    model = vm_banking_model,\n",
-    "    actual_tools_called_column = \"banking_agent_model_tool_called\",\n",
-    ")\n",
-    "vm_test_dataset._df[['banking_agent_model_TaskCompletion_score','banking_agent_model_TaskCompletion_reason']]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b577c282",
-   "metadata": {},
-   "source": [
-    "As you recall from the beginning of this section, when we run scorers through `assign_scores()`, the return values are automatically processed and added as new columns with the format `{scorer_name}_{metric_name}`. Note that the task completion scorer has added a new column `TaskCompletion_score` to our dataset.\n",
-    "\n",
-    "We'll use this column to visualize the distribution of task completion scores across our test cases through the [BoxPlot test](https://docs.validmind.ai/validmind/validmind/tests/plots/BoxPlot.html#boxplot):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "7f6d08ca",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.plots.BoxPlot\",\n",
-    "    inputs={\"dataset\": vm_test_dataset},\n",
-    "    params={\n",
-    "        \"columns\": \"banking_agent_model_TaskCompletion_score\",\n",
-    "        \"title\": \"Distribution of Task Completion Scores\",\n",
-    "        \"ylabel\": \"Score\",\n",
-    "        \"figsize\": (8, 6)\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "30d9ec62",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Running RAGAS tests\n",
-    "\n",
-    "Next, let's run some out-of-the-box *Retrieval-Augmented Generation Assessment* (RAGAS) tests available in the ValidMind Library. RAGAS provides specialized metrics for evaluating retrieval-augmented generation systems and conversational AI agents. These metrics analyze different aspects of agent performance by assessing how well systems integrate retrieved information with generated responses.\n",
-    "\n",
-    "Our banking agent uses tools to retrieve information and generates responses based on that context, making it similar to a RAG system. RAGAS metrics help evaluate the quality of this integration by analyzing the relationship between retrieved tool outputs, user queries, and generated responses.\n",
-    "\n",
-    "These tests provide insights into how well our banking agent integrates tool usage with conversational abilities, ensuring it provides accurate, relevant, and helpful responses to banking users while maintaining fidelity to retrieved information."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8288f6c3",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Identify relevant RAGAS tests\n",
-    "\n",
-    "Let's explore some of ValidMind's available tests. Using ValidMind’s repository of tests streamlines your development testing, and helps you ensure that your models are being documented and evaluated appropriately.\n",
-    "\n",
-    "You can pass `tasks` and `tags` as parameters to the [`vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to filter the tests based on the tags and task types:\n",
-    "\n",
-    "- **`tasks`** represent the kind of modeling task associated with a test. Here we'll focus on `text_qa` tasks.\n",
-    "- **`tags`** are free-form descriptions providing more details about the test, for example, what category the test falls into. Here we'll focus on the `ragas` tag.\n",
-    "\n",
-    "We'll then run three of these tests returned as examples below."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0701f5a9",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(task=\"text_qa\", tags=[\"ragas\"])"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2ce24ba0",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1_1__'></a>\n",
-    "\n",
-    "#### Faithfulness\n",
-    "\n",
-    "Let's evaluate whether the banking agent's responses accurately reflect the information retrieved from tools. Unfaithful responses can misreport credit analysis, financial calculations, and compliance results—undermining user trust in the banking agent.\n",
-    "\n",
-    "RAGAS runs a **judge LLM** that can be much slower than your agent if it uses the same model. In your `.env`, set **`VM_RAGAS_JUDGE_MODEL`** (for example `gpt-4o-mini`) so faithfulness and other RAGAS metrics use a faster judge while **`VM_OPENAI_MODEL`** can stay tuned for the agent. RAGAS execution also respects **`VM_RAGAS_TIMEOUT`**, **`VM_RAGAS_MAX_RETRIES`**, and **`VM_RAGAS_MAX_WORKERS`** (defaults help notebook stability).\n",
-    "\n",
-    "The cell below passes **`max_eval_rows`** and **`max_response_chars`** to bound evaluation cost on long agent outputs."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "92044533",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.model_validation.ragas.Faithfulness\",\n",
-    "    inputs={\"dataset\": vm_test_dataset},\n",
-    "    param_grid={\n",
-    "        \"user_input_column\": [\"input\"],\n",
-    "        \"response_column\": [\"banking_agent_model_prediction\"],\n",
-    "        \"retrieved_contexts_column\": [\"banking_agent_model_tool_messages\"],\n",
-    "        \"max_eval_rows\": [4],\n",
-    "        \"max_response_chars\": [6000],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4d1fcfcd",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1_2__'></a>\n",
-    "\n",
-    "#### Response Relevancy\n",
-    "\n",
-    "Let's evaluate whether the banking agent's answers address the user's original question or request. Irrelevant or off-topic responses can frustrate users and fail to deliver the banking information they need."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d7483bc3",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.model_validation.ragas.ResponseRelevancy\",\n",
-    "    inputs={\"dataset\": vm_test_dataset},\n",
-    "    params={\n",
-    "        \"user_input_column\": \"input\",\n",
-    "        \"response_column\": \"banking_agent_model_prediction\",\n",
-    "        \"retrieved_contexts_column\": \"banking_agent_model_tool_messages\",\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "38c1dfb5",
-   "metadata": {},
-   "source": [
-    "<a id='toc7_1_3__'></a>\n",
-    "\n",
-    "#### Context Recall\n",
-    "\n",
-    "Let's evaluate how well the banking agent uses the information retrieved from tools when generating its responses. Poor context recall can lead to incomplete or underinformed answers even when the right tools were selected."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e5dc00ce",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.model_validation.ragas.ContextRecall\",\n",
-    "    inputs={\"dataset\": vm_test_dataset},\n",
-    "    param_grid={\n",
-    "        \"user_input_column\": [\"input\"],\n",
-    "        \"retrieved_contexts_column\": [\"banking_agent_model_tool_messages\"],\n",
-    "        \"reference_column\": [\"banking_agent_model_prediction\"],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "95e1e16a",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Running safety tests\n",
-    "\n",
-    "Finally, let's run some out-of-the-box *safety* tests available in the ValidMind Library. Safety tests provide specialized metrics for evaluating whether AI agents operate reliably and securely. These metrics analyze different aspects of agent behavior by assessing adherence to safety guidelines, consistency of outputs, and resistance to harmful or inappropriate requests.\n",
-    "\n",
-    "Our banking agent handles sensitive financial information and user requests, making safety and reliability essential. Safety tests help evaluate whether the agent maintains appropriate boundaries, responds consistently and correctly to inputs, and avoids generating harmful, biased, or unprofessional content.\n",
-    "\n",
-    "These tests provide insights into how well our banking agent upholds standards of fairness and professionalism, ensuring it operates reliably and securely for banking users."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e0972afa",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_1_1__'></a>\n",
-    "\n",
-    "#### AspectCritic\n",
-    "\n",
-    "Let's evaluate our banking agent's responses across multiple quality dimensions — conciseness, coherence, correctness, harmfulness, and maliciousness. Weak performance on these dimensions can degrade user experience, fall short of professional banking standards, or introduce safety risks. \n",
-    "\n",
-    "We'll use the `AspectCritic` we identified earlier:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "148daa2b",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.model_validation.ragas.AspectCritic\",\n",
-    "    inputs={\"dataset\": vm_test_dataset},\n",
-    "    param_grid={\n",
-    "        \"user_input_column\": [\"input\"],\n",
-    "        \"response_column\": [\"banking_agent_model_prediction\"],\n",
-    "        \"retrieved_contexts_column\": [\"banking_agent_model_tool_messages\"],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "16f29c8d",
-   "metadata": {},
-   "source": [
-    "<a id='toc8_1_2__'></a>\n",
-    "\n",
-    "#### Bias\n",
-    "\n",
-    "Let's evaluate whether our banking agent's prompts contain unintended biases that could affect banking decisions. Biased prompts can lead to unfair or discriminatory outcomes — undermining customer trust and exposing the institution to compliance risk.\n",
-    "\n",
-    "We'll first use `list_tests()` again to filter for tests relating to `prompt_validation`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "74eba86c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(filter=\"prompt_validation\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e9413803",
-   "metadata": {},
-   "source": [
-    "And then run the identified `Bias` test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "062cf8e7",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.prompt_validation.Bias\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_banking_model,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8f3f2dbe",
-   "metadata": {},
-   "source": [
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8716165d",
-   "metadata": {},
-   "source": [
-    "<a id='toc9_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "    What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "3. Click into any section related to the tests we ran in this notebook, for example: **4.3. Prompt Evaluation** to review the results of the tests we logged."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7c4a78ce",
-   "metadata": {},
-   "source": [
-    "<a id='toc9_2__'></a>\n",
-    "\n",
-    "### Customize the banking agent for your use case\n",
-    "\n",
-    "You've now built an agentic AI system designed for banking use cases that supports compliance with supervisory guidance such as SR 11-7 and SS1/23, covering credit and fraud risk assessment for both retail and commercial banking. Extend this example agent to real-world banking scenarios and production deployment by:\n",
-    "\n",
-    "- Adapting the banking tools to your organization's specific requirements\n",
-    "- Adding more banking scenarios and edge cases to your test set\n",
-    "- Connecting the agent to your banking systems and databases\n",
-    "- Implementing additional banking-specific tools and workflows"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7f9385d3",
-   "metadata": {},
-   "source": [
-    "<a id='toc9_3__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "Learn more about the ValidMind Library tools we used in this notebook:\n",
-    "\n",
-    "- [Custom prompts](https://docs.validmind.ai/notebooks/how_to/customize_test_result_descriptions.html)\n",
-    "- [Custom tests](https://docs.validmind.ai/notebooks/code_samples/custom_tests/implement_custom_tests.html)\n",
-    "- [ValidMind scorers](https://docs.validmind.ai/notebooks/how_to/assign_scores_complete_tutorial.html)\n",
-    "\n",
-    "We also offer many more interactive notebooks to help you document models:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "fdd5c0db",
-   "metadata": {},
-   "source": [
-    "<a id='toc10__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "9733adff",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "829429fd",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "55339760",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-b9e82bcf4e364c4f8e5ae4bb0e4b2865",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "validmind-1QuffXMV-py3.11",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.11.9"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Document an agentic AI system\n",
+        "\n",
+        "Build and document an agentic AI system with the ValidMind Library. Construct a LangGraph-based banking agent, assign AI evaluation metric scores to your agent, and run accuracy, RAGAS, and safety tests, then log those test results to the ValidMind Platform.\n",
+        "\n",
+        "An _AI agent_ is an autonomous system that interprets inputs, selects from available tools or actions, and executes multi-step behaviors to achieve defined goals. In this notebook, the agent acts as a banking assistant that analyzes user requests and automatically selects and invokes the appropriate specialized banking tool to deliver accurate, compliant, and actionable responses.\n",
+        "\n",
+        "- This agent enables financial institutions to automate complex banking workflows where different customer requests require different specialized tools and knowledge bases.\n",
+        "- Effective validation of agentic AI systems reduces the risks of agents misinterpreting inputs, failing to extract required parameters, or producing incorrect assessments or actions — such as selecting the wrong tool.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For the LLM components in this notebook to function properly, you'll need access to OpenAI.</b></span>\n",
+        "<br><br>\n",
+        "Before you continue, ensure that a valid <code>OPENAI_API_KEY</code> is set in your <code>.env</code> file.</div>"
+      ],
+      "id": "eee6b64c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "    - [Preview the documentation template](#toc2_2_4__)    \n",
+        "  - [Verify OpenAI API access](#toc2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_4__)    \n",
+        "- [Building the LangGraph agent](#toc3__)    \n",
+        "  - [Test available banking tools](#toc3_1__)    \n",
+        "  - [Create LangGraph banking agent](#toc3_2__)    \n",
+        "    - [Define system prompt](#toc3_2_1__)    \n",
+        "    - [Initialize the LLM](#toc3_2_2__)    \n",
+        "    - [Define agent state structure](#toc3_2_3__)    \n",
+        "    - [Create agent workflow function](#toc3_2_4__)    \n",
+        "    - [Instantiate the banking agent](#toc3_2_5__)    \n",
+        "  - [Integrate agent with ValidMind](#toc3_3__)    \n",
+        "    - [Import ValidMind components](#toc3_3_1__)    \n",
+        "    - [Create agent wrapper function](#toc3_3_2__)    \n",
+        "    - [Initialize the ValidMind model object](#toc3_3_3__)    \n",
+        "    - [Store the agent reference](#toc3_3_4__)    \n",
+        "    - [Verify integration](#toc3_3_5__)    \n",
+        "  - [Validate the system prompt](#toc3_4__)    \n",
+        "- [Initializing the ValidMind dataset](#toc4__)    \n",
+        "  - [Assign predictions](#toc4_1__)    \n",
+        "- [Running accuracy tests](#toc5__)    \n",
+        "  - [Response accuracy test](#toc5_1__)    \n",
+        "  - [Tool selection accuracy test](#toc5_2__)    \n",
+        "- [Assigning AI evaluation metric scores](#toc6__)    \n",
+        "  - [Identify relevant DeepEval scorers](#toc6_1__)    \n",
+        "  - [Assign reasoning scores](#toc6_2__)    \n",
+        "    - [Plan quality score](#toc6_2_1__)    \n",
+        "    - [Plan adherence score](#toc6_2_2__)    \n",
+        "  - [Assign action scores](#toc6_3__)    \n",
+        "    - [Tool correctness score](#toc6_3_1__)    \n",
+        "    - [Argument correctness score](#toc6_3_2__)    \n",
+        "  - [Assign execution score](#toc6_4__)    \n",
+        "    - [Task completion score](#toc6_4_1__)    \n",
+        "- [Running RAGAS tests](#toc7__)    \n",
+        "  - [Identify relevant RAGAS tests](#toc7_1__)    \n",
+        "    - [Faithfulness](#toc7_1_1__)    \n",
+        "    - [Response Relevancy](#toc7_1_2__)    \n",
+        "    - [Context Recall](#toc7_1_3__)    \n",
+        "- [Running safety tests](#toc8__)    \n",
+        "    - [AspectCritic](#toc8_1_1__)    \n",
+        "    - [Bias](#toc8_1_2__)    \n",
+        "- [Next steps](#toc9__)    \n",
+        "  - [Work with your model documentation](#toc9_1__)    \n",
+        "  - [Customize the banking agent for your use case](#toc9_2__)    \n",
+        "  - [Discover more learning resources](#toc9_3__)    \n",
+        "- [Upgrade ValidMind](#toc10__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "30927b2b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models. \n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators."
+      ],
+      "id": "b58139db"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ],
+      "id": "7e30d36b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ],
+      "id": "1cba586e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "5c46f003"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "11a2d7a5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.9 <= x <= 3.14</div>\n",
+        "\n",
+        "Let's begin by installing the ValidMind Library with large language model (LLM) support:"
+      ],
+      "id": "fbab0edf"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q \"validmind[llm]\" \"langgraph==0.3.21\""
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "1982a118"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ],
+      "id": "14578e26"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook.\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ],
+      "id": "83d47d89"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Agentic AI`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "bb2c5670"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Can't select this template?</b></span>\n",
+        "<br></br>\n",
+        "Your organization administrators may need to add it to your template library:\n",
+        "<ul>\n",
+        "<li><a href=\"agentic_ai_template.yaml\" style=\"color: #DE257E;\"><b>Download Template YAML</b></a></li>\n",
+        "<li><a href=\"https://docs.validmind.ai/guide/templates/customize-document-templates.html\" style=\"color: #DE257E;\"><b>Customize Document Templates</b></a></li>\n",
+        "</ul>\n",
+        "</div>"
+      ],
+      "id": "98e475c1"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "0d1a13ca"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "d6ccbefc"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_4__'></a>\n",
+        "\n",
+        "#### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ],
+      "id": "3605df4f"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "dffdaa6f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Verify OpenAI API access\n",
+        "\n",
+        "Verify that a valid `OPENAI_API_KEY` is set in your `.env` file:"
+      ],
+      "id": "d467c1d2"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load environment variables if using .env file\n",
+        "try:\n",
+        "    from dotenv import load_dotenv\n",
+        "    load_dotenv()\n",
+        "except ImportError:\n",
+        "    print(\"dotenv not installed. Make sure OPENAI_API_KEY is set in your environment.\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "22cc39cb"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Let's import all the necessary libraries to prepare for building our banking LangGraph agentic system:\n",
+        "\n",
+        "- **Standard libraries** for data handling and environment management.\n",
+        "- **pandas**, a Python library for data manipulation and analytics, imported under the alias `pd`. We'll also configure pandas to show all columns and all rows at full width for easier debugging and inspection.\n",
+        "- **LangChain** components for LLM integration and tool management.\n",
+        "- **LangGraph** for building stateful, multi-step agent workflows.\n",
+        "- **Banking tools** for specialized financial services as defined in [banking_tools.py](banking_tools.py)."
+      ],
+      "id": "b56c3f39"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from typing import TypedDict, Annotated, Sequence\n",
+        "\n",
+        "from langchain_core.messages import BaseMessage, HumanMessage, SystemMessage\n",
+        "from langchain_openai import ChatOpenAI\n",
+        "from langgraph.checkpoint.memory import MemorySaver\n",
+        "from langgraph.graph import StateGraph, END, START\n",
+        "from langgraph.graph.message import add_messages\n",
+        "from langgraph.prebuilt import ToolNode\n",
+        "\n",
+        "# LOCAL IMPORTS FROM banking_tools.py\n",
+        "from banking_tools import AVAILABLE_TOOLS\n",
+        "\n",
+        "import pandas as pd\n",
+        "# Configure pandas to show all columns and all rows at full width\n",
+        "pd.set_option('display.max_columns', None)\n",
+        "pd.set_option('display.max_colwidth', None)\n",
+        "pd.set_option('display.width', None)\n",
+        "pd.set_option('display.max_rows', None)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "2058d1ac"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Building the LangGraph agent"
+      ],
+      "id": "cc1d3265"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Test available banking tools\n",
+        "\n",
+        "We'll use the demo banking tools defined in `banking_tools.py`, which cover the following financial services use cases:\n",
+        "\n",
+        "- **Credit Risk Analyzer** - Loan applications and credit decisions\n",
+        "- **Customer Account Manager** - Account services and customer support\n",
+        "- **Fraud Detection System** - Security and fraud prevention"
+      ],
+      "id": "a3c421c4"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "print(f\"Available tools: {len(AVAILABLE_TOOLS)}\")\n",
+        "print(\"\\nTool Details:\")\n",
+        "for i, tool in enumerate(AVAILABLE_TOOLS, 1):\n",
+        "    print(f\"   - {tool.name}\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "1e0a120c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's test each banking tool individually to ensure they're working correctly before integrating them into our agent:"
+      ],
+      "id": "53906630"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Test 1: Credit Risk Analyzer\n",
+        "print(\"TEST 1: Credit Risk Analyzer\")\n",
+        "print(\"-\" * 40)\n",
+        "try:\n",
+        "    # Access the underlying function using .func\n",
+        "    credit_result = AVAILABLE_TOOLS[0].func(\n",
+        "        customer_income=75000,\n",
+        "        customer_debt=1200,\n",
+        "        credit_score=720,\n",
+        "        loan_amount=50000,\n",
+        "        loan_type=\"personal\"\n",
+        "    )\n",
+        "    print(credit_result)\n",
+        "    print(\"Credit Risk Analyzer test PASSED\")\n",
+        "except Exception as e:\n",
+        "    print(f\"Credit Risk Analyzer test FAILED: {e}\")\n",
+        "\n",
+        "print(\"\" + \"=\" * 60)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "dc0caff2"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "# Test 2: Customer Account Manager\n",
+        "print(\"TEST 2: Customer Account Manager\")\n",
+        "print(\"-\" * 40)\n",
+        "try:\n",
+        "    # Test checking balance\n",
+        "    account_result = AVAILABLE_TOOLS[1].func(\n",
+        "        account_type=\"checking\",\n",
+        "        customer_id=\"12345\",\n",
+        "        action=\"check_balance\"\n",
+        "    )\n",
+        "    print(account_result)\n",
+        "\n",
+        "    # Test getting account info\n",
+        "    info_result = AVAILABLE_TOOLS[1].func(\n",
+        "        account_type=\"all\",\n",
+        "        customer_id=\"12345\", \n",
+        "        action=\"get_info\"\n",
+        "    )\n",
+        "    print(info_result)\n",
+        "    print(\"Customer Account Manager test PASSED\")\n",
+        "except Exception as e:\n",
+        "    print(f\"Customer Account Manager test FAILED: {e}\")\n",
+        "\n",
+        "print(\"\" + \"=\" * 60)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "b6b227db"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "# Test 3: Fraud Detection System\n",
+        "print(\"TEST 3: Fraud Detection System\")\n",
+        "print(\"-\" * 40)\n",
+        "try:\n",
+        "    fraud_result = AVAILABLE_TOOLS[2].func(\n",
+        "        transaction_id=\"TX123\",\n",
+        "        customer_id=\"12345\",\n",
+        "        transaction_amount=500.00,\n",
+        "        transaction_type=\"withdrawal\",\n",
+        "        location=\"Miami, FL\",\n",
+        "        device_id=\"DEVICE_001\"\n",
+        "    )\n",
+        "    print(fraud_result)\n",
+        "    print(\"Fraud Detection System test PASSED\")\n",
+        "except Exception as e:\n",
+        "    print(f\"Fraud Detection System test FAILED: {e}\")\n",
+        "\n",
+        "print(\"\" + \"=\" * 60)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "a983b30d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Create LangGraph banking agent\n",
+        "\n",
+        "With our tools ready to go, we'll create our intelligent banking agent with LangGraph that automatically selects and uses the appropriate banking tool based on a user request."
+      ],
+      "id": "1424baed"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_1__'></a>\n",
+        "\n",
+        "#### Define system prompt\n",
+        "\n",
+        "We'll begin by defining our system prompt, which provides the LLM with context about its role as a banking assistant and guidance on when to use each available tool:"
+      ],
+      "id": "3469d656"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "# Enhanced banking system prompt with tool selection guidance\n",
+        "system_context = \"\"\"You are a professional banking AI assistant with access to specialized banking tools.\n",
+        "            Analyze the user's banking request and directly use the most appropriate tools to help them.\n",
+        "            \n",
+        "            AVAILABLE BANKING TOOLS:\n",
+        "            \n",
+        "            credit_risk_analyzer - Analyze credit risk for loan applications and credit decisions\n",
+        "            - Use for: loan applications, credit assessments, risk analysis, mortgage eligibility\n",
+        "            - Examples: \"Analyze credit risk for $50k personal loan\", \"Assess mortgage eligibility for $300k home purchase\"\n",
+        "            - Parameters: customer_income, customer_debt, credit_score, loan_amount, loan_type\n",
+        "\n",
+        "            customer_account_manager - Manage customer accounts and provide banking services\n",
+        "            - Use for: account information, transaction processing, product recommendations, customer service\n",
+        "            - Examples: \"Check balance for checking account 12345\", \"Recommend products for customer with high balance\"\n",
+        "            - Parameters: account_type, customer_id, action, amount, account_details\n",
+        "\n",
+        "            fraud_detection_system - Analyze transactions for potential fraud and security risks\n",
+        "            - Use for: transaction monitoring, fraud prevention, risk assessment, security alerts\n",
+        "            - Examples: \"Analyze fraud risk for $500 ATM withdrawal in Miami\", \"Check security for $2000 online purchase\"\n",
+        "            - Parameters: transaction_id, customer_id, transaction_amount, transaction_type, location, device_id\n",
+        "\n",
+        "            BANKING INSTRUCTIONS:\n",
+        "            - Analyze the user's banking request carefully and identify the primary need\n",
+        "            - If they need credit analysis → use credit_risk_analyzer\n",
+        "            - If they need financial calculations → use financial_calculator\n",
+        "            - If they need account services → use customer_account_manager\n",
+        "            - If they need security analysis → use fraud_detection_system\n",
+        "            - Extract relevant parameters from the user's request\n",
+        "            - Provide helpful, accurate banking responses based on tool outputs\n",
+        "            - Always consider banking regulations, risk management, and best practices\n",
+        "            - Be professional and thorough in your analysis\n",
+        "\n",
+        "            Choose and use tools wisely to provide the most helpful banking assistance.\n",
+        "            Describe the response in user friendly manner with details describing the tool output. \n",
+        "            Provide the response in at least 500 words.\n",
+        "            Generate a concise execution plan for the banking request.\n",
+        "        \"\"\""
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "7971c427"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_2__'></a>\n",
+        "\n",
+        "#### Initialize the LLM\n",
+        "\n",
+        "Let's initialize the LLM that will power our banking agent:"
+      ],
+      "id": "b66c1ac4"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Initialize the main LLM for banking responses\n",
+        "main_llm = ChatOpenAI(\n",
+        "    model=\"gpt-5-mini\",\n",
+        "    reasoning={\n",
+        "        \"effort\": \"low\",\n",
+        "        \"summary\": \"auto\"\n",
+        "    }\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "866066e7"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Then bind the available banking tools to the LLM, enabling the model to automatically recognize and invoke each tool when appropriate based on request input and the system prompt we defined above:"
+      ],
+      "id": "8220afd6"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Bind all banking tools to the main LLM\n",
+        "llm_with_tools = main_llm.bind_tools(AVAILABLE_TOOLS)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "906d8132"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_3__'></a>\n",
+        "\n",
+        "#### Define agent state structure\n",
+        "\n",
+        "The agent state defines the data structure that flows through the LangGraph workflow. It includes:\n",
+        "\n",
+        "- **messages** — The conversation history between the user and agent\n",
+        "- **user_input** — The current user request\n",
+        "- **session_id** — A unique identifier for the conversation session\n",
+        "- **context** — Additional context that can be passed between nodes\n",
+        "\n",
+        "Defining this state structure keeps the data consistent throughout the agent's execution and allows for multi-turn conversations with memory:"
+      ],
+      "id": "43f56651"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Banking Agent State Definition\n",
+        "class BankingAgentState(TypedDict):\n",
+        "    messages: Annotated[Sequence[BaseMessage], add_messages]\n",
+        "    user_input: str\n",
+        "    session_id: str\n",
+        "    context: dict"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "6b926ddf"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_4__'></a>\n",
+        "\n",
+        "#### Create agent workflow function\n",
+        "\n",
+        "We'll build the LangGraph agent workflow with two main components:\n",
+        "\n",
+        "1. **LLM node** — Processes user requests, applies the system prompt, and decides whether to use tools.\n",
+        "2. **Tools node** — Executes the selected banking tools when the LLM determines they're needed.\n",
+        "\n",
+        "The workflow begins with the LLM analyzing the request. If tools are needed, the tools node executes them and returns control to the LLM to generate the final response; otherwise, the workflow ends."
+      ],
+      "id": "387ba780"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def create_banking_langgraph_agent():\n",
+        "    \"\"\"Create a comprehensive LangGraph banking agent with intelligent tool selection.\"\"\"\n",
+        "    def llm_node(state: BankingAgentState) -> BankingAgentState:\n",
+        "        \"\"\"Main LLM node that processes banking requests and selects appropriate tools.\"\"\"\n",
+        "        messages = state[\"messages\"]\n",
+        "        # Add system context to messages\n",
+        "        enhanced_messages = [SystemMessage(content=system_context)] + list(messages)\n",
+        "        # Get LLM response with tool selection\n",
+        "        response = llm_with_tools.invoke(enhanced_messages)\n",
+        "        return {\n",
+        "            **state,\n",
+        "            \"messages\": messages + [response]\n",
+        "        }\n",
+        "    \n",
+        "    def should_continue(state: BankingAgentState) -> str:\n",
+        "        \"\"\"Decide whether to use tools or end the conversation.\"\"\"\n",
+        "        last_message = state[\"messages\"][-1]\n",
+        "        # Check if the LLM wants to use tools\n",
+        "        if hasattr(last_message, 'tool_calls') and last_message.tool_calls:\n",
+        "            return \"tools\"\n",
+        "        return END\n",
+        "        \n",
+        "    # Create the banking state graph\n",
+        "    workflow = StateGraph(BankingAgentState)\n",
+        "    # Add nodes\n",
+        "    workflow.add_node(\"llm\", llm_node)\n",
+        "    workflow.add_node(\"tools\", ToolNode(AVAILABLE_TOOLS))\n",
+        "    # Simplified entry point - go directly to LLM\n",
+        "    workflow.add_edge(START, \"llm\")\n",
+        "    # From LLM, decide whether to use tools or end\n",
+        "    workflow.add_conditional_edges(\n",
+        "        \"llm\",\n",
+        "        should_continue,\n",
+        "        {\"tools\": \"tools\", END: END}\n",
+        "    )\n",
+        "    # Tool execution flows back to LLM for final response\n",
+        "    workflow.add_edge(\"tools\", \"llm\")\n",
+        "    # Set up memory\n",
+        "    memory = MemorySaver()\n",
+        "    # Compile the graph\n",
+        "    agent = workflow.compile(checkpointer=memory)\n",
+        "    return agent"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "2c9bf585"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_5__'></a>\n",
+        "\n",
+        "#### Instantiate the banking agent\n",
+        "\n",
+        "Now, we'll create an instance of the banking agent by calling the workflow creation function.\n",
+        "\n",
+        "This compiled agent is ready to process banking requests and will automatically select and use the appropriate tools based on user queries:"
+      ],
+      "id": "765242e9"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Create the banking intelligent agent\n",
+        "banking_agent = create_banking_langgraph_agent()\n",
+        "\n",
+        "print(\"Banking LangGraph Agent Created Successfully!\")\n",
+        "print(\"\\nFeatures:\")\n",
+        "print(\"   - Intelligent banking tool selection\")\n",
+        "print(\"   - Comprehensive banking system prompt\")\n",
+        "print(\"   - Streamlined workflow: LLM → Tools → Response\")\n",
+        "print(\"   - Automatic tool parameter extraction\")\n",
+        "print(\"   - Professional banking assistance\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "455b8ee4"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3__'></a>\n",
+        "\n",
+        "### Integrate agent with ValidMind\n",
+        "\n",
+        "To integrate our LangGraph banking agent with ValidMind, we need to create a wrapper function that ValidMind can use to invoke the agent and extract the necessary information for testing and documentation, allowing ValidMind to run validation tests on the agent's behavior, tool usage, and responses."
+      ],
+      "id": "e00dac77"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3_1__'></a>\n",
+        "\n",
+        "#### Import ValidMind components\n",
+        "\n",
+        "We'll start with importing the necessary ValidMind components for integrating our agent:\n",
+        "\n",
+        "- `Prompt` from `validmind.models` for handling prompt-based model inputs\n",
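+        "- `extract_tool_calls_from_agent_output` and `_convert_to_tool_call_list` from `validmind.scorers.llm.deepeval` for extracting and converting tool calls from agent outputs\n",
+        "- `observe` and `update_current_span` from `deepeval.tracing`, and `LLMTestCase` from `deepeval.test_case`, for passing trace data to DeepEval metrics that require tracing"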
+      ],
+      "id": "a124857e"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.models import Prompt\n",
+        "from validmind.scorers.llm.deepeval import extract_tool_calls_from_agent_output, _convert_to_tool_call_list\n",
+        "from deepeval.tracing import observe, update_current_span\n",
+        "from deepeval.test_case import LLMTestCase"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "9aeb8969"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3_2__'></a>\n",
+        "\n",
+        "#### Create agent wrapper function\n",
+        "\n",
+        "We'll then create a wrapper function that:\n",
+        "\n",
+        "- Accepts input in ValidMind's expected format (with `input` and `session_id` fields)\n",
+        "- Invokes the banking agent with the proper state initialization\n",
+        "- Captures tool outputs and tool calls for evaluation\n",
+        "- Returns a standardized response format that includes the prediction, full output, tool messages, and tool call information\n",
+        "- Handles errors gracefully with fallback responses"
+      ],
+      "id": "ed72903f"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@observe(type=\"agent\")\n",
+        "def banking_agent_fn(input):\n",
+        "    \"\"\"\n",
+        "    Invoke the banking agent with the given input.\n",
+        "    \"\"\"\n",
+        "    try:\n",
+        "        # Initial state for banking agent\n",
+        "        initial_state = {\n",
+        "            \"user_input\": input[\"input\"],\n",
+        "            \"messages\": [HumanMessage(content=input[\"input\"])],\n",
+        "            \"session_id\": input[\"session_id\"],\n",
+        "            \"context\": {}\n",
+        "        }\n",
+        "        session_config = {\"configurable\": {\"thread_id\": input[\"session_id\"]}}\n",
+        "        result = banking_agent.invoke(initial_state, config=session_config)\n",
+        "\n",
+        "        from utils import capture_tool_output_messages\n",
+        "\n",
+        "        # Capture all tool outputs and metadata\n",
+        "        captured_data = capture_tool_output_messages(result)\n",
+        "    \n",
+        "        # Access specific tool outputs, this will be used for RAGAS tests\n",
+        "        tool_message = \"\"\n",
+        "        for output in captured_data[\"tool_outputs\"]:\n",
+        "            tool_message += output['content']\n",
+        "        \n",
+        "        tool_calls_found = []\n",
+        "        messages = result['messages']\n",
+        "        for message in messages:\n",
+        "            if hasattr(message, 'tool_calls') and message.tool_calls:\n",
+        "                for tool_call in message.tool_calls:\n",
+        "                    # Handle both dictionary and object formats\n",
+        "                    if isinstance(tool_call, dict):\n",
+        "                        tool_calls_found.append(tool_call['name'])\n",
+        "                    else:\n",
+        "                        # ToolCall object - use attribute access\n",
+        "                        tool_calls_found.append(tool_call.name)\n",
+        "\n",
+        "        prediction_text = result['messages'][-1].content[0]['text']\n",
+        "        tools_called_value = _convert_to_tool_call_list(extract_tool_calls_from_agent_output(result))\n",
+        "        expected_tools_value = _convert_to_tool_call_list(input.get(\"expected_tools\", []))\n",
+        "\n",
+        "        # Feed trace data for DeepEval metrics (e.g. PlanQuality) that require tracing\n",
+        "        update_current_span(\n",
+        "            test_case=LLMTestCase(\n",
+        "                input=input[\"input\"],\n",
+        "                actual_output=prediction_text,\n",
+        "                tools_called=tools_called_value,\n",
+        "                expected_tools=expected_tools_value\n",
+        "            )\n",
+        "        )\n",
+        "\n",
+        "        return {\n",
+        "            \"prediction\": prediction_text,\n",
+        "            \"output\": result,\n",
+        "            \"tool_messages\": [tool_message],\n",
+        "            # \"tool_calls\": tool_calls_found,\n",
+        "            \"tool_called\": tools_called_value\n",
+        "        }\n",
+        "    except Exception as e:\n",
+        "        # Return a fallback response if the agent fails\n",
+        "        error_message = f\"\"\"I apologize, but I encountered an error while processing your banking request: {str(e)}.\n",
+        "        Please try rephrasing your question or contact support if the issue persists.\"\"\"\n",
+        "        return {\n",
+        "            \"prediction\": error_message, \n",
+        "            \"output\": {\n",
+        "                \"messages\": [HumanMessage(content=input[\"input\"]), SystemMessage(content=error_message)],\n",
+        "                \"error\": str(e)\n",
+        "            }\n",
+        "        }"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0e4d5a82"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3_3__'></a>\n",
+        "\n",
+        "#### Initialize the ValidMind model\n",
+        "\n",
+        "We'll also need to register the banking agent as a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model) which:\n",
+        "\n",
+        "- Associates the wrapper function with the model for prediction\n",
+        "- Stores the system prompt template for documentation\n",
+        "- Provides a unique `input_id` for tracking and identification\n",
+        "- Enables the agent to be used with ValidMind's testing and documentation features"
+      ],
+      "id": "fda87401"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Initialize the agent as a model\n",
+        "vm_banking_model = vm.init_model(\n",
+        "    input_id=\"banking_agent_model\",\n",
+        "    predict_fn=banking_agent_fn,\n",
+        "    prompt=Prompt(template=system_context)\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "60a2ce7a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3_4__'></a>\n",
+        "\n",
+        "#### Store the agent reference\n",
+        "\n",
+        "We'll also store a reference to the original banking agent object in the ValidMind model. This allows us to access the full agent functionality directly if needed, while still maintaining the wrapper function interface for ValidMind's testing framework."
+      ],
+      "id": "949bcf53"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Add the banking agent to the vm model\n",
+        "vm_banking_model.model = banking_agent"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "2c653471"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3_5__'></a>\n",
+        "\n",
+        "#### Verify integration\n",
+        "\n",
+        "Let's confirm that the banking agent has been successfully integrated with ValidMind:"
+      ],
+      "id": "d8d0c1c1"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "print(\"Banking Agent Successfully Integrated with ValidMind!\")\n",
+        "print(f\"Model ID: {vm_banking_model.input_id}\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "8e101b0f"
+    },
+    {
+      "cell_type": "markdown",
+      "id": "2a5f874e",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_4__'></a>\n",
+        "\n",
+        "### Validate the system prompt\n",
+        "\n",
+        "Let's get an initial sense of how well our defined system prompt meets a few best practices for prompt engineering by running a few tests — we'll run evaluation tests later on our agent's performance.\n",
+        "\n",
+        "You run individual tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module. Passing in our agentic model as an input, the tests below rate the prompt on a scale of 1-10 against the following criteria:\n",
+        "\n",
+        "- **prompt_validation.Clarity** — How clearly the prompt states the task.\n",
+        "- **prompt_validation.Conciseness** — How succinctly the prompt states the task.\n",
+        "- **prompt_validation.Delimitation** — When using complex prompts containing examples, contextual information, or other elements, is the prompt formatted in such a way that each element is clearly separated?\n",
+        "- **prompt_validation.NegativeInstruction** — Whether the prompt contains negative instructions.\n",
+        "- **prompt_validation.Specificity** — How specifically the prompt defines the task.\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.prompt_validation.Clarity\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_banking_model,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "f52dceb1"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.prompt_validation.Conciseness\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_banking_model,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "70d52333"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.prompt_validation.Delimitation\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_banking_model,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "5aa89976"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.prompt_validation.NegativeInstruction\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_banking_model,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "8630197e"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.prompt_validation.Specificity\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_banking_model,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "bba99915"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Initializing the ValidMind dataset\n",
+        "\n",
+        "After validating our system prompt, let's import our sample dataset ([banking_test_dataset.py](banking_test_dataset.py)), which we'll use in the next section to evaluate our agent's performance across different banking scenarios:"
+      ],
+      "id": "51d61141"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from banking_test_dataset import banking_test_dataset"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0c70ca2c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "The next step is to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
+        "\n",
+        "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
+        "- **`text_column`** — The name of the column containing the text input data.\n",
+        "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
+      ],
+      "id": "442ab66d"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_test_dataset = vm.init_dataset(\n",
+        "    input_id=\"banking_test_dataset\",\n",
+        "    dataset=banking_test_dataset,\n",
+        "    text_column=\"input\",\n",
+        "    target_column=\"possible_outputs\",\n",
+        ")\n",
+        "\n",
+        "print(\"Banking Test Dataset Initialized in ValidMind!\")\n",
+        "print(f\"Dataset ID: {vm_test_dataset.input_id}\")\n",
+        "print(f\"Dataset columns: {vm_test_dataset._df.columns}\")\n",
+        "vm_test_dataset._df"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "a7e9d158"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Assign predictions\n",
+        "\n",
+        "Now that both the model object and the dataset have been registered, we'll assign predictions to capture the banking agent's responses for evaluation:\n",
+        "\n",
+        "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
+        "- This method links the banking agent's prediction values to our `vm_test_dataset` dataset.\n",
+        "\n",
+        "If no prediction values are passed, the method will compute predictions automatically:"
+      ],
+      "id": "7b01021c"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_test_dataset.assign_predictions(vm_banking_model)\n",
+        "\n",
+        "print(\"Banking Agent Predictions Generated Successfully!\")\n",
+        "print(f\"Predictions assigned to {len(vm_test_dataset._df)} test cases\")\n",
+        "vm_test_dataset._df.head()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "1d462663"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Running accuracy tests\n",
+        "\n",
+        "Using [`@vm.test`](https://docs.validmind.ai/validmind/validmind.html#test), let's implement some reusable custom *inline tests* to assess the accuracy of our banking agent:\n",
+        "\n",
+        "- An inline test refers to a test written and executed within the same environment as the code being tested — in this case, right in this Jupyter Notebook — without requiring a separate test file or framework.\n",
+        "- You'll note that the custom test functions are just regular Python functions that can include and require any Python library as you see fit."
+      ],
+      "id": "4e56f556"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Response accuracy test\n",
+        "\n",
+        "We'll create a custom test that evaluates the banking agent's ability to provide accurate responses by:\n",
+        "\n",
+        "- Testing against a dataset of predefined banking questions and expected answers.\n",
+        "- Checking if responses contain expected keywords and banking terminology.\n",
+        "- Providing detailed test results including pass/fail status.\n",
+        "- Helping identify any gaps in the agent's banking knowledge or response quality."
+      ],
+      "id": "1bce9258"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "@vm.test(\"my_custom_tests.banking_accuracy_test\")\n",
+        "def banking_accuracy_test(model, dataset, list_of_columns):\n",
+        "    \"\"\"\n",
+        "    The Banking Accuracy Test evaluates whether the agent’s responses include \n",
+        "    critical domain-specific keywords and phrases that indicate accurate, compliant,\n",
+        "    and contextually appropriate banking information. This test ensures that the agent\n",
+        "    provides responses containing the expected banking terminology, risk classifications,\n",
+        "    account details, or other domain-relevant information required for regulatory compliance,\n",
+        "    customer safety, and operational accuracy.\n",
+        "    \"\"\"\n",
+        "    df = dataset._df\n",
+        "    \n",
+        "    # Pre-compute responses for all tests\n",
+        "    y_true = dataset.y.tolist()\n",
+        "    y_pred = dataset.y_pred(model).tolist()\n",
+        "\n",
+        "    # Vectorized test results\n",
+        "    test_results = []\n",
+        "    for response, keywords in zip(y_pred, y_true):\n",
+        "        # Convert keywords to list if not already a list\n",
+        "        if not isinstance(keywords, list):\n",
+        "            keywords = [keywords]\n",
+        "        test_results.append(any(str(keyword).lower() in str(response).lower() for keyword in keywords))\n",
+        "        \n",
+        "    results = pd.DataFrame()\n",
+        "    column_names = [col + \"_details\" for col in list_of_columns]\n",
+        "    results[column_names] = df[list_of_columns]\n",
+        "    results[\"actual\"] = y_pred\n",
+        "    results[\"expected\"] = y_true\n",
+        "    results[\"passed\"] = test_results\n",
+        "    results[\"error\"] = None if test_results else f'Response did not contain any expected keywords: {y_true}'\n",
+        "    \n",
+        "    return results"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "90232066"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now that we've defined our custom response accuracy test, we can run it with the same `run_test()` function we used earlier to validate the system prompt, this time passing our sample dataset and agentic model as inputs, and then log the test results to the ValidMind Platform with the [`log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#log):"
+      ],
+      "id": "2a7f71f8"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = vm.tests.run_test(\n",
+        "    \"my_custom_tests.banking_accuracy_test\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_dataset,\n",
+        "        \"model\": vm_banking_model\n",
+        "    },\n",
+        "    params={\n",
+        "        \"list_of_columns\": [\"input\"]\n",
+        "    }\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e68884d5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's review the first five rows of the test dataset to see how well the banking agent performed. Each column in the output serves a specific purpose in evaluating agent performance:\n",
+        "\n",
+        "| Column header | Description | Importance |\n",
+        "|--------------|-------------|------------|\n",
+        "| **`input`** | Original user query or request | Essential for understanding the context of each test case and tracing which inputs led to specific agent behaviors. |\n",
+        "| **`expected_tools`** | Banking tools that should be invoked for this request | Enables validation of correct tool selection, which is critical for agentic AI systems where choosing the right tool is a key success metric. |\n",
+        "| **`expected_output`** | Expected output or keywords that should appear in the response | Defines the success criteria for each test case, enabling objective evaluation of whether the agent produced the correct result. |\n",
+        "| **`session_id`** | Unique identifier for each test session | Allows tracking and correlation of related test runs, debugging specific sessions, and maintaining audit trails. |\n",
+        "| **`category`** | Classification of the request type | Helps organize test results by domain and identify performance patterns across different banking use cases. |\n",
+        "| **`banking_agent_model_output`** | Complete agent response including all messages and reasoning | Allows you to examine the full output to assess response quality, completeness, and correctness beyond just keyword matching. |\n",
+        "| **`banking_agent_model_tool_messages`** | Messages exchanged with the banking tools | Critical for understanding how the agent interacted with tools, what parameters were passed, and what tool outputs were received. |\n",
+        "| **`banking_agent_model_tool_called`** | Specific tool that was invoked | Enables validation that the agent selected the correct tool for each request, which is fundamental to agentic AI validation. |\n",
+        "| **`possible_outputs`** | Alternative valid outputs or keywords that could appear in the response | Provides flexibility in evaluation by accounting for multiple acceptable response formats or variations. |"
+      ],
+      "id": "94a717e7"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_test_dataset.df.head(5)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "78f7edb1"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Tool selection accuracy test\n",
+        "\n",
+        "We'll also create a custom test that evaluates the banking agent's ability to select the correct tools for different requests by:\n",
+        "\n",
+        "- Testing against a dataset of predefined banking queries with expected tool selections.\n",
+        "- Comparing the tools actually invoked by the agent against the expected tools for each request.\n",
+        "- Providing quantitative accuracy scores that measure the proportion of expected tools correctly selected.\n",
+        "- Helping identify gaps in the agent's understanding of user needs and tool selection logic."
+      ],
+      "id": "1cb3e8bd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "First, we'll define a helper function that extracts tool calls from the agent's messages and compares them against the expected tools. This function handles different tool call formats (dictionary or object) and calculates accuracy scores:"
+      ],
+      "id": "69263d62"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def validate_tool_calls_simple(messages, expected_tools):\n",
+        "    \"\"\"Simple validation of tool calls without RAGAS dependency issues.\"\"\"\n",
+        "    \n",
+        "    tool_calls_found = []\n",
+        "    \n",
+        "    for message in messages:\n",
+        "        if hasattr(message, 'tool_calls') and message.tool_calls:\n",
+        "            for tool_call in message.tool_calls:\n",
+        "                # Handle both dictionary and object formats\n",
+        "                if isinstance(tool_call, dict):\n",
+        "                    tool_calls_found.append(tool_call['name'])\n",
+        "                else:\n",
+        "                    # ToolCall object - use attribute access\n",
+        "                    tool_calls_found.append(tool_call.name)\n",
+        "    \n",
+        "    # Check if expected tools were called\n",
+        "    accuracy = 0.0\n",
+        "    matches = 0\n",
+        "    if expected_tools:\n",
+        "        matches = sum(1 for tool in expected_tools if tool in tool_calls_found)\n",
+        "        accuracy = matches / len(expected_tools)\n",
+        "    \n",
+        "    return {\n",
+        "        'expected_tools': expected_tools,\n",
+        "        'found_tools': tool_calls_found,\n",
+        "        'matches': matches,\n",
+        "        'total_expected': len(expected_tools) if expected_tools else 0,\n",
+        "        'accuracy': accuracy,\n",
+        "    }"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e68798be"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now we'll define the main test function that uses the helper function to evaluate tool selection accuracy across all test cases in the dataset:"
+      ],
+      "id": "8f494fd3"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.BankingToolCallAccuracy\")\n",
+        "def BankingToolCallAccuracy(dataset, agent_output_column, expected_tools_column):\n",
+        "    \"\"\"\n",
+        "    Evaluates the tool selection accuracy of a LangGraph-powered banking agent.\n",
+        "\n",
+        "    This test measures whether the agent correctly identifies and invokes the required banking tools\n",
+        "    for each user query scenario.\n",
+        "    For each case, the outputs generated by the agent (including its tool calls) are compared against an\n",
+        "    expected set of tools. The test considers both coverage and exactness: it computes the proportion of\n",
+        "    expected tools correctly called by the agent for each instance.\n",
+        "\n",
+        "    Parameters:\n",
+        "        dataset (VMDataset): The dataset containing user queries, agent outputs, and ground-truth tool expectations.\n",
+        "        agent_output_column (str): Dataset column name containing agent outputs (should include tool call details in 'messages').\n",
+        "        expected_tools_column (str): Dataset column specifying the true expected tools (as lists).\n",
+        "\n",
+        "    Returns:\n",
+        "        List[dict]: Per-row dictionaries with details: expected tools, found tools, match count, total expected, and accuracy score.\n",
+        "\n",
+        "    Purpose:\n",
+        "        Provides diagnostic evidence of the banking agent's core reasoning ability—specifically, its capacity to\n",
+        "        interpret user needs and select the correct banking actions. Useful for diagnosing gaps in tool coverage,\n",
+        "        misclassifications, or breakdowns in agent logic.\n",
+        "\n",
+        "    Interpretation:\n",
+        "        - An accuracy of 1.0 signals perfect tool selection for that example.\n",
+        "        - Lower scores may indicate partial or complete failures to invoke required tools.\n",
+        "        - Review 'found_tools' vs. 'expected_tools' to understand the source of discrepancies.\n",
+        "\n",
+        "    Strengths:\n",
+        "        - Directly tests a core capability of compositional tool-use agents.\n",
+        "        - Framework-agnostic; robust to tool call output format (object or dict).\n",
+        "        - Supports batch validation and result logging for systematic documentation.\n",
+        "\n",
+        "    Limitations:\n",
+        "        - Does not penalize extra, unnecessary tool calls.\n",
+        "        - Does not assess result quality—only correct invocation.\n",
+        "\n",
+        "    \"\"\"\n",
+        "    df = dataset._df\n",
+        "    \n",
+        "    results = []\n",
+        "    for i, row in df.iterrows():\n",
+        "        result = validate_tool_calls_simple(row[agent_output_column]['messages'], row[expected_tools_column])\n",
+        "        results.append(result)\n",
+        "         \n",
+        "    return results"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "604d7313"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Finally, we can call our function with `run_test()` and log the test results to the ValidMind Platform:"
+      ],
+      "id": "57ab606b"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = vm.tests.run_test(\n",
+        "    \"my_custom_tests.BankingToolCallAccuracy\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_dataset,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"agent_output_column\": \"banking_agent_model_output\",\n",
+        "        \"expected_tools_column\": \"expected_tools\"\n",
+        "    }\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "dd14115e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Assigning AI evaluation metric scores\n",
+        "\n",
+        "*AI agent evaluation metrics* are specialized measurements designed to assess how well autonomous LLM-based agents reason, plan, select and execute tools, and ultimately complete user tasks by analyzing the *full execution trace* — including reasoning steps, tool calls, intermediate decisions, and outcomes, rather than just single input–output pairs. These metrics are essential because agent failures often occur in ways traditional LLM metrics miss — for example, choosing the right tool with wrong arguments, creating a good plan but not following it, or completing a task inefficiently.\n",
+        "\n",
+        "In this section, we'll evaluate our banking agent's outputs and add scoring to our sample dataset against metrics defined in [DeepEval’s AI agent evaluation framework](https://deepeval.com/guides/guides-ai-agent-evaluation-metrics) which breaks down AI agent evaluation into three layers with corresponding subcategories: **reasoning**, **action**, and **execution**.\n",
+        "\n",
+        "Together, these three layers of metrics enable granular diagnosis of agent behavior, help pinpoint where failures occur (reasoning, action, or execution), and support both development benchmarking and production monitoring."
+      ],
+      "id": "be8d5270"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Identify relevant DeepEval scorers\n",
+        "\n",
+        "*Scorers* are evaluation metrics that analyze model outputs and store their results in the dataset:\n",
+        "\n",
+        "- Each scorer adds a new column to the dataset with format: `{scorer_name}_{metric_name}`\n",
+        "- The column contains the numeric score (typically `0`-`1`) for each example\n",
+        "- Multiple scorers can be run on the same dataset, each adding their own column\n",
+        "- Scores are persisted in the dataset for later analysis and visualization\n",
+        "- Common scorer patterns include:\n",
+        "  - Model performance metrics (accuracy, F1, etc.)\n",
+        "  - Output quality metrics (relevance, faithfulness)\n",
+        "  - Task-specific metrics (completion, correctness)\n",
+        "\n",
+        "Use `list_scorers()` from [`validmind.scorers`](https://docs.validmind.ai/validmind/validmind/tests.html#scorer) to discover all available scoring methods and their IDs that can be used with `assign_scores()`. We'll filter these results to return only DeepEval scorers for our desired three metrics in a formatted table with descriptions:"
+      ],
+      "id": "25828bef"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load all DeepEval scorers\n",
+        "llm_scorers_dict = vm.tests.load._load_tests([s for s in vm.scorer.list_scorers() if \"deepeval\" in s.lower()])\n",
+        "\n",
+        "# Categorize scorers by metric layer\n",
+        "reasoning_scorers = {}\n",
+        "action_scorers = {}\n",
+        "execution_scorers = {}\n",
+        "\n",
+        "for scorer_id, scorer_func in llm_scorers_dict.items():\n",
+        "    tags = getattr(scorer_func, \"__tags__\", [])\n",
+        "    scorer_name = scorer_id.split(\".\")[-1]\n",
+        "\n",
+        "    if \"reasoning_layer\" in tags:\n",
+        "        reasoning_scorers[scorer_id] = scorer_func\n",
+        "    elif \"action_layer\" in tags:\n",
+        "        action_scorers[scorer_id] = scorer_func\n",
+        "    elif \"TaskCompletion\" in scorer_name:\n",
+        "        execution_scorers[scorer_id] = scorer_func\n",
+        "\n",
+        "# Display scorers by category\n",
+        "print(\"=\" * 80)\n",
+        "print(\"REASONING LAYER\")\n",
+        "print(\"=\" * 80)\n",
+        "if reasoning_scorers:\n",
+        "    reasoning_df = vm.tests.load._pretty_list_tests(reasoning_scorers, truncate=True)\n",
+        "    display(reasoning_df)\n",
+        "else:\n",
+        "    print(\"No reasoning layer scorers found.\")\n",
+        "\n",
+        "print(\"\\n\" + \"=\" * 80)\n",
+        "print(\"ACTION LAYER\")\n",
+        "print(\"=\" * 80)\n",
+        "if action_scorers:\n",
+        "    action_df = vm.tests.load._pretty_list_tests(action_scorers, truncate=True)\n",
+        "    display(action_df)\n",
+        "else:\n",
+        "    print(\"No action layer scorers found.\")\n",
+        "\n",
+        "print(\"\\n\" + \"=\" * 80)\n",
+        "print(\"EXECUTION LAYER\")\n",
+        "print(\"=\" * 80)\n",
+        "if execution_scorers:\n",
+        "    execution_df = vm.tests.load._pretty_list_tests(execution_scorers, truncate=True)\n",
+        "    display(execution_df)\n",
+        "else:\n",
+        "    print(\"No execution layer scorers found.\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "730c70ec"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Assign reasoning scores\n",
+        "\n",
+        "*Reasoning* evaluates planning and strategy generation:\n",
+        "\n",
+        "- **Plan quality** – How logical, complete, and efficient the agent’s plan is.\n",
+        "- **Plan adherence** – Whether the agent follows its own plan during execution."
+      ],
+      "id": "e5fb739b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2_1__'></a>\n",
+        "\n",
+        "#### Plan quality score\n",
+        "\n",
+        "Let's measure how well our banking agent generates a plan before acting. A high score means the plan is logical, complete, and efficient."
+      ],
+      "id": "fde94d01"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_test_dataset.assign_scores(\n",
+        "    metrics = \"validmind.scorers.llm.deepeval.PlanQuality\",\n",
+        "    model = vm_banking_model,\n",
+        "    input_column = \"input\",\n",
+        ")\n",
+        "vm_test_dataset._df[['banking_agent_model_PlanQuality_score','banking_agent_model_PlanQuality_reason']]"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "52f362ba"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2_2__'></a>\n",
+        "\n",
+        "#### Plan adherence score\n",
+        "\n",
+        "Let's check whether our banking agent follows the plan it created. Deviations lower this score and indicate gaps between reasoning and execution."
+      ],
+      "id": "d631fd12"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_test_dataset.assign_scores(\n",
+        "    metrics = \"validmind.scorers.llm.deepeval.PlanAdherence\",\n",
+        "    input_column = \"input\",\n",
+        "    model = vm_banking_model,\n",
+        ")\n",
+        "vm_test_dataset._df[['banking_agent_model_PlanAdherence_score','banking_agent_model_PlanAdherence_reason']]"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "4124a7c2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_3__'></a>\n",
+        "\n",
+        "### Assign action scores\n",
+        "\n",
+        "*Action* assesses tool usage and argument generation:\n",
+        "\n",
+        "- **Tool correctness** – Whether the agent selects and calls the right tools.\n",
+        "- **Argument correctness** – Whether the agent generates correct tool arguments."
+      ],
+      "id": "82e5e6f1"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_3_1__'></a>\n",
+        "\n",
+        "#### Tool correctness score\n",
+        "\n",
+        "Let's evaluate if our banking agent selects the appropriate tool for the task. Choosing the wrong tool reduces performance even if reasoning was correct."
+      ],
+      "id": "e641c9f2"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_test_dataset.assign_scores(\n",
+        "    metrics = \"validmind.scorers.llm.deepeval.ToolCorrectness\",\n",
+        "    input_column = \"input\",\n",
+        "    model = vm_banking_model,\n",
+        "    expected_tools_called_column = \"expected_tools\",\n",
+        "    actual_tools_called_column = \"banking_agent_model_tool_called\",\n",
+        ")\n",
+        "vm_test_dataset._df[['banking_agent_model_ToolCorrectness_score','banking_agent_model_ToolCorrectness_reason']]"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "8d2e8a25"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_3_2__'></a>\n",
+        "\n",
+        "#### Argument correctness score\n",
+        "\n",
+        "Let's assess whether our banking agent provides correct inputs or arguments to the selected tool. Incorrect arguments can lead to failed or unexpected results."
+      ],
+      "id": "dd758ba5"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_test_dataset.assign_scores(\n",
+        "    metrics = \"validmind.scorers.llm.deepeval.ArgumentCorrectness\",\n",
+        "    input_column = \"input\",\n",
+        "    model = vm_banking_model,\n",
+        "    actual_tools_called_column = \"banking_agent_model_tool_called\",\n",
+        ")\n",
+        "vm_test_dataset._df[['banking_agent_model_ArgumentCorrectness_score','banking_agent_model_ArgumentCorrectness_reason']]"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "04f90489"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4__'></a>\n",
+        "\n",
+        "### Assign execution score\n",
+        "\n",
+        "*Execution* measures end-to-end performance:\n",
+        "\n",
+        "- **Task completion** – Whether the agent successfully completes the intended task."
+      ],
+      "id": "1aeec2f5"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4_1__'></a>\n",
+        "\n",
+        "#### Task completion score\n",
+        "\n",
+        "Let's evaluate whether our banking agent successfully completes the requested tasks. Incomplete task execution can lead to user dissatisfaction and failed banking operations."
+      ],
+      "id": "eb9ab8de"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_test_dataset.assign_scores(\n",
+        "    metrics = \"validmind.scorers.llm.deepeval.TaskCompletion\",\n",
+        "    input_column = \"input\",\n",
+        "    model = vm_banking_model,\n",
+        "    actual_tools_called_column = \"banking_agent_model_tool_called\",\n",
+        ")\n",
+        "vm_test_dataset._df[['banking_agent_model_TaskCompletion_score','banking_agent_model_TaskCompletion_reason']]"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "05024f1f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "As you recall from the beginning of this section, when we run scorers through `assign_scores()`, the return values are automatically processed and added as new columns with the format `{scorer_name}_{metric_name}`. Note that the task completion scorer has added a new column, `banking_agent_model_TaskCompletion_score`, to our dataset.\n",
+        "\n",
+        "We'll use this column to visualize the distribution of task completion scores across our test cases through the [BoxPlot test](https://docs.validmind.ai/validmind/validmind/tests/plots/BoxPlot.html#boxplot):"
+      ],
+      "id": "b577c282"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.plots.BoxPlot\",\n",
+        "    inputs={\"dataset\": vm_test_dataset},\n",
+        "    params={\n",
+        "        \"columns\": \"banking_agent_model_TaskCompletion_score\",\n",
+        "        \"title\": \"Distribution of Task Completion Scores\",\n",
+        "        \"ylabel\": \"Score\",\n",
+        "        \"figsize\": (8, 6)\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "7f6d08ca"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Running RAGAS tests\n",
+        "\n",
+        "Next, let's run some out-of-the-box *Retrieval-Augmented Generation Assessment* (RAGAS) tests available in the ValidMind Library. RAGAS provides specialized metrics for evaluating retrieval-augmented generation systems and conversational AI agents. These metrics analyze different aspects of agent performance by assessing how well systems integrate retrieved information with generated responses.\n",
+        "\n",
+        "Our banking agent uses tools to retrieve information and generates responses based on that context, making it similar to a RAG system. RAGAS metrics help evaluate the quality of this integration by analyzing the relationship between retrieved tool outputs, user queries, and generated responses.\n",
+        "\n",
+        "These tests provide insights into how well our banking agent integrates tool usage with conversational abilities, ensuring it provides accurate, relevant, and helpful responses to banking users while maintaining fidelity to retrieved information."
+      ],
+      "id": "30d9ec62"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Identify relevant RAGAS tests\n",
+        "\n",
+        "Let's explore some of ValidMind's available tests. Using ValidMind’s repository of tests streamlines your development testing, and helps you ensure that your records are being documented and evaluated appropriately.\n",
+        "\n",
+        "You can pass `task` and `tags` as parameters to the [`vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to filter the tests based on the tags and task types:\n",
+        "\n",
+        "- **`task`** represents the kind of modeling task associated with a test. Here we'll focus on `text_qa` tasks.\n",
+        "- **`tags`** are free-form descriptions providing more details about the test, for example, what category the test falls into. Here we'll focus on the `ragas` tag.\n",
+        "\n",
+        "We'll then run three of these tests returned as examples below."
+      ],
+      "id": "8288f6c3"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests(task=\"text_qa\", tags=[\"ragas\"])"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0701f5a9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_1_1__'></a>\n",
+        "\n",
+        "#### Faithfulness\n",
+        "\n",
+        "Let's evaluate whether the banking agent's responses accurately reflect the information retrieved from tools. Unfaithful responses can misreport credit analysis, financial calculations, and compliance results—undermining user trust in the banking agent."
+      ],
+      "id": "2ce24ba0"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.model_validation.ragas.Faithfulness\",\n",
+        "    inputs={\"dataset\": vm_test_dataset},\n",
+        "    param_grid={\n",
+        "        \"user_input_column\": [\"input\"],\n",
+        "        \"response_column\": [\"banking_agent_model_prediction\"],\n",
+        "        \"retrieved_contexts_column\": [\"banking_agent_model_tool_messages\"],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "92044533"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_1_2__'></a>\n",
+        "\n",
+        "#### Response Relevancy\n",
+        "\n",
+        "Let's evaluate whether the banking agent's answers address the user's original question or request. Irrelevant or off-topic responses can frustrate users and fail to deliver the banking information they need."
+      ],
+      "id": "4d1fcfcd"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.model_validation.ragas.ResponseRelevancy\",\n",
+        "    inputs={\"dataset\": vm_test_dataset},\n",
+        "    params={\n",
+        "        \"user_input_column\": \"input\",\n",
+        "        \"response_column\": \"banking_agent_model_prediction\",\n",
+        "        \"retrieved_contexts_column\": \"banking_agent_model_tool_messages\",\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "d7483bc3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7_1_3__'></a>\n",
+        "\n",
+        "#### Context Recall\n",
+        "\n",
+        "Let's evaluate how well the banking agent uses the information retrieved from tools when generating its responses. Poor context recall can lead to incomplete or underinformed answers even when the right tools were selected."
+      ],
+      "id": "38c1dfb5"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.model_validation.ragas.ContextRecall\",\n",
+        "    inputs={\"dataset\": vm_test_dataset},\n",
+        "    param_grid={\n",
+        "        \"user_input_column\": [\"input\"],\n",
+        "        \"retrieved_contexts_column\": [\"banking_agent_model_tool_messages\"],\n",
+        "        \"reference_column\": [\"banking_agent_model_prediction\"],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e5dc00ce"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Running safety tests\n",
+        "\n",
+        "Finally, let's run some out-of-the-box *safety* tests available in the ValidMind Library. Safety tests provide specialized metrics for evaluating whether AI agents operate reliably and securely. These metrics analyze different aspects of agent behavior by assessing adherence to safety guidelines, consistency of outputs, and resistance to harmful or inappropriate requests.\n",
+        "\n",
+        "Our banking agent handles sensitive financial information and user requests, making safety and reliability essential. Safety tests help evaluate whether the agent maintains appropriate boundaries, responds consistently and correctly to inputs, and avoids generating harmful, biased, or unprofessional content.\n",
+        "\n",
+        "These tests provide insights into how well our banking agent upholds standards of fairness and professionalism, ensuring it operates reliably and securely for banking users."
+      ],
+      "id": "95e1e16a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8_1_1__'></a>\n",
+        "\n",
+        "#### AspectCritic\n",
+        "\n",
+        "Let's evaluate our banking agent's responses across multiple quality dimensions — conciseness, coherence, correctness, harmfulness, and maliciousness. Weak performance on these dimensions can degrade user experience, fall short of professional banking standards, or introduce safety risks. \n",
+        "\n",
+        "We'll use the `AspectCritic` test we identified earlier:"
+      ],
+      "id": "e0972afa"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.model_validation.ragas.AspectCritic\",\n",
+        "    inputs={\"dataset\": vm_test_dataset},\n",
+        "    param_grid={\n",
+        "        \"user_input_column\": [\"input\"],\n",
+        "        \"response_column\": [\"banking_agent_model_prediction\"],\n",
+        "        \"retrieved_contexts_column\": [\"banking_agent_model_tool_messages\"],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "148daa2b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8_1_2__'></a>\n",
+        "\n",
+        "#### Bias\n",
+        "\n",
+        "Let's evaluate whether our banking agent's prompts contain unintended biases that could affect banking decisions. Biased prompts can lead to unfair or discriminatory outcomes — undermining customer trust and exposing the institution to compliance risk.\n",
+        "\n",
+        "We'll first use `list_tests()` again to filter for tests relating to `prompt_validation`:"
+      ],
+      "id": "16f29c8d"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests(filter=\"prompt_validation\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "74eba86c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "And then run the identified `Bias` test:"
+      ],
+      "id": "e9413803"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.prompt_validation.Bias\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_banking_model,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "062cf8e7"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your documentation."
+      ],
+      "id": "8f3f2dbe"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "    What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "3. Click into any section related to the tests we ran in this notebook, for example: **4.3. Prompt Evaluation** to review the results of the tests we logged."
+      ],
+      "id": "8716165d"
+    },
+    {
+      "cell_type": "markdown",
+      "id": "7c4a78ce",
+      "metadata": {},
+      "source": [
+        "<a id='toc9_2__'></a>\n",
+        "\n",
+        "### Customize the banking agent for your use case\n",
+        "\n",
+        "You've now built an agentic AI system designed for banking use cases that supports compliance with supervisory guidance such as SR 26-2 and SS1/23. While SR 26-2 explicitly excludes generative and agentic AI from its scope, underlying principles — materiality, ongoing monitoring, and effective challenge — still apply to governance of these systems. The example covers credit and fraud risk assessment for both retail and commercial banking. Extend this example agent to real-world banking scenarios and production deployment by:\n",
+        "\n",
+        "- Adapting the banking tools to your organization's specific requirements\n",
+        "- Adding more banking scenarios and edge cases to your test set\n",
+        "- Connecting the agent to your banking systems and databases\n",
+        "- Implementing additional banking-specific tools and workflows"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9_3__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "Learn more about the ValidMind Library tools we used in this notebook:\n",
+        "\n",
+        "- [Custom prompts](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/customize_test_result_descriptions.html)\n",
+        "- [Custom tests](https://docs.validmind.ai/notebooks/how_to/tests/custom_tests/implement_custom_tests.html)\n",
+        "- [ValidMind scorers](https://docs.validmind.ai/notebooks/how_to/scoring/assign_scores_complete_tutorial.html)\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ],
+      "id": "7f9385d3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc10__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ],
+      "id": "fdd5c0db"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "9733adff"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ],
+      "id": "829429fd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade package for changes to be applied."
+      ],
+      "id": "55339760"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-b9e82bcf4e364c4f8e5ae4bb0e4b2865"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "validmind-1QuffXMV-py3.11",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.11.9"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
 }
diff --git a/site/notebooks/use_cases/capital_markets/capital_markets_template.yaml b/site/notebooks/use_cases/capital_markets/capital_markets_template.yaml
index 9cb561dc27..1ae9f6e4fa 100644
--- a/site/notebooks/use_cases/capital_markets/capital_markets_template.yaml
+++ b/site/notebooks/use_cases/capital_markets/capital_markets_template.yaml
@@ -40,7 +40,7 @@
           with business goals.
         - Include specific use cases, outputs, and highlight regulatory
           expectations to demonstrate compliance.
-        - Specify compliance requirements, such as IFRS, Basel III or SR11-7, as
+        - Specify compliance requirements, such as IFRS, Basel III or SR 26-2, as
           applicable.
     - id: products_and_risks
       title: Products and Risks
diff --git a/site/notebooks/use_cases/capital_markets/quickstart_option_pricing_models.ipynb b/site/notebooks/use_cases/capital_markets/quickstart_option_pricing_models.ipynb
index f372b04c64..4b4ae386c0 100644
--- a/site/notebooks/use_cases/capital_markets/quickstart_option_pricing_models.ipynb
+++ b/site/notebooks/use_cases/capital_markets/quickstart_option_pricing_models.ipynb
@@ -1,2103 +1,2115 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "87056cee",
-   "metadata": {},
-   "source": [
-    "# Quickstart for knockout option pricing model documentation\n",
-    "\n",
-    "Welcome! Let's get you started with the basic process of documenting models with ValidMind.\n",
-    "\n",
-    "A knockout option is a barrier option that ceases to exist if the underlying asset hits a predetermined price, known as the \"barrier.\" This barrier level, set above or below the current market price, determines whether the option will \"knock out\" before its expiration date. There are two types: \"up-and-out\" and \"down-and-out.\" In an up-and-out knockout option, the option expires if the asset price rises above the barrier, while in a down-and-out, it expires if the asset price falls below. Knockout options generally offer a lower premium than standard options since there is a chance they will expire worthless if the barrier is reached.\n",
-    "\n",
-    "Pricing knockout options involves accounting for the proximity of the asset's price to the barrier, as well as market volatility and the option’s time to expiration. High volatility and longer expiry increase the likelihood of the barrier being triggered, which reduces the option’s value. Models like modified Black-Scholes are used for simpler cases, while Monte Carlo simulations or binomial trees handle complex scenarios. Knockout options are useful for hedging or cost-effective investment strategies, allowing investors to save on premiums but with the risk of losing the option entirely if the barrier is hit.\n",
-    "\n",
-    "You will learn how to initialize the ValidMind Library, develop a option pricing model, and then write custom tests that can be used for sensitivity and stress testing to quickly generate documentation about model."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7417dfe1",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_4__)    \n",
-    "- [Model development](#toc3__)    \n",
-    "- [Data Preparation](#toc4__)    \n",
-    "  - [Synthetic data generation](#toc4_1__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc4_2__)    \n",
-    "  - [Data Quality](#toc4_3__)    \n",
-    "    - [Outliers detection using IQR method](#toc4_3_1__)    \n",
-    "    - [Isolation Forest Outliers Test](#toc4_3_2__)    \n",
-    "  - [Model Calibration](#toc4_4__)    \n",
-    "  - [Synthetic Data Calibration Test](#toc4_5__)    \n",
-    "  - [Model Evaluation](#toc4_6__)    \n",
-    "    - [Benchmark Testing](#toc4_6_1__)    \n",
-    "    - [Sensitivity Testing](#toc4_6_2__)    \n",
-    "    - [Greeks](#toc4_6_3__)    \n",
-    "  - [Delta](#toc4_7__)    \n",
-    "  - [Gamma](#toc4_8__)    \n",
-    "  - [Theta](#toc4_9__)    \n",
-    "  - [Vega](#toc4_10__)    \n",
-    "  - [Rho](#toc4_11__)    \n",
-    "    - [Stress Testing](#toc4_11_1__)    \n",
-    "- [Next steps](#toc5__)    \n",
-    "  - [Work with your model documentation](#toc5_1__)    \n",
-    "  - [Discover more learning resources](#toc5_2__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1426d212",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f8812717",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b792f6a9",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "c3d26e61",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f3db6c9b",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e1865b8d",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "214572ff",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Capital markets`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8b9547ad",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0cc9c04c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e928f7e5",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "9edb42a2",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%matplotlib inline\n",
-    "import pandas as pd\n",
-    "import numpy as np\n",
-    "import matplotlib.pyplot as plt\n",
-    "from scipy.optimize import minimize\n",
-    "\n",
-    "from validmind.tests import run_test"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a2403294",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "3dfd04dd",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d79d9953",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Model development"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 32,
-   "id": "c3f5b0b9",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "class OptionPricing:\n",
-    "    def __init__(self, S0, K, T, r):\n",
-    "        self.S0 = S0\n",
-    "        self.K = K\n",
-    "        self.T = T\n",
-    "        self.r = r\n",
-    "\n",
-    "    def monte_carlo_simulation(self, N, M):\n",
-    "        raise NotImplementedError(\"Must be implemented by subclasses\")\n",
-    "\n",
-    "    def price_option(self, N, M):\n",
-    "        raise NotImplementedError(\"Must be implemented by subclasses\")\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "a9d7f832",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "class BlackScholesModel(OptionPricing):\n",
-    "    def __init__(self, S0, K, T, r, sigma):\n",
-    "        super().__init__(S0, K, T, r)\n",
-    "        self.sigma = sigma\n",
-    "    def monte_carlo_simulation(self, N, M):\n",
-    "        dt = self.T / M\n",
-    "        price_paths = np.zeros((N, M + 1))\n",
-    "        price_paths[:, 0] = self.S0\n",
-    "        for t in range(1, M + 1):\n",
-    "            Z = np.random.standard_normal(N)\n",
-    "            price_paths[:, t] = price_paths[:, t - 1] * np.exp((self.r - 0.5 * self.sigma**2) * dt + self.sigma * np.sqrt(dt) * Z)\n",
-    "        return price_paths\n",
-    "\n",
-    "    def price_option(self, N, M):\n",
-    "        price_paths = self.monte_carlo_simulation(N, M)\n",
-    "        payoffs = np.maximum(price_paths[:, -1] - self.K, 0)\n",
-    "        return np.exp(-self.r * self.T) * np.mean(payoffs)\n",
-    "    \n",
-    "    def calibrate(self, market_prices, strikes, maturities):\n",
-    "        def objective_function(params):\n",
-    "            self.sigma = params[0]\n",
-    "            for K, T in zip(strikes, maturities):\n",
-    "                self.K = K\n",
-    "                self.T = T\n",
-    "                model_prices.append(self.price_option(10000, 100))\n",
-    "            return np.sum((np.array(market_prices) - np.array(model_prices))**2)\n",
-    "        result = minimize(objective_function, [self.sigma], bounds=[(0.01, 1.0)])\n",
-    "        self.sigma = result.x[0]\n",
-    "\n",
-    "class StochasticVolatilityModel(OptionPricing):\n",
-    "    def __init__(self, S0, K, T, r, v0, kappa, theta, xi, rho):\n",
-    "        super().__init__(S0, K, T, r)\n",
-    "        self.v0 = v0\n",
-    "        self.kappa = kappa\n",
-    "        self.theta = theta\n",
-    "        self.xi = xi\n",
-    "        self.rho = rho\n",
-    "    def monte_carlo_simulation(self, N, M):\n",
-    "        dt = self.T / M\n",
-    "        price_paths = np.zeros((N, M + 1))\n",
-    "        vol_paths = np.zeros((N, M + 1))\n",
-    "        price_paths[:, 0] = self.S0\n",
-    "        vol_paths[:, 0] = self.v0\n",
-    "        for t in range(1, M + 1):\n",
-    "            Z1 = np.random.standard_normal(N)\n",
-    "            Z2 = np.random.standard_normal(N)\n",
-    "            W1 = Z1\n",
-    "            W2 = self.rho * Z1 + np.sqrt(1 - self.rho**2) * Z2\n",
-    "            vol_paths[:, t] = np.abs(vol_paths[:, t - 1] + self.kappa * (self.theta - vol_paths[:, t - 1]) * dt + self.xi * np.sqrt(vol_paths[:, t - 1] * dt) * W1)\n",
-    "            price_paths[:, t] = price_paths[:, t - 1] * np.exp((self.r - 0.5 * vol_paths[:, t - 1]) * dt + np.sqrt(vol_paths[:, t - 1] * dt) * W2)\n",
-    "        return price_paths\n",
-    "\n",
-    "    def price_option(self, N, M):\n",
-    "        price_paths = self.monte_carlo_simulation(N, M)\n",
-    "        payoffs = np.maximum(price_paths[:, -1] - self.K, 0)\n",
-    "        return np.exp(-self.r * self.T) * np.mean(payoffs)\n",
-    "    \n",
-    "    def calibrate(self, market_prices, strikes, maturities):\n",
-    "        def objective_function(params):\n",
-    "            self.v0, self.kappa, self.theta, self.xi, self.rho = params\n",
-    "            model_prices = []\n",
-    "            for K, T in zip(strikes, maturities):\n",
-    "                self.K = K\n",
-    "                self.T = T\n",
-    "                model_prices.append(self.price_option(10000, 100))\n",
-    "\n",
-    "            return np.sum((np.array(market_prices) - np.array(model_prices))**2)\n",
-    "        \n",
-    "        initial_guess = [self.v0, self.kappa, self.theta, self.xi, self.rho]\n",
-    "        bounds = [(0.01, 1.0), (0.01, 5.0), (0.01, 1.0), (0.01, 1.0), (-1.0, 1.0)]\n",
-    "        result = minimize(objective_function, initial_guess, bounds=bounds)\n",
-    "        self.v0, self.kappa, self.theta, self.xi, self.rho = result.x\n",
-    "\n",
-    "\n",
-    "class KnockoutOption:\n",
-    "    def __init__(self, model, S0, K, T, r, barrier):\n",
-    "        self.model = model\n",
-    "        self.S0 = S0\n",
-    "        self.K = K\n",
-    "        self.T = T\n",
-    "        self.r = r\n",
-    "        self.barrier = barrier\n",
-    "\n",
-    "    def price_knockout_option(self, N, M):\n",
-    "        dt = self.T / M\n",
-    "        price_paths = np.zeros((N, M + 1))\n",
-    "        vol_paths = np.zeros((N, M + 1)) if isinstance(self.model, StochasticVolatilityModel) else None\n",
-    "        price_paths[:, 0] = self.S0\n",
-    "        if vol_paths is not None:\n",
-    "            vol_paths[:, 0] = self.model.v0\n",
-    "        \n",
-    "        for t in range(1, M + 1):\n",
-    "            Z1 = np.random.standard_normal(N)\n",
-    "            if vol_paths is None:\n",
-    "                # Black-Scholes Model\n",
-    "                price_paths[:, t] = price_paths[:, t - 1] * np.exp(\n",
-    "                    (self.r - 0.5 * self.model.sigma**2) * dt + self.model.sigma * np.sqrt(dt) * Z1\n",
-    "                )\n",
-    "            else:\n",
-    "                # Stochastic Volatility Model\n",
-    "                Z2 = np.random.standard_normal(N)\n",
-    "                W1 = Z1\n",
-    "                W2 = self.model.rho * Z1 + np.sqrt(1 - self.model.rho**2) * Z2\n",
-    "                vol_paths[:, t] = np.abs(vol_paths[:, t - 1] + self.model.kappa * (self.model.theta - vol_paths[:, t - 1]) * dt + self.model.xi * np.sqrt(vol_paths[:, t - 1] * dt) * W1)\n",
-    "                price_paths[:, t] = price_paths[:, t - 1] * np.exp(\n",
-    "                    (self.r - 0.5 * vol_paths[:, t - 1]) * dt + np.sqrt(vol_paths[:, t - 1] * dt) * W2\n",
-    "                )\n",
-    "            \n",
-    "            # Knockout condition\n",
-    "            price_paths[:, t][price_paths[:, t] >= self.barrier] = 0\n",
-    "        payoffs = np.maximum(price_paths[:, -1] - self.K, 0)\n",
-    "        return np.exp(-self.r * self.T) * np.mean(payoffs)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "14bcdbb9",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Data Preparation"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f655dc9c",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Synthetic data generation"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 34,
-   "id": "42cb9070",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def generate_synthetic_market_data(model, strikes, maturities):\n",
-    "    market_prices = []\n",
-    "    market_data = []\n",
-    "    for K, T in zip(strikes, maturities):\n",
-    "        model.K = K\n",
-    "        model.T = T\n",
-    "        market_prices.append(model.price_option(10000, 100))\n",
-    "        market_data.append({\"strike\": K, \"option_price\": model.price_option(10000, 100)})\n",
-    "    return market_prices, market_data\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "2854fbe3",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "N = 10000\n",
-    "M = 100\n",
-    "\n",
-    "# Parameters for synthetic data\n",
-    "S0 = 100\n",
-    "K = 100\n",
-    "T = 1\n",
-    "r = 0.05\n",
-    "# BlackSholes\n",
-    "true_sigma = 0.2\n",
-    "\n",
-    "# Stochastic Volatility\n",
-    "true_v0 = 0.2\n",
-    "true_kappa = 2.0\n",
-    "true_theta = 0.2\n",
-    "true_xi = 0.1\n",
-    "true_rho = -0.5\n",
-    "\n",
-    "# Synthetic data generation parameters\n",
-    "strikes = list(np.linspace(75, 130, 25))\n",
-    "maturities = list(np.linspace(0.2, 3.0, 25))\n",
-    "\n",
-    "# Generate synthetic market data using the true parameters\n",
-    "bs_model = BlackScholesModel(S0, K, T, r, true_sigma)\n",
-    "bs_market_prices, bs_market_data = generate_synthetic_market_data(bs_model, strikes, maturities)\n",
-    "\n",
-    "\n",
-    "sv_model = StochasticVolatilityModel(S0, K, T, r, true_v0, true_kappa, true_theta, true_xi, true_rho)\n",
-    "sv_market_prices, sv_market_data = generate_synthetic_market_data(sv_model, strikes, maturities)\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b54c4950",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "7f3498dd",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "bs_market_data_df = pd.DataFrame(bs_market_data)\n",
-    "vm_bs_market_data = vm.init_dataset(\n",
-    "    dataset=bs_market_data_df,\n",
-    "    input_id=\"sv_market_data\",\n",
-    ")\n",
-    "\n",
-    "sv_market_data_df = pd.DataFrame(sv_market_data)\n",
-    "vm_sv_market_data = vm.init_dataset(\n",
-    "    dataset=sv_market_data_df,\n",
-    "    input_id=\"sv_market_data\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7b36b59c",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3__'></a>\n",
-    "\n",
-    "### Data Quality\n",
-    "Let's check quality of the data using outliers and missing data tests."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "671330b1",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3_1__'></a>\n",
-    "\n",
-    "#### Outliers detection using IQR method\n",
-    "Let's visualizes the distribution of outliers in the option_price feature using the Interquartile Range (IQR) method."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "f1c1ab6f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"validmind.data_validation.IQROutliersBarPlot:BlackScholes\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_bs_market_data,\n",
-    "    },\n",
-    "    title=\"Outliers detection using IQR method for BlackScholes\",\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "6b5e8654",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"validmind.data_validation.IQROutliersTable:BlackScholes\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_bs_market_data,\n",
-    "    },\n",
-    "    title=\"Outliers table using IQR method for BlackScholes\",\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d96f10c7",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"validmind.data_validation.IQROutliersBarPlot:StochasticVolatility\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_sv_market_data,\n",
-    "    },\n",
-    "    title=\"Outliers detection using IQR method for StochasticVolatility\",\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "758c4c57",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"validmind.data_validation.IQROutliersTable:StochasticVolatility\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_sv_market_data,\n",
-    "    },\n",
-    "    title=\"Outliers table using IQR method for StochasticVolatility\",\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b1430200",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3_2__'></a>\n",
-    "\n",
-    "#### Isolation Forest Outliers Test\n",
-    "Let's detects anomalies in the dataset using the Isolation Forest algorithm, visualized through scatter plots."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "9eb91453",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"validmind.data_validation.IsolationForestOutliers:BlackScholes\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_bs_market_data,\n",
-    "    },\n",
-    "    title=\"Outliers detection using Isolation Forest for BlackScholes\",\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "12940f8e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"validmind.data_validation.IsolationForestOutliers:StochasticVolatility\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_sv_market_data,\n",
-    "    },\n",
-    "    title=\"Outliers detection using Isolation Forest for StochasticVolatility\",\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f30e5579",
-   "metadata": {},
-   "source": [
-    "##### Missing Values Test\n",
-    "Let's evaluates dataset quality by ensuring the missing value ratio across all features does not exceed a set threshold."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "805ddb1c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"validmind.data_validation.MissingValues:BlackScholes\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_bs_market_data,\n",
-    "    },\n",
-    "    title=\"Missing Values detection for BlackScholes\",\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e69e0039",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "result = run_test(\n",
-    "    \"validmind.data_validation.MissingValues:StochasticVolatility\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_sv_market_data,\n",
-    "    },\n",
-    "    title=\"MissingValues detection for StochasticVolatility\",\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "09628809",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4__'></a>\n",
-    "\n",
-    "### Model Calibration\n",
-    "* Clearly state the purpose of the calibration process. For example, in the context of an option pricing model, calibration aims to adjust model parameters to fit market data (e.g., market option prices, volatility surfaces).\n",
-    "* Specify whether the calibration is to historical data, current market data, or a blend of both."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "6802c26e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.SyntheticDataCalibrationTest\")\n",
-    "def generate_synthetic_data_summary(option_pricing_model, strikes, maturities, synthetic_prices):\n",
-    "    \"\"\"\n",
-    "    This function will use synthetic prices to calibrate each model\n",
-    "    and then generate derived prices based on the calibrated parameters.\n",
-    "    It will output a DataFrame summarizing the strikes, maturities,\n",
-    "    synthetic and derived prices, and the model parameters.\n",
-    "\n",
-    "    \"\"\"\n",
-    "    derived_prices = []\n",
-    "    for K, T in zip(strikes, maturities):\n",
-    "        option_pricing_model.K = K\n",
-    "        option_pricing_model.T = T\n",
-    "        derived_prices.append(option_pricing_model.price_option(10000, 100))\n",
-    "    \n",
-    "    model_type = type(option_pricing_model).__name__\n",
-    "    data = {\n",
-    "        \"Strike\": strikes,\n",
-    "        \"Maturity\": maturities,\n",
-    "        \"Synthetic_Price\": synthetic_prices,\n",
-    "        \"Derived_Price\": derived_prices,\n",
-    "        \"Model_Type\": model_type,\n",
-    "        \"S0\": [option_pricing_model.S0] * len(strikes),\n",
-    "        \"K\": [option_pricing_model.K] * len(strikes),\n",
-    "        \"T\": [option_pricing_model.T] * len(strikes),\n",
-    "        \"r\": [option_pricing_model.r] * len(strikes)\n",
-    "    }\n",
-    "    \n",
-    "    if model_type == \"BlackScholesModel\":\n",
-    "        data[\"sigma\"] = [option_pricing_model.sigma] * len(strikes)\n",
-    "    elif model_type == \"StochasticVolatilityModel\":\n",
-    "        data[\"v0\"] = [option_pricing_model.v0] * len(strikes)\n",
-    "        data[\"kappa\"] = [option_pricing_model.kappa] * len(strikes)\n",
-    "        data[\"theta\"] = [option_pricing_model.theta] * len(strikes)\n",
-    "        data[\"xi\"] = [option_pricing_model.xi] * len(strikes)\n",
-    "        data[\"rho\"] = [option_pricing_model.rho] * len(strikes)\n",
-    "    \n",
-    "    df = pd.DataFrame(data)\n",
-    "    return df\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3bf04d21",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_5__'></a>\n",
-    "\n",
-    "### Synthetic Data Calibration Test\n",
-    "Let's evaluate the accuracy of a stochastic volatility model by comparing synthetic prices with derived prices after model calibration."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "4345cb5c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.SyntheticDataCalibrationTest\",\n",
-    "    params={\n",
-    "        \"option_pricing_model\": sv_model,\n",
-    "        \"strikes\": strikes,\n",
-    "        \"maturities\": maturities,\n",
-    "        \"synthetic_prices\": sv_market_prices\n",
-    "    },\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4d48f107",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_6__'></a>\n",
-    "\n",
-    "### Model Evaluation"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "8ec8b5a3",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_6_1__'></a>\n",
-    "\n",
-    "#### Benchmark Testing\n",
-    "* Compare the model’s performance with alternative models or industry-standard models to assess its relative effectiveness.\n",
-    "* Ensure that the model is competitive in pricing, accuracy, and computational efficiency."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 47,
-   "id": "ac733262",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.BenchmarkTest\")\n",
-    "def benchmark_test(bs_model, sv_model, strikes, maturities):\n",
-    "    \"\"\"\n",
-    "    Comparison between Black Scholes and stochastic volatility model\n",
-    "\n",
-    "    \"\"\"\n",
-    "    bs_model_type = type(bs_model).__name__\n",
-    "    sv_model_type = type(sv_model).__name__\n",
-    "\n",
-    "    bs_derived_prices = []\n",
-    "    sv_derived_prices = []\n",
-    "    for K in strikes:\n",
-    "        bs_model.K = K\n",
-    "        bs_derived_prices.append(bs_model.price_option(10000, 100))\n",
-    "        sv_model.K = K\n",
-    "        sv_derived_prices.append(sv_model.price_option(10000, 100))\n",
-    "\n",
-    "    data = {\n",
-    "        \"Strike\": strikes,\n",
-    "        \"Maturities\": [sv_model.T] * len(strikes),\n",
-    "        \"bs_model_price\": bs_derived_prices,\n",
-    "        \"sv_model_price\": sv_derived_prices,\n",
-    "\n",
-    "    }\n",
-    "    df1 = pd.DataFrame(data)\n",
-    "\n",
-    "    bs_derived_prices = []\n",
-    "    sv_derived_prices = []\n",
-    "    for T in maturities:\n",
-    "        bs_model.T = T\n",
-    "        bs_derived_prices.append(bs_model.price_option(10000, 100))\n",
-    "        sv_model.T = T\n",
-    "        sv_derived_prices.append(sv_model.price_option(10000, 100))\n",
-    "\n",
-    "    data = {\n",
-    "        \"Strike\": [sv_model.K] * len(maturities),\n",
-    "        \"Maturities\": maturities,\n",
-    "        \"bs_model_price\": bs_derived_prices,\n",
-    "        \"sv_model_price\": sv_derived_prices,\n",
-    "    }\n",
-    "\n",
-    "    df2 = pd.DataFrame(data)\n",
-    "\n",
-    "    return {\"strikes variation benchmarking\": df1}, {\"maturities variation benchmarking\": df2}"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "20de9858",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.BenchmarkTest\",\n",
-    "    params={\n",
-    "        \"sv_model\": sv_model,\n",
-    "        \"bs_model\": bs_model,\n",
-    "        \"strikes\": strikes,\n",
-    "        \"maturities\": maturities,\n",
-    "    },\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d9ad15b8",
-   "metadata": {},
-   "source": [
-    "##### Surface Volatility Test\n",
-    "Let's calculate the implied volatility across different strikes and maturities based on market prices."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 49,
-   "id": "46e275e3",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import numpy as np\n",
-    "import pandas as pd\n",
-    "from scipy.optimize import minimize\n",
-    "import plotly.graph_objects as go\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.ImpliedVolSurface\")\n",
-    "def implied_vol_surface(market_prices, strikes, maturities, S0, r, barrier, N=10000, M=100):\n",
-    "    \"\"\"\n",
-    "    This is a test to compute the implied volatility surface for a given set of market prices,\n",
-    "    strikes, and maturities.\n",
-    "    \"\"\"\n",
-    "    def implied_volatility(market_price, N, M, initial_guess=0.2):\n",
-    "        def objective_function(sigma):\n",
-    "            model.sigma = sigma\n",
-    "            model_price = model.price_option(N, M)\n",
-    "            return (model_price - market_price) ** 2\n",
-    "\n",
-    "        result = minimize(objective_function, initial_guess, bounds=[(0.01, 1.0)])\n",
-    "        return result.x[0]\n",
-    "    \n",
-    "    implied_vols = np.zeros((len(strikes), len(maturities)))\n",
-    "\n",
-    "    for i, K in enumerate(strikes):\n",
-    "        for j, T in enumerate(maturities):\n",
-    "            market_price = market_prices[i]\n",
-    "            model = BlackScholesModel(S0, K, T, r, sigma=0.2)\n",
-    "\n",
-    "            implied_vol = implied_volatility(market_price, N, M)\n",
-    "            implied_vols[i, j] = implied_vol\n",
-    "\n",
-    "    # Create the 3D surface plot\n",
-    "    X, Y = np.meshgrid(strikes, maturities)\n",
-    "    Z = implied_vols.T  # Transpose to match the meshgrid orientation\n",
-    "\n",
-    "    fig = go.Figure(data=[go.Surface(x=X, y=Y, z=Z)])\n",
-    "    \n",
-    "    # Update the layout\n",
-    "    fig.update_layout(\n",
-    "        title=f'3D Surface Plot of Implied Volatility',\n",
-    "        scene=dict(\n",
-    "            xaxis_title='Strike',\n",
-    "            yaxis_title='Maturity',\n",
-    "            zaxis_title='Implied Volatility',\n",
-    "            camera=dict(\n",
-    "                up=dict(x=0, y=0, z=1),\n",
-    "                center=dict(x=0, y=0, z=0),\n",
-    "                eye=dict(x=1.5, y=1.5, z=1.5)\n",
-    "            )\n",
-    "        ),\n",
-    "        width=900,\n",
-    "        height=700,\n",
-    "        margin=dict(l=65, r=50, b=65, t=90)\n",
-    "    )\n",
-    "\n",
-    "    return fig"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "66ca002a",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.ImpliedVolSurface\",\n",
-    "    params={\n",
-    "        \"market_prices\": sv_market_prices,\n",
-    "        \"strikes\": strikes,\n",
-    "        \"maturities\": maturities,\n",
-    "        \"S0\": S0,\n",
-    "        \"r\": r,\n",
-    "        \"barrier\": 120\n",
-    "    }\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a49d8a1e",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_6_2__'></a>\n",
-    "\n",
-    "#### Sensitivity Testing"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "784a5e7c",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "@vm.test(\"my_custom_tests.Sensitivity\")\n",
-    "def sensitivity_test(model_type, S0, T, r, N, M, strike=None, barrier=None, sigma=None, v0=None, kappa=None,theta=None, xi=None, rho=None):\n",
-    "    \"\"\"\n",
-    "    This is sensitivity test\n",
-    "\"\"\"\n",
-    "    if model_type == 'BS':\n",
-    "        model = BlackScholesModel(S0, strike, T, r, sigma)\n",
-    "    else:\n",
-    "        model = StochasticVolatilityModel(S0, strike, T, r, v0, kappa, theta, xi, rho)\n",
-    "    \n",
-    "    knockout_option = KnockoutOption(model, S0, strike, T, r, barrier)\n",
-    "    price = knockout_option.price_knockout_option(N, M)\n",
-    "\n",
-    "    return pd.DataFrame({\"Option price\": [price]})"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "d4be30e6",
-   "metadata": {},
-   "source": [
-    "##### Initialise parameters"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "46878b84",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "strike_range = (min(strikes), max(strikes))\n",
-    "barrier_range = (100, 120)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "205c46ce",
-   "metadata": {},
-   "source": [
-    "##### Common plot function\n",
-    "Let's create a line plot using the default result output data and log it by passing the function through the `post_process_fn` parameter in the `run_test()` method."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d4b9ea2f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from plotly.express import bar\n",
-    "from validmind.vm_models.figure import Figure\n",
-    "from validmind.vm_models.result import TestResult\n",
-    "import plotly.graph_objects as go\n",
-    "import random\n",
-    "\n",
-    "def process_results(result: TestResult):\n",
-    "\n",
-    "    # Convert to DataFrame\n",
-    "    df = pd.DataFrame(result.tables[0].data)\n",
-    "    \n",
-    "    # Get the first two column names\n",
-    "    x_col = df.columns[0]\n",
-    "    y_col = df.columns[1]\n",
-    "    \n",
-    "    # Create figure\n",
-    "    fig = go.Figure()\n",
-    "    fig.add_trace(\n",
-    "        go.Scatter(\n",
-    "            x=df[x_col],\n",
-    "            y=df[y_col],\n",
-    "            mode='lines',\n",
-    "            name=y_col  # Use y-axis column name as trace name\n",
-    "        )\n",
-    "    )\n",
-    "    \n",
-    "    fig.update_layout(\n",
-    "        xaxis_title=x_col,\n",
-    "        yaxis_title=y_col,\n",
-    "        showlegend=True,\n",
-    "        template=\"plotly_white\"\n",
-    "    )\n",
-    "\n",
-    "    result.add_figure(\n",
-    "        Figure(\n",
-    "            figure=fig,\n",
-    "            key=\"sensitivity_plot_\" + str(random.randint(0, 1000000)),\n",
-    "            ref_id=result.ref_id,\n",
-    "        )\n",
-    "    )\n",
-    "\n",
-    "    return result"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "528b409c",
-   "metadata": {},
-   "source": [
-    "##### Strike sensitivity Test\n",
-    "Let's evaluate the sensitivity of a model's output value to changes in the strike price, while keeping other parameters constant.\n",
-    "This test is crucial for understanding how variations in strike prices affect the valuation of financial derivatives, particularly options."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "bb8f1cab",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Sensitivity:S0\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [N],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\":[strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": [-0.5],\n",
-    "    },\n",
-    "    post_process_fn= process_results\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e566a681",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Sensitivity:ToStrike\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [N],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\": list(np.linspace(strike_range[0], strike_range[1], 20)),\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": [S0],\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": [-0.5],\n",
-    "    },\n",
-    "    post_process_fn= process_results\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0f288663",
-   "metadata": {},
-   "source": [
-    "##### Barrier Sensitivity Test\n",
-    "Let's evaluate the sensitivity of a model's output to changes in the barrier level of a financial derivative, specifically a barrier option. This test is crucial for understanding how small changes in the barrier can impact the option's valuation, which is essential for risk management and pricing strategies."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "95f81283",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Sensitivity:ToBarrier\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [N],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\": [strike_range[0]],\n",
-    "        \"barrier\": list(np.linspace(barrier_range[0], barrier_range[1], 20)),\n",
-    "        \"S0\": [S0],\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": [-0.5],\n",
-    "    },\n",
-    "    post_process_fn=process_results\n",
-    "\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "3201aa09",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_6_3__'></a>\n",
-    "\n",
-    "#### Greeks\n",
-    "These Greeks are crucial for traders and risk managers as they provide insights into the risk and potential price movements of options and derivatives, allowing for more informed decision-making and risk management strategies."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f31afc73",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_7__'></a>\n",
-    "\n",
-    "### Delta\n",
-    "Delta measures the sensitivity of the option's price to a change in the price of the underlying asset. It indicates how much the price of an option is expected to move per $1 change in the underlying asset's price."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 30,
-   "id": "31befc58",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.GreeksDelta\")\n",
-    "def calculate_delta(model_type, S0, T, r, N, M, strike=None, barrier=None, \n",
-    "                   sigma=None, v0=None, kappa=None, theta=None, xi=None, rho=None, \n",
-    "                   h=0.001):  # h is the step size for finite difference\n",
-    "    \"\"\"\n",
-    "    Calculate delta using finite difference method.\n",
-    "    Delta = (V(S0 + h) - V(S0 - h)) / (2h)\n",
-    "    where V is the option price and h is a small increment\n",
-    "    \"\"\"\n",
-    "    # Initialize the model with S0 + h\n",
-    "    if model_type == 'BS':\n",
-    "        model_up = BlackScholesModel(S0 + h, strike, T, r, sigma)\n",
-    "        model_down = BlackScholesModel(S0 - h, strike, T, r, sigma)\n",
-    "    else:\n",
-    "        model_up = StochasticVolatilityModel(S0 + h, strike, T, r, v0, kappa, theta, xi, rho)\n",
-    "        model_down = StochasticVolatilityModel(S0 - h, strike, T, r, v0, kappa, theta, xi, rho)\n",
-    "    \n",
-    "\n",
-    "    # Calculate option prices for up and down moves\n",
-    "    knockout_up = KnockoutOption(model_up, S0 + h, strike, T, r, barrier)\n",
-    "    knockout_down = KnockoutOption(model_down, S0 - h, strike, T, r, barrier)\n",
-    "    \n",
-    "    price_up = knockout_up.price_knockout_option(N, M)\n",
-    "    price_down = knockout_down.price_knockout_option(N, M)\n",
-    "    \n",
-    "    # Calculate delta using central difference\n",
-    "    delta = (price_up - price_down) / (2 * h)\n",
-    "    df = pd.DataFrame({\"Delta\": [delta], \"Price_Up\": [price_up], \"Price_Down\": [price_down], \"h\": [h]})\n",
-    "    return df\n",
-    "\n"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "a033dd96",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# To analyze delta sensitivity to underlying price changes\n",
-    "result = run_test(\n",
-    "    \"my_custom_tests.GreeksDelta\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [1000000],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\":[strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": [-0.5],\n",
-    "        \"h\": [0.001]\n",
-    "    },\n",
-    "post_process_fn=process_results  # Using the plotting function defined earlier\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0826d4dc",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_8__'></a>\n",
-    "\n",
-    "### Gamma\n",
-    "Gamma measures the rate of change of Delta with respect to changes in the underlying asset's price. It indicates the curvature of the option's price relative to the underlying asset's price."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "ccf54452",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.GreeksGamma\")\n",
-    "def calculate_gamma(model_type, S0, T, r, N, M, strike=None, barrier=None, \n",
-    "                   sigma=None, v0=None, kappa=None, theta=None, xi=None, rho=None, \n",
-    "                   h=0.01):  # h is the step size for finite difference\n",
-    "    \"\"\"\n",
-    "    Calculate gamma using finite difference method.\n",
-    "    Gamma = (V(S0 + h) - 2V(S0) + V(S0 - h)) / h^2\n",
-    "    where V is the option price and h is a small increment\n",
-    "    \"\"\"\n",
-    "    # Initialize the models with S0 + h, S0, and S0 - h\n",
-    "    if model_type == 'BS':\n",
-    "        model_up = BlackScholesModel(S0 + h, strike, T, r, sigma)\n",
-    "        model_center = BlackScholesModel(S0, strike, T, r, sigma)\n",
-    "        model_down = BlackScholesModel(S0 - h, strike, T, r, sigma)\n",
-    "    else:\n",
-    "        model_up = StochasticVolatilityModel(S0 + h, strike, T, r, v0, kappa, theta, xi, rho)\n",
-    "        model_center = StochasticVolatilityModel(S0, strike, T, r, v0, kappa, theta, xi, rho)\n",
-    "        model_down = StochasticVolatilityModel(S0 - h, strike, T, r, v0, kappa, theta, xi, rho)\n",
-    "    \n",
-    "    # Calculate option prices for up, center, and down moves\n",
-    "    knockout_up = KnockoutOption(model_up, S0 + h, strike, T, r, barrier)\n",
-    "    knockout_center = KnockoutOption(model_center, S0, strike, T, r, barrier)\n",
-    "    knockout_down = KnockoutOption(model_down, S0 - h, strike, T, r, barrier)\n",
-    "    \n",
-    "    price_up = knockout_up.price_knockout_option(N, M)\n",
-    "    price_center = knockout_center.price_knockout_option(N, M)\n",
-    "    price_down = knockout_down.price_knockout_option(N, M)\n",
-    "    \n",
-    "    # Calculate gamma using second-order central difference\n",
-    "    gamma = (price_up - 2*price_center + price_down) / (h * h)\n",
-    "    \n",
-    "    df = pd.DataFrame({\n",
-    "        \"Gamma\": [gamma], \n",
-    "        \"Price_Up\": [price_up], \n",
-    "        \"Price_Center\": [price_center],\n",
-    "        \"Price_Down\": [price_down], \n",
-    "        \"h\": [h]\n",
-    "    })\n",
-    "    return df\n",
-    "\n",
-    "# To analyze gamma sensitivity to underlying price changes\n",
-    "result = run_test(\n",
-    "    \"my_custom_tests.GreeksGamma\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [1000000],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\":[strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": [-0.5],\n",
-    "        \"h\": [0.1]\n",
-    "    },\n",
-    "    post_process_fn=process_results  # Using the plotting function defined earlier\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "df0eaa72",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_9__'></a>\n",
-    "\n",
-    "### Theta\n",
-    "Theta measures the sensitivity of the option's price to the passage of time, also known as time decay. It indicates how much the price of an option is expected to decrease as the option approaches its expiration date."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0e9810b1",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.GreeksTheta\")\n",
-    "def calculate_theta(model_type, S0, T, r, N, M, strike=None, barrier=None, \n",
-    "                   sigma=None, v0=None, kappa=None, theta=None, xi=None, rho=None, \n",
-    "                   dt=1/365):  # dt is typically one day\n",
-    "    \"\"\"\n",
-    "    Calculate theta using finite difference method.\n",
-    "    Theta = (V(t + dt) - V(t)) / dt\n",
-    "    where V is the option price and dt is a small time increment (typically 1 day)\n",
-    "    \"\"\"\n",
-    "    # Initialize the models with T and T + dt\n",
-    "    if model_type == 'BS':\n",
-    "        model_current = BlackScholesModel(S0, strike, T, r, sigma)\n",
-    "        model_future = BlackScholesModel(S0, strike, T + dt, r, sigma)\n",
-    "    else:\n",
-    "        model_current = StochasticVolatilityModel(S0, strike, T, r, v0, kappa, theta, xi, rho)\n",
-    "        model_future = StochasticVolatilityModel(S0, strike, T + dt, r, v0, kappa, theta, xi, rho)\n",
-    "    \n",
-    "    # Calculate option prices for current and future time\n",
-    "    knockout_current = KnockoutOption(model_current, S0, strike, T, r, barrier)\n",
-    "    knockout_future = KnockoutOption(model_future, S0, strike, T + dt, r, barrier)\n",
-    "    \n",
-    "    price_current = knockout_current.price_knockout_option(N, M)\n",
-    "    price_future = knockout_future.price_knockout_option(N, M)\n",
-    "    \n",
-    "    # Calculate theta using forward difference\n",
-    "    # Note: We divide by dt and multiply by -1 since theta represents the negative rate of change\n",
-    "    theta_value = -1 * (price_future - price_current) / dt\n",
-    "    \n",
-    "    df = pd.DataFrame({\n",
-    "        \"Theta\": [theta_value], \n",
-    "        \"Price_Current\": [price_current],\n",
-    "        \"Price_Future\": [price_future],\n",
-    "        \"dt\": [dt]\n",
-    "    })\n",
-    "    return df\n",
-    "\n",
-    "# Example usage to analyze theta sensitivity across different underlying prices\n",
-    "result = run_test(\n",
-    "    \"my_custom_tests.GreeksTheta\",\n",
-    "    param_grid={\n",
-    "               \"model_type\": ['SV'],\n",
-    "        \"N\": [1000000],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\":[strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": [-0.5],\n",
-    "        \"dt\": [1/365]  # One day time step\n",
-    "    },\n",
-    "    post_process_fn=process_results  # Using the plotting function defined earlier\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "28c60e1d",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_10__'></a>\n",
-    "\n",
-    "### Vega\n",
-    "Vega measures the sensitivity of the option's price to changes in the volatility of the underlying asset. It indicates how much the price of an option is expected to change with a 1% change in the underlying asset's volatility."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "1dbc6632",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.GreeksVega\")\n",
-    "def calculate_vega(model_type, S0, T, r, N, M, strike=None, barrier=None, \n",
-    "                  sigma=None, v0=None, kappa=None, theta=None, xi=None, rho=None, \n",
-    "                  h=0.001):  # h is the step size for finite difference\n",
-    "    \"\"\"\n",
-    "    Calculate vega using finite difference method.\n",
-    "    For Black-Scholes: Vega = (V(σ + h) - V(σ - h)) / (2h)\n",
-    "    For Stochastic Vol: Vega = (V(v0 + h) - V(v0 - h)) / (2h)\n",
-    "    where V is the option price and h is a small increment in volatility\n",
-    "    \"\"\"\n",
-    "    if model_type == 'BS':\n",
-    "        # For Black-Scholes, perturb sigma\n",
-    "        model_up = BlackScholesModel(S0, strike, T, r, sigma + h)\n",
-    "        model_down = BlackScholesModel(S0, strike, T, r, sigma - h)\n",
-    "    else:\n",
-    "        # For Stochastic Volatility, perturb v0\n",
-    "        model_up = StochasticVolatilityModel(S0, strike, T, r, v0 + h, kappa, theta, xi, rho)\n",
-    "        model_down = StochasticVolatilityModel(S0, strike, T, r, v0 - h, kappa, theta, xi, rho)\n",
-    "    \n",
-    "    # Calculate option prices for up and down moves in volatility\n",
-    "    knockout_up = KnockoutOption(model_up, S0, strike, T, r, barrier)\n",
-    "    knockout_down = KnockoutOption(model_down, S0, strike, T, r, barrier)\n",
-    "    \n",
-    "    price_up = knockout_up.price_knockout_option(N, M)\n",
-    "    price_down = knockout_down.price_knockout_option(N, M)\n",
-    "    \n",
-    "    # Calculate vega using central difference\n",
-    "    vega = (price_up - price_down) / (2 * h)\n",
-    "    \n",
-    "    df = pd.DataFrame({\n",
-    "        \"Vega\": [vega], \n",
-    "        \"Price_Up\": [price_up], \n",
-    "        \"Price_Down\": [price_down], \n",
-    "        \"h\": [h]\n",
-    "    })\n",
-    "    return df\n",
-    "\n",
-    "# Example usage to analyze vega sensitivity across different underlying prices\n",
-    "result = run_test(\n",
-    "    \"my_custom_tests.GreeksVega\",\n",
-    "    param_grid={\n",
-    "                \"model_type\": ['SV'],\n",
-    "        \"N\": [1000000],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\":[strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": [-0.5],\n",
-    "        \"h\": [0.0001]  # Small step size for better accuracy\n",
-    "    },\n",
-    "    post_process_fn=process_results  # Using the plotting function defined earlier\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "1ec51eba",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_11__'></a>\n",
-    "\n",
-    "### Rho\n",
-    "Rho measures the sensitivity of the option's price to changes in the interest rate. It indicates how much the price of an option is expected to change with a 1% change in interest rates."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "2f497b5f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.GreeksRho\")\n",
-    "def calculate_rho(model_type, S0, T, r, N, M, strike=None, barrier=None, \n",
-    "                 sigma=None, v0=None, kappa=None, theta=None, xi=None, rho=None, \n",
-    "                 h=0.0001):  # h is the step size for finite difference\n",
-    "    \"\"\"\n",
-    "    Calculate rho using finite difference method.\n",
-    "    Rho = (V(r + h) - V(r - h)) / (2h)\n",
-    "    where V is the option price and h is a small increment in interest rate\n",
-    "    \"\"\"\n",
-    "    # Initialize the models with r + h and r - h\n",
-    "    if model_type == 'BS':\n",
-    "        model_up = BlackScholesModel(S0, strike, T, r + h, sigma)\n",
-    "        model_down = BlackScholesModel(S0, strike, T, r - h, sigma)\n",
-    "    else:\n",
-    "        model_up = StochasticVolatilityModel(S0, strike, T, r + h, v0, kappa, theta, xi, rho)\n",
-    "        model_down = StochasticVolatilityModel(S0, strike, T, r - h, v0, kappa, theta, xi, rho)\n",
-    "    \n",
-    "    # Calculate option prices for up and down moves in interest rate\n",
-    "    knockout_up = KnockoutOption(model_up, S0, strike, T, r + h, barrier)\n",
-    "    knockout_down = KnockoutOption(model_down, S0, strike, T, r - h, barrier)\n",
-    "    \n",
-    "    price_up = knockout_up.price_knockout_option(N, M)\n",
-    "    price_down = knockout_down.price_knockout_option(N, M)\n",
-    "    \n",
-    "    # Calculate rho using central difference\n",
-    "    rho_value = (price_up - price_down) / (2 * h)\n",
-    "    \n",
-    "    df = pd.DataFrame({\n",
-    "        \"Rho\": [rho_value], \n",
-    "        \"Price_Up\": [price_up], \n",
-    "        \"Price_Down\": [price_down], \n",
-    "        \"h\": [h]\n",
-    "    })\n",
-    "    return df\n",
-    "\n",
-    "# Example usage to analyze rho sensitivity across different underlying prices\n",
-    "result = run_test(\n",
-    "    \"my_custom_tests.GreeksRho\",\n",
-    "    param_grid={\n",
-    "               \"model_type\": ['SV'],\n",
-    "        \"N\": [1000000],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\":[strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": [-0.5],\n",
-    "        \"h\": [0.0001]  # Small step size for better accuracy\n",
-    "    },\n",
-    "    post_process_fn=process_results  # Using the plotting function defined earlier\n",
-    ")\n",
-    "result.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0cdd1b1b",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_11_1__'></a>\n",
-    "\n",
-    "#### Stress Testing"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "c98ff396",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.Stressing\")\n",
-    "def sensitivity_test(model_type, S0, T, r, N, M, strike=None, barrier=None, sigma=None, v0=None, kappa=None,theta=None, xi=None, rho=None):\n",
-    "    \"\"\"\n",
-    "    This is stress test\n",
-    "    \"\"\"\n",
-    "    if model_type == 'BS':\n",
-    "        model = BlackScholesModel(S0, strike, T, r, sigma)\n",
-    "    else:\n",
-    "        model = StochasticVolatilityModel(S0, strike, T, r, v0, kappa, theta, xi, rho)\n",
-    "    \n",
-    "    knockout_option = KnockoutOption(model, S0, strike, T, r, barrier)\n",
-    "    price = knockout_option.price_knockout_option(N, M)\n",
-    "\n",
-    "    return pd.DataFrame({\"Option price\": [price]})"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b6f0a179",
-   "metadata": {},
-   "source": [
-    "##### Rho (correlation) and Theta (long term vol) stress test\n",
-    "First, we create a surface plot to visualize the option price with respect to two variables."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b408de0f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def two_parameters_stress_surface_plot(result: TestResult):\n",
-    "    import plotly.graph_objects as go\n",
-    "    import numpy as np\n",
-    "    import pandas as pd\n",
-    "    # Convert to DataFrame\n",
-    "    data = pd.DataFrame(result.tables[0].data)\n",
-    "    \n",
-    "    # Get column names (assuming first column is x, next two are y1 and y2)\n",
-    "    z_col = data.columns[2]\n",
-    "    x_col = data.columns[0]\n",
-    "    y_col = data.columns[1]\n",
-    "    \n",
-    "    # Get unique values for x and y\n",
-    "    x_unique = np.sort(data[x_col].unique())\n",
-    "    y_unique = np.sort(data[y_col].unique())\n",
-    "    \n",
-    "    # Create meshgrid\n",
-    "    X, Y = np.meshgrid(x_unique, y_unique)\n",
-    "    \n",
-    "    # Create Z matrix\n",
-    "    Z = np.zeros_like(X)\n",
-    "    for i, x_val in enumerate(x_unique):\n",
-    "        for j, y_val in enumerate(y_unique):\n",
-    "            mask = (data[x_col] == x_val) & (data[y_col] == y_val)\n",
-    "            if mask.any():\n",
-    "                Z[j, i] = data.loc[mask, z_col].iloc[0]\n",
-    "    \n",
-    "    # Create the 3D surface plot\n",
-    "    fig = go.Figure(data=[go.Surface(x=X, y=Y, z=Z)])\n",
-    "    \n",
-    "    # Update the layout\n",
-    "    fig.update_layout(\n",
-    "        title=f'3D Surface Plot of {z_col}',\n",
-    "        scene=dict(\n",
-    "            xaxis_title=x_col,\n",
-    "            yaxis_title=y_col,\n",
-    "            zaxis_title=z_col,\n",
-    "            camera=dict(\n",
-    "                up=dict(x=0, y=0, z=1),\n",
-    "                center=dict(x=0, y=0, z=0),\n",
-    "                eye=dict(x=1.5, y=1.5, z=1.5)\n",
-    "            )\n",
-    "        ),\n",
-    "        width=900,\n",
-    "        height=700,\n",
-    "        margin=dict(l=65, r=50, b=65, t=90)\n",
-    "    )\n",
-    "\n",
-    "    result.add_figure(\n",
-    "        Figure(\n",
-    "            figure=fig,\n",
-    "            key=\"sensitivity_plot_\" + str(random.randint(0, 1000000)),\n",
-    "            ref_id=result.ref_id,\n",
-    "        )\n",
-    "    )\n",
-    "\n",
-    "    return result"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "87289ee6",
-   "metadata": {},
-   "source": [
-    "Let's evaluates the sensitivity of a model's output to changes in the correlation parameter (rho) and the long-term variance parameter (theta) within a stochastic volatility framework.\n",
-    "\n",
-    "This test is useful for understanding how variations in these parameters affect the model's valuation, which is crucial for risk management and model validation."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "5c0ec52d",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "\n",
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheRhoAndThetaParameters\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [N],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\": [strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": [S0],\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": list(np.linspace(0,0.8, 10)),\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": list(np.linspace(-1,0.8, 10)),\n",
-    "    },\n",
-    "    post_process_fn=two_parameters_stress_surface_plot\n",
-    ")\n",
-    "result.log()\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "44be4c61",
-   "metadata": {},
-   "source": [
-    "##### Rho (correlation) and Xi (vol of vol) stress test"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e0a2996e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "\n",
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheRhoAndXiParameters\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [N],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\": [strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": [S0],\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": list(np.linspace(0,0.8, 10)),\n",
-    "        \"rho\": list(np.linspace(-1,0.8, 10)),\n",
-    "    },\n",
-    "    post_process_fn=two_parameters_stress_surface_plot\n",
-    ")\n",
-    "result.log()\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5fed568d",
-   "metadata": {},
-   "source": [
-    "##### Sigma stress test\n",
-    "evaluates the sensitivity of a model's output to changes in the volatility parameter, sigma. This test is crucial for understanding how variations in market volatility impact the model's valuation of financial instruments, particularly options.\n",
-    "\n",
-    "This test is useful for risk management and model validation, as it helps identify the robustness of the model under different market conditions. By analyzing the changes in the model's output as sigma varies, stakeholders can assess the model's stability and reliability."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "d49e2e37",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheSigmaParameter\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['BS'],\n",
-    "        \"N\": [N],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\": [strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": [S0],\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"sigma\": list(np.linspace(0.2, 0.8, 10)),\n",
-    "    },\n",
-    "    post_process_fn=process_results\n",
-    ")\n",
-    "result.log()\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "4e7a1f00",
-   "metadata": {},
-   "source": [
-    "##### Stress kappa\n",
-    "Let's evaluates the sensitivity of a model's output to changes in the kappa parameter, which is a mean reversion rate in stochastic volatility models."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e995f6ae",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheKappaParameter\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [N],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\": [strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": [S0],\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": list(np.linspace(0, 8, 10)),\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": [-0.5],\n",
-    "    },\n",
-    "    post_process_fn=process_results\n",
-    ")\n",
-    "result.log()\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "40d1c9e2",
-   "metadata": {},
-   "source": [
-    "##### Stress theta\n",
-    "Stress Theta evaluates the sensitivity of a model's output to changes in the parameter theta, which represents the long-term variance in a stochastic volatility model"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "7e371aee",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheThetaParameter\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [N],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\": [strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": [S0],\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": list(np.linspace(0, 0.8, 10)),\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": [-0.5],\n",
-    "    },\n",
-    "    post_process_fn=process_results\n",
-    ")\n",
-    "result.log()\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e20d074f",
-   "metadata": {},
-   "source": [
-    "##### Stress xi\n",
-    "Stress Xi evaluates the sensitivity of a model's output to changes in the parameter xi, which represents the volatility of volatility in a stochastic volatility model. This test is crucial for understanding how variations in xi impact the model's valuation, particularly in financial derivatives pricing."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "9c545090",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheXiParameter\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [N],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\": [strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": [S0],\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": list(np.linspace(0.05, 0.95, 10)),\n",
-    "        \"rho\": [-0.5],\n",
-    "    },\n",
-    "    post_process_fn=process_results\n",
-    ")\n",
-    "result.log()\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f0360e20",
-   "metadata": {},
-   "source": [
-    "##### Stress rho\n",
-    "Stress rho test evaluates the sensitivity of a model's output to changes in the correlation parameter, rho, within a stochastic volatility (SV) model framework. This test is crucial for understanding how variations in rho, which represents the correlation between the asset price and its volatility, impact the model's valuation output."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e2c5dfb1",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheRhoParameter\",\n",
-    "    param_grid={\n",
-    "        \"model_type\": ['SV'],\n",
-    "        \"N\": [N],\n",
-    "        \"M\": [M],\n",
-    "        \"strike\": [strike_range[0]],\n",
-    "        \"barrier\": [barrier_range[0]],\n",
-    "        \"S0\": [S0],\n",
-    "        \"T\": [T],\n",
-    "        \"r\": [r],\n",
-    "        \"v0\": [0.2],\n",
-    "        \"kappa\": [2],\n",
-    "        \"theta\": [0.2],\n",
-    "        \"xi\": [0.1],\n",
-    "        \"rho\": list(np.linspace(-1.0, 1.0, 20)),\n",
-    "    },\n",
-    "    post_process_fn=process_results\n",
-    ")\n",
-    "result.log()\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "61d4e596",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-a23adf093a60485ea005cf8fc18545a5",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "validmind-1QuffXMV-py3.10",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.14"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Quickstart for knockout option pricing model documentation\n",
+        "\n",
+        "Welcome! Let's get you started with the basic process of documenting models with ValidMind.\n",
+        "\n",
+        "A knockout option is a barrier option that ceases to exist if the underlying asset hits a predetermined price, known as the \"barrier.\" This barrier level, set above or below the current market price, determines whether the option will \"knock out\" before its expiration date. There are two types: \"up-and-out\" and \"down-and-out.\" In an up-and-out knockout option, the option expires if the asset price rises above the barrier, while in a down-and-out, it expires if the asset price falls below. Knockout options generally offer a lower premium than standard options since there is a chance they will expire worthless if the barrier is reached.\n",
+        "\n",
+        "Pricing knockout options involves accounting for the proximity of the asset's price to the barrier, as well as market volatility and the option’s time to expiration. High volatility and longer expiry increase the likelihood of the barrier being triggered, which reduces the option’s value. Models like modified Black-Scholes are used for simpler cases, while Monte Carlo simulations or binomial trees handle complex scenarios. Knockout options are useful for hedging or cost-effective investment strategies, allowing investors to save on premiums but with the risk of losing the option entirely if the barrier is hit.\n",
+        "\n",
+        "You will learn how to initialize the ValidMind Library, develop an option pricing model, and then write custom tests that can be used for sensitivity and stress testing to quickly generate documentation about the model."
+      ],
+      "id": "87056cee"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_4__)    \n",
+        "- [Model development](#toc3__)    \n",
+        "- [Data Preparation](#toc4__)    \n",
+        "  - [Synthetic data generation](#toc4_1__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc4_2__)    \n",
+        "  - [Data Quality](#toc4_3__)    \n",
+        "    - [Outliers detection using IQR method](#toc4_3_1__)    \n",
+        "    - [Isolation Forest Outliers Test](#toc4_3_2__)    \n",
+        "  - [Model Calibration](#toc4_4__)    \n",
+        "  - [Synthetic Data Calibration Test](#toc4_5__)    \n",
+        "  - [Model Evaluation](#toc4_6__)    \n",
+        "    - [Benchmark Testing](#toc4_6_1__)    \n",
+        "    - [Sensitivity Testing](#toc4_6_2__)    \n",
+        "    - [Greeks](#toc4_6_3__)    \n",
+        "  - [Delta](#toc4_7__)    \n",
+        "  - [Gamma](#toc4_8__)    \n",
+        "  - [Theta](#toc4_9__)    \n",
+        "  - [Vega](#toc4_10__)    \n",
+        "  - [Rho](#toc4_11__)    \n",
+        "    - [Stress Testing](#toc4_11_1__)    \n",
+        "- [Next steps](#toc5__)    \n",
+        "  - [Work with your model documentation](#toc5_1__)    \n",
+        "  - [Discover more learning resources](#toc5_2__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "7417dfe1"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "1426d212"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "f8812717"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ],
+      "id": "b792f6a9"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "c3d26e61"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ],
+      "id": "f3db6c9b"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ],
+      "id": "e1865b8d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Capital markets`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "214572ff"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "8b9547ad"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0cc9c04c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ],
+      "id": "e928f7e5"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%matplotlib inline\n",
+        "import pandas as pd\n",
+        "import numpy as np\n",
+        "import matplotlib.pyplot as plt\n",
+        "from scipy.optimize import minimize\n",
+        "\n",
+        "from validmind.tests import run_test"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "9edb42a2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
+      ],
+      "id": "a2403294"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "3dfd04dd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Model development"
+      ],
+      "id": "d79d9953"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "class OptionPricing:\n",
+        "    def __init__(self, S0, K, T, r):\n",
+        "        self.S0 = S0\n",
+        "        self.K = K\n",
+        "        self.T = T\n",
+        "        self.r = r\n",
+        "\n",
+        "    def monte_carlo_simulation(self, N, M):\n",
+        "        raise NotImplementedError(\"Must be implemented by subclasses\")\n",
+        "\n",
+        "    def price_option(self, N, M):\n",
+        "        raise NotImplementedError(\"Must be implemented by subclasses\")\n"
+      ],
+      "execution_count": 32,
+      "outputs": [],
+      "id": "c3f5b0b9"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "class BlackScholesModel(OptionPricing):\n",
+        "    def __init__(self, S0, K, T, r, sigma):\n",
+        "        super().__init__(S0, K, T, r)\n",
+        "        self.sigma = sigma\n",
+        "    def monte_carlo_simulation(self, N, M):\n",
+        "        dt = self.T / M\n",
+        "        price_paths = np.zeros((N, M + 1))\n",
+        "        price_paths[:, 0] = self.S0\n",
+        "        for t in range(1, M + 1):\n",
+        "            Z = np.random.standard_normal(N)\n",
+        "            price_paths[:, t] = price_paths[:, t - 1] * np.exp((self.r - 0.5 * self.sigma**2) * dt + self.sigma * np.sqrt(dt) * Z)\n",
+        "        return price_paths\n",
+        "\n",
+        "    def price_option(self, N, M):\n",
+        "        price_paths = self.monte_carlo_simulation(N, M)\n",
+        "        payoffs = np.maximum(price_paths[:, -1] - self.K, 0)\n",
+        "        return np.exp(-self.r * self.T) * np.mean(payoffs)\n",
+        "    \n",
+        "    def calibrate(self, market_prices, strikes, maturities):  # least-squares fit of sigma to market_prices\n",
+        "        def objective_function(params):\n",
+        "            self.sigma = params[0]\n",
+        "            model_prices = []  # fresh list per evaluation; it was never defined before (NameError)\n",
+        "            for K, T in zip(strikes, maturities):\n",
+        "                self.K, self.T = K, T\n",
+        "                model_prices.append(self.price_option(10000, 100))\n",
+        "            return np.sum((np.array(market_prices) - np.array(model_prices))**2)\n",
+        "        result = minimize(objective_function, [self.sigma], bounds=[(0.01, 1.0)])\n",
+        "        self.sigma = result.x[0]\n",
+        "\n",
+        "class StochasticVolatilityModel(OptionPricing):\n",
+        "    def __init__(self, S0, K, T, r, v0, kappa, theta, xi, rho):\n",
+        "        super().__init__(S0, K, T, r)\n",
+        "        self.v0 = v0\n",
+        "        self.kappa = kappa\n",
+        "        self.theta = theta\n",
+        "        self.xi = xi\n",
+        "        self.rho = rho\n",
+        "    def monte_carlo_simulation(self, N, M):\n",
+        "        dt = self.T / M\n",
+        "        price_paths = np.zeros((N, M + 1))\n",
+        "        vol_paths = np.zeros((N, M + 1))\n",
+        "        price_paths[:, 0] = self.S0\n",
+        "        vol_paths[:, 0] = self.v0\n",
+        "        for t in range(1, M + 1):\n",
+        "            Z1 = np.random.standard_normal(N)\n",
+        "            Z2 = np.random.standard_normal(N)\n",
+        "            W1 = Z1\n",
+        "            W2 = self.rho * Z1 + np.sqrt(1 - self.rho**2) * Z2\n",
+        "            vol_paths[:, t] = np.abs(vol_paths[:, t - 1] + self.kappa * (self.theta - vol_paths[:, t - 1]) * dt + self.xi * np.sqrt(vol_paths[:, t - 1] * dt) * W1)\n",
+        "            price_paths[:, t] = price_paths[:, t - 1] * np.exp((self.r - 0.5 * vol_paths[:, t - 1]) * dt + np.sqrt(vol_paths[:, t - 1] * dt) * W2)\n",
+        "        return price_paths\n",
+        "\n",
+        "    def price_option(self, N, M):\n",
+        "        price_paths = self.monte_carlo_simulation(N, M)\n",
+        "        payoffs = np.maximum(price_paths[:, -1] - self.K, 0)\n",
+        "        return np.exp(-self.r * self.T) * np.mean(payoffs)\n",
+        "    \n",
+        "    def calibrate(self, market_prices, strikes, maturities):\n",
+        "        def objective_function(params):\n",
+        "            self.v0, self.kappa, self.theta, self.xi, self.rho = params\n",
+        "            model_prices = []\n",
+        "            for K, T in zip(strikes, maturities):\n",
+        "                self.K = K\n",
+        "                self.T = T\n",
+        "                model_prices.append(self.price_option(10000, 100))\n",
+        "\n",
+        "            return np.sum((np.array(market_prices) - np.array(model_prices))**2)\n",
+        "        \n",
+        "        initial_guess = [self.v0, self.kappa, self.theta, self.xi, self.rho]\n",
+        "        bounds = [(0.01, 1.0), (0.01, 5.0), (0.01, 1.0), (0.01, 1.0), (-1.0, 1.0)]\n",
+        "        result = minimize(objective_function, initial_guess, bounds=bounds)\n",
+        "        self.v0, self.kappa, self.theta, self.xi, self.rho = result.x\n",
+        "\n",
+        "\n",
+        "class KnockoutOption:\n",
+        "    def __init__(self, model, S0, K, T, r, barrier):\n",
+        "        self.model = model\n",
+        "        self.S0 = S0\n",
+        "        self.K = K\n",
+        "        self.T = T\n",
+        "        self.r = r\n",
+        "        self.barrier = barrier\n",
+        "\n",
+        "    def price_knockout_option(self, N, M):\n",
+        "        dt = self.T / M\n",
+        "        price_paths = np.zeros((N, M + 1))\n",
+        "        vol_paths = np.zeros((N, M + 1)) if isinstance(self.model, StochasticVolatilityModel) else None\n",
+        "        price_paths[:, 0] = self.S0\n",
+        "        if vol_paths is not None:\n",
+        "            vol_paths[:, 0] = self.model.v0\n",
+        "        \n",
+        "        for t in range(1, M + 1):\n",
+        "            Z1 = np.random.standard_normal(N)\n",
+        "            if vol_paths is None:\n",
+        "                # Black-Scholes Model\n",
+        "                price_paths[:, t] = price_paths[:, t - 1] * np.exp(\n",
+        "                    (self.r - 0.5 * self.model.sigma**2) * dt + self.model.sigma * np.sqrt(dt) * Z1\n",
+        "                )\n",
+        "            else:\n",
+        "                # Stochastic Volatility Model\n",
+        "                Z2 = np.random.standard_normal(N)\n",
+        "                W1 = Z1\n",
+        "                W2 = self.model.rho * Z1 + np.sqrt(1 - self.model.rho**2) * Z2\n",
+        "                vol_paths[:, t] = np.abs(vol_paths[:, t - 1] + self.model.kappa * (self.model.theta - vol_paths[:, t - 1]) * dt + self.model.xi * np.sqrt(vol_paths[:, t - 1] * dt) * W1)\n",
+        "                price_paths[:, t] = price_paths[:, t - 1] * np.exp(\n",
+        "                    (self.r - 0.5 * vol_paths[:, t - 1]) * dt + np.sqrt(vol_paths[:, t - 1] * dt) * W2\n",
+        "                )\n",
+        "            \n",
+        "            # Knockout condition\n",
+        "            price_paths[:, t][price_paths[:, t] >= self.barrier] = 0\n",
+        "        payoffs = np.maximum(price_paths[:, -1] - self.K, 0)\n",
+        "        return np.exp(-self.r * self.T) * np.mean(payoffs)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "a9d7f832"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Data Preparation"
+      ],
+      "id": "14bcdbb9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Synthetic data generation"
+      ],
+      "id": "f655dc9c"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def generate_synthetic_market_data(model, strikes, maturities):\n",
+        "    # Returns (list of prices, list of {strike, option_price} rows), one entry per (strike, maturity) pair\n",
+        "    market_prices, market_data = [], []\n",
+        "    for K, T in zip(strikes, maturities):\n",
+        "        model.K, model.T = K, T\n",
+        "        price = model.price_option(10000, 100)  # price once so both outputs report the same estimate\n",
+        "        market_prices.append(price)\n",
+        "        market_data.append({\"strike\": K, \"option_price\": price})\n",
+        "    return market_prices, market_data\n"
+      ],
+      "execution_count": 34,
+      "outputs": [],
+      "id": "42cb9070"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "N = 10000\n",
+        "M = 100\n",
+        "\n",
+        "# Parameters for synthetic data\n",
+        "S0 = 100\n",
+        "K = 100\n",
+        "T = 1\n",
+        "r = 0.05\n",
+        "# Black-Scholes\n",
+        "true_sigma = 0.2\n",
+        "\n",
+        "# Stochastic Volatility\n",
+        "true_v0 = 0.2\n",
+        "true_kappa = 2.0\n",
+        "true_theta = 0.2\n",
+        "true_xi = 0.1\n",
+        "true_rho = -0.5\n",
+        "\n",
+        "# Synthetic data generation parameters\n",
+        "strikes = list(np.linspace(75, 130, 25))\n",
+        "maturities = list(np.linspace(0.2, 3.0, 25))\n",
+        "\n",
+        "# Generate synthetic market data using the true parameters\n",
+        "bs_model = BlackScholesModel(S0, K, T, r, true_sigma)\n",
+        "bs_market_prices, bs_market_data = generate_synthetic_market_data(bs_model, strikes, maturities)\n",
+        "\n",
+        "\n",
+        "sv_model = StochasticVolatilityModel(S0, K, T, r, true_v0, true_kappa, true_theta, true_xi, true_rho)\n",
+        "sv_market_prices, sv_market_data = generate_synthetic_market_data(sv_model, strikes, maturities)\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "2854fbe3"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module."
+      ],
+      "id": "b54c4950"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "bs_market_data_df = pd.DataFrame(bs_market_data)\n",
+        "vm_bs_market_data = vm.init_dataset(\n",
+        "    dataset=bs_market_data_df,\n",
+        "    input_id=\"bs_market_data\",  # distinct id; it previously reused the stochastic-volatility dataset's id\n",
+        ")\n",
+        "\n",
+        "sv_market_data_df = pd.DataFrame(sv_market_data)\n",
+        "vm_sv_market_data = vm.init_dataset(\n",
+        "    dataset=sv_market_data_df,\n",
+        "    input_id=\"sv_market_data\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "7f3498dd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Data Quality\n",
+        "Let's check the quality of the data using outlier and missing-value tests."
+      ],
+      "id": "7b36b59c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3_1__'></a>\n",
+        "\n",
+        "#### Outliers detection using IQR method\n",
+        "Let's visualize the distribution of outliers in the `option_price` feature using the Interquartile Range (IQR) method."
+      ],
+      "id": "671330b1"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"validmind.data_validation.IQROutliersBarPlot:BlackScholes\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_bs_market_data,\n",
+        "    },\n",
+        "    title=\"Outliers detection using IQR method for BlackScholes\",\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "f1c1ab6f"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"validmind.data_validation.IQROutliersTable:BlackScholes\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_bs_market_data,\n",
+        "    },\n",
+        "    title=\"Outliers table using IQR method for BlackScholes\",\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "6b5e8654"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"validmind.data_validation.IQROutliersBarPlot:StochasticVolatility\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_sv_market_data,\n",
+        "    },\n",
+        "    title=\"Outliers detection using IQR method for StochasticVolatility\",\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "d96f10c7"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"validmind.data_validation.IQROutliersTable:StochasticVolatility\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_sv_market_data,\n",
+        "    },\n",
+        "    title=\"Outliers table using IQR method for StochasticVolatility\",\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "758c4c57"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3_2__'></a>\n",
+        "\n",
+        "#### Isolation Forest Outliers Test\n",
+        "Let's detect anomalies in the dataset using the Isolation Forest algorithm, visualized through scatter plots."
+      ],
+      "id": "b1430200"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"validmind.data_validation.IsolationForestOutliers:BlackScholes\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_bs_market_data,\n",
+        "    },\n",
+        "    title=\"Outliers detection using Isolation Forest for BlackScholes\",\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "9eb91453"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"validmind.data_validation.IsolationForestOutliers:StochasticVolatility\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_sv_market_data,\n",
+        "    },\n",
+        "    title=\"Outliers detection using Isolation Forest for StochasticVolatility\",\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "12940f8e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Missing Values Test\n",
+        "Let's evaluate dataset quality by ensuring the missing value ratio across all features does not exceed a set threshold."
+      ],
+      "id": "f30e5579"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"validmind.data_validation.MissingValues:BlackScholes\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_bs_market_data,\n",
+        "    },\n",
+        "    title=\"Missing Values detection for BlackScholes\",\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "805ddb1c"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "result = run_test(\n",
+        "    \"validmind.data_validation.MissingValues:StochasticVolatility\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_sv_market_data,\n",
+        "    },\n",
+        "    title=\"MissingValues detection for StochasticVolatility\",\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e69e0039"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4__'></a>\n",
+        "\n",
+        "### Model Calibration\n",
+        "* Clearly state the purpose of the calibration process. For example, in the context of an option pricing model, calibration aims to adjust model parameters to fit market data (e.g., market option prices, volatility surfaces).\n",
+        "* Specify whether the calibration is to historical data, current market data, or a blend of both."
+      ],
+      "id": "09628809"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.SyntheticDataCalibrationTest\")\n",
+        "def generate_synthetic_data_summary(option_pricing_model, strikes, maturities, synthetic_prices):\n",
+        "    \"\"\"\n",
+        "    This function will use synthetic prices to calibrate each model\n",
+        "    and then generate derived prices based on the calibrated parameters.\n",
+        "    It will output a DataFrame summarizing the strikes, maturities,\n",
+        "    synthetic and derived prices, and the model parameters.\n",
+        "\n",
+        "    \"\"\"\n",
+        "    derived_prices = []\n",
+        "    for K, T in zip(strikes, maturities):\n",
+        "        option_pricing_model.K = K\n",
+        "        option_pricing_model.T = T\n",
+        "        derived_prices.append(option_pricing_model.price_option(10000, 100))\n",
+        "    \n",
+        "    model_type = type(option_pricing_model).__name__\n",
+        "    data = {\n",
+        "        \"Strike\": strikes,\n",
+        "        \"Maturity\": maturities,\n",
+        "        \"Synthetic_Price\": synthetic_prices,\n",
+        "        \"Derived_Price\": derived_prices,\n",
+        "        \"Model_Type\": model_type,\n",
+        "        \"S0\": [option_pricing_model.S0] * len(strikes),\n",
+        "        \"K\": [option_pricing_model.K] * len(strikes),\n",
+        "        \"T\": [option_pricing_model.T] * len(strikes),\n",
+        "        \"r\": [option_pricing_model.r] * len(strikes)\n",
+        "    }\n",
+        "    \n",
+        "    if model_type == \"BlackScholesModel\":\n",
+        "        data[\"sigma\"] = [option_pricing_model.sigma] * len(strikes)\n",
+        "    elif model_type == \"StochasticVolatilityModel\":\n",
+        "        data[\"v0\"] = [option_pricing_model.v0] * len(strikes)\n",
+        "        data[\"kappa\"] = [option_pricing_model.kappa] * len(strikes)\n",
+        "        data[\"theta\"] = [option_pricing_model.theta] * len(strikes)\n",
+        "        data[\"xi\"] = [option_pricing_model.xi] * len(strikes)\n",
+        "        data[\"rho\"] = [option_pricing_model.rho] * len(strikes)\n",
+        "    \n",
+        "    df = pd.DataFrame(data)\n",
+        "    return df\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "6802c26e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_5__'></a>\n",
+        "\n",
+        "### Synthetic Data Calibration Test\n",
+        "Let's evaluate the accuracy of a stochastic volatility model by comparing synthetic prices with derived prices after model calibration."
+      ],
+      "id": "3bf04d21"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.SyntheticDataCalibrationTest\",\n",
+        "    params={\n",
+        "        \"option_pricing_model\": sv_model,\n",
+        "        \"strikes\": strikes,\n",
+        "        \"maturities\": maturities,\n",
+        "        \"synthetic_prices\": sv_market_prices\n",
+        "    },\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "4345cb5c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_6__'></a>\n",
+        "\n",
+        "### Model Evaluation"
+      ],
+      "id": "4d48f107"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_6_1__'></a>\n",
+        "\n",
+        "#### Benchmark Testing\n",
+        "* Compare the model’s performance with alternative models or industry-standard models to assess its relative effectiveness.\n",
+        "* Ensure that the model is competitive in pricing, accuracy, and computational efficiency."
+      ],
+      "id": "8ec8b5a3"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.BenchmarkTest\")\n",
+        "def benchmark_test(bs_model, sv_model, strikes, maturities):\n",
+        "    \"\"\"\n",
+        "    Comparison between Black Scholes and stochastic volatility model\n",
+        "\n",
+        "    \"\"\"\n",
+        "    bs_model_type = type(bs_model).__name__\n",
+        "    sv_model_type = type(sv_model).__name__\n",
+        "\n",
+        "    bs_derived_prices = []\n",
+        "    sv_derived_prices = []\n",
+        "    for K in strikes:\n",
+        "        bs_model.K = K\n",
+        "        bs_derived_prices.append(bs_model.price_option(10000, 100))\n",
+        "        sv_model.K = K\n",
+        "        sv_derived_prices.append(sv_model.price_option(10000, 100))\n",
+        "\n",
+        "    data = {\n",
+        "        \"Strike\": strikes,\n",
+        "        \"Maturities\": [sv_model.T] * len(strikes),\n",
+        "        \"bs_model_price\": bs_derived_prices,\n",
+        "        \"sv_model_price\": sv_derived_prices,\n",
+        "\n",
+        "    }\n",
+        "    df1 = pd.DataFrame(data)\n",
+        "\n",
+        "    bs_derived_prices = []\n",
+        "    sv_derived_prices = []\n",
+        "    for T in maturities:\n",
+        "        bs_model.T = T\n",
+        "        bs_derived_prices.append(bs_model.price_option(10000, 100))\n",
+        "        sv_model.T = T\n",
+        "        sv_derived_prices.append(sv_model.price_option(10000, 100))\n",
+        "\n",
+        "    data = {\n",
+        "        \"Strike\": [sv_model.K] * len(maturities),\n",
+        "        \"Maturities\": maturities,\n",
+        "        \"bs_model_price\": bs_derived_prices,\n",
+        "        \"sv_model_price\": sv_derived_prices,\n",
+        "    }\n",
+        "\n",
+        "    df2 = pd.DataFrame(data)\n",
+        "\n",
+        "    return {\"strikes variation benchmarking\": df1}, {\"maturities variation benchmarking\": df2}"
+      ],
+      "execution_count": 47,
+      "outputs": [],
+      "id": "ac733262"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.BenchmarkTest\",\n",
+        "    params={\n",
+        "        \"sv_model\": sv_model,\n",
+        "        \"bs_model\": bs_model,\n",
+        "        \"strikes\": strikes,\n",
+        "        \"maturities\": maturities,\n",
+        "    },\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "20de9858"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Surface Volatility Test\n",
+        "Let's calculate the implied volatility across different strikes and maturities based on market prices."
+      ],
+      "id": "d9ad15b8"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import numpy as np\n",
+        "import pandas as pd\n",
+        "from scipy.optimize import minimize\n",
+        "import plotly.graph_objects as go\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.ImpliedVolSurface\")\n",
+        "def implied_vol_surface(market_prices, strikes, maturities, S0, r, barrier, N=10000, M=100):\n",
+        "    \"\"\"\n",
+        "    This is a test to compute the implied volatility surface for a given set of market prices,\n",
+        "    strikes, and maturities.\n",
+        "    \"\"\"\n",
+        "    def implied_volatility(market_price, N, M, initial_guess=0.2):\n",
+        "        def objective_function(sigma):\n",
+        "            model.sigma = sigma\n",
+        "            model_price = model.price_option(N, M)\n",
+        "            return (model_price - market_price) ** 2\n",
+        "\n",
+        "        result = minimize(objective_function, initial_guess, bounds=[(0.01, 1.0)])\n",
+        "        return result.x[0]\n",
+        "    \n",
+        "    implied_vols = np.zeros((len(strikes), len(maturities)))\n",
+        "\n",
+        "    for i, K in enumerate(strikes):\n",
+        "        for j, T in enumerate(maturities):\n",
+        "            market_price = market_prices[i]\n",
+        "            model = BlackScholesModel(S0, K, T, r, sigma=0.2)\n",
+        "\n",
+        "            implied_vol = implied_volatility(market_price, N, M)\n",
+        "            implied_vols[i, j] = implied_vol\n",
+        "\n",
+        "    # Create the 3D surface plot\n",
+        "    X, Y = np.meshgrid(strikes, maturities)\n",
+        "    Z = implied_vols.T  # Transpose to match the meshgrid orientation\n",
+        "\n",
+        "    fig = go.Figure(data=[go.Surface(x=X, y=Y, z=Z)])\n",
+        "    \n",
+        "    # Update the layout\n",
+        "    fig.update_layout(\n",
+        "        title=f'3D Surface Plot of Implied Volatility',\n",
+        "        scene=dict(\n",
+        "            xaxis_title='Strike',\n",
+        "            yaxis_title='Maturity',\n",
+        "            zaxis_title='Implied Volatility',\n",
+        "            camera=dict(\n",
+        "                up=dict(x=0, y=0, z=1),\n",
+        "                center=dict(x=0, y=0, z=0),\n",
+        "                eye=dict(x=1.5, y=1.5, z=1.5)\n",
+        "            )\n",
+        "        ),\n",
+        "        width=900,\n",
+        "        height=700,\n",
+        "        margin=dict(l=65, r=50, b=65, t=90)\n",
+        "    )\n",
+        "\n",
+        "    return fig"
+      ],
+      "execution_count": 49,
+      "outputs": [],
+      "id": "46e275e3"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.ImpliedVolSurface\",\n",
+        "    params={\n",
+        "        \"market_prices\": sv_market_prices,\n",
+        "        \"strikes\": strikes,\n",
+        "        \"maturities\": maturities,\n",
+        "        \"S0\": S0,\n",
+        "        \"r\": r,\n",
+        "        \"barrier\": 120\n",
+        "    }\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "66ca002a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_6_2__'></a>\n",
+        "\n",
+        "#### Sensitivity Testing"
+      ],
+      "id": "a49d8a1e"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "@vm.test(\"my_custom_tests.Sensitivity\")\n",
+        "def sensitivity_test(model_type, S0, T, r, N, M, strike=None, barrier=None, sigma=None, v0=None, kappa=None,theta=None, xi=None, rho=None):\n",
+        "    \"\"\"\n",
+        "    This is sensitivity test\n",
+        "\"\"\"\n",
+        "    if model_type == 'BS':\n",
+        "        model = BlackScholesModel(S0, strike, T, r, sigma)\n",
+        "    else:\n",
+        "        model = StochasticVolatilityModel(S0, strike, T, r, v0, kappa, theta, xi, rho)\n",
+        "    \n",
+        "    knockout_option = KnockoutOption(model, S0, strike, T, r, barrier)\n",
+        "    price = knockout_option.price_knockout_option(N, M)\n",
+        "\n",
+        "    return pd.DataFrame({\"Option price\": [price]})"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "784a5e7c"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Initialize parameters"
+      ],
+      "id": "d4be30e6"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "strike_range = (min(strikes), max(strikes))\n",
+        "barrier_range = (100, 120)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "46878b84"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Common plot function\n",
+        "Let's create a line plot using the default result output data and log it by passing the function through the `post_process_fn` parameter in the `run_test()` method."
+      ],
+      "id": "205c46ce"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from plotly.express import bar\n",
+        "from validmind.vm_models.figure import Figure\n",
+        "from validmind.vm_models.result import TestResult\n",
+        "import plotly.graph_objects as go\n",
+        "import random\n",
+        "\n",
+        "def process_results(result: TestResult):\n",
+        "\n",
+        "    # Convert to DataFrame\n",
+        "    df = pd.DataFrame(result.tables[0].data)\n",
+        "    \n",
+        "    # Get the first two column names\n",
+        "    x_col = df.columns[0]\n",
+        "    y_col = df.columns[1]\n",
+        "    \n",
+        "    # Create figure\n",
+        "    fig = go.Figure()\n",
+        "    fig.add_trace(\n",
+        "        go.Scatter(\n",
+        "            x=df[x_col],\n",
+        "            y=df[y_col],\n",
+        "            mode='lines',\n",
+        "            name=y_col  # Use y-axis column name as trace name\n",
+        "        )\n",
+        "    )\n",
+        "    \n",
+        "    fig.update_layout(\n",
+        "        xaxis_title=x_col,\n",
+        "        yaxis_title=y_col,\n",
+        "        showlegend=True,\n",
+        "        template=\"plotly_white\"\n",
+        "    )\n",
+        "\n",
+        "    result.add_figure(\n",
+        "        Figure(\n",
+        "            figure=fig,\n",
+        "            key=\"sensitivity_plot_\" + str(random.randint(0, 1000000)),\n",
+        "            ref_id=result.ref_id,\n",
+        "        )\n",
+        "    )\n",
+        "\n",
+        "    return result"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "d4b9ea2f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Strike sensitivity Test\n",
+        "Let's evaluate the sensitivity of a model's output value to changes in the strike price, while keeping other parameters constant.\n",
+        "This test is crucial for understanding how variations in strike prices affect the valuation of financial derivatives, particularly options."
+      ],
+      "id": "528b409c"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Sensitivity:S0\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [N],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\":[strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": [-0.5],\n",
+        "    },\n",
+        "    post_process_fn= process_results\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "bb8f1cab"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Sensitivity:ToStrike\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [N],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\": list(np.linspace(strike_range[0], strike_range[1], 20)),\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": [S0],\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": [-0.5],\n",
+        "    },\n",
+        "    post_process_fn= process_results\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e566a681"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Barrier Sensitivity Test\n",
+        "Let's evaluate the sensitivity of a model's output to changes in the barrier level of a financial derivative, specifically a barrier option. This test is crucial for understanding how small changes in the barrier can impact the option's valuation, which is essential for risk management and pricing strategies."
+      ],
+      "id": "0f288663"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Sensitivity:ToBarrier\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [N],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\": [strike_range[0]],\n",
+        "        \"barrier\": list(np.linspace(barrier_range[0], barrier_range[1], 20)),\n",
+        "        \"S0\": [S0],\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": [-0.5],\n",
+        "    },\n",
+        "    post_process_fn=process_results\n",
+        "\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "95f81283"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_6_3__'></a>\n",
+        "\n",
+        "#### Greeks\n",
+        "The Greeks are crucial for traders and risk managers as they provide insights into the risk and potential price movements of options and derivatives, allowing for more informed decision-making and risk management strategies."
+      ],
+      "id": "3201aa09"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_7__'></a>\n",
+        "\n",
+        "### Delta\n",
+        "Delta measures the sensitivity of the option's price to a change in the price of the underlying asset. It indicates how much the price of an option is expected to move per $1 change in the underlying asset's price."
+      ],
+      "id": "f31afc73"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.GreeksDelta\")\n",
+        "def calculate_delta(model_type, S0, T, r, N, M, strike=None, barrier=None, \n",
+        "                   sigma=None, v0=None, kappa=None, theta=None, xi=None, rho=None, \n",
+        "                   h=0.001):  # h is the step size for finite difference\n",
+        "    \"\"\"\n",
+        "    Calculate delta using finite difference method.\n",
+        "    Delta = (V(S0 + h) - V(S0 - h)) / (2h)\n",
+        "    where V is the option price and h is a small increment\n",
+        "    \"\"\"\n",
+        "    # Initialize the models with S0 + h and S0 - h\n",
+        "    if model_type == 'BS':\n",
+        "        model_up = BlackScholesModel(S0 + h, strike, T, r, sigma)\n",
+        "        model_down = BlackScholesModel(S0 - h, strike, T, r, sigma)\n",
+        "    else:\n",
+        "        model_up = StochasticVolatilityModel(S0 + h, strike, T, r, v0, kappa, theta, xi, rho)\n",
+        "        model_down = StochasticVolatilityModel(S0 - h, strike, T, r, v0, kappa, theta, xi, rho)\n",
+        "    \n",
+        "\n",
+        "    # Calculate option prices for up and down moves\n",
+        "    knockout_up = KnockoutOption(model_up, S0 + h, strike, T, r, barrier)\n",
+        "    knockout_down = KnockoutOption(model_down, S0 - h, strike, T, r, barrier)\n",
+        "    \n",
+        "    price_up = knockout_up.price_knockout_option(N, M)\n",
+        "    price_down = knockout_down.price_knockout_option(N, M)\n",
+        "    \n",
+        "    # Calculate delta using central difference\n",
+        "    delta = (price_up - price_down) / (2 * h)\n",
+        "    df = pd.DataFrame({\"Delta\": [delta], \"Price_Up\": [price_up], \"Price_Down\": [price_down], \"h\": [h]})\n",
+        "    return df\n",
+        "\n"
+      ],
+      "execution_count": 30,
+      "outputs": [],
+      "id": "31befc58"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# To analyze delta sensitivity to underlying price changes\n",
+        "result = run_test(\n",
+        "    \"my_custom_tests.GreeksDelta\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [1000000],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\":[strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": [-0.5],\n",
+        "        \"h\": [0.001]\n",
+        "    },\n",
+        "post_process_fn=process_results  # Using the plotting function defined earlier\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "a033dd96"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_8__'></a>\n",
+        "\n",
+        "### Gamma\n",
+        "Gamma measures the rate of change of Delta with respect to changes in the underlying asset's price. It indicates the curvature of the option's price relative to the underlying asset's price."
+      ],
+      "id": "0826d4dc"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.GreeksGamma\")\n",
+        "def calculate_gamma(model_type, S0, T, r, N, M, strike=None, barrier=None, \n",
+        "                   sigma=None, v0=None, kappa=None, theta=None, xi=None, rho=None, \n",
+        "                   h=0.01):  # h is the step size for finite difference\n",
+        "    \"\"\"\n",
+        "    Calculate gamma using finite difference method.\n",
+        "    Gamma = (V(S0 + h) - 2V(S0) + V(S0 - h)) / h^2\n",
+        "    where V is the option price and h is a small increment\n",
+        "    \"\"\"\n",
+        "    # Initialize the models with S0 + h, S0, and S0 - h\n",
+        "    if model_type == 'BS':\n",
+        "        model_up = BlackScholesModel(S0 + h, strike, T, r, sigma)\n",
+        "        model_center = BlackScholesModel(S0, strike, T, r, sigma)\n",
+        "        model_down = BlackScholesModel(S0 - h, strike, T, r, sigma)\n",
+        "    else:\n",
+        "        model_up = StochasticVolatilityModel(S0 + h, strike, T, r, v0, kappa, theta, xi, rho)\n",
+        "        model_center = StochasticVolatilityModel(S0, strike, T, r, v0, kappa, theta, xi, rho)\n",
+        "        model_down = StochasticVolatilityModel(S0 - h, strike, T, r, v0, kappa, theta, xi, rho)\n",
+        "    \n",
+        "    # Calculate option prices for up, center, and down moves\n",
+        "    knockout_up = KnockoutOption(model_up, S0 + h, strike, T, r, barrier)\n",
+        "    knockout_center = KnockoutOption(model_center, S0, strike, T, r, barrier)\n",
+        "    knockout_down = KnockoutOption(model_down, S0 - h, strike, T, r, barrier)\n",
+        "    \n",
+        "    price_up = knockout_up.price_knockout_option(N, M)\n",
+        "    price_center = knockout_center.price_knockout_option(N, M)\n",
+        "    price_down = knockout_down.price_knockout_option(N, M)\n",
+        "    \n",
+        "    # Calculate gamma using second-order central difference\n",
+        "    gamma = (price_up - 2*price_center + price_down) / (h * h)\n",
+        "    \n",
+        "    df = pd.DataFrame({\n",
+        "        \"Gamma\": [gamma], \n",
+        "        \"Price_Up\": [price_up], \n",
+        "        \"Price_Center\": [price_center],\n",
+        "        \"Price_Down\": [price_down], \n",
+        "        \"h\": [h]\n",
+        "    })\n",
+        "    return df\n",
+        "\n",
+        "# To analyze gamma sensitivity to underlying price changes\n",
+        "result = run_test(\n",
+        "    \"my_custom_tests.GreeksGamma\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [1000000],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\":[strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": [-0.5],\n",
+        "        \"h\": [0.1]\n",
+        "    },\n",
+        "    post_process_fn=process_results  # Using the plotting function defined earlier\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "ccf54452"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_9__'></a>\n",
+        "\n",
+        "### Theta\n",
+        "Theta measures the sensitivity of the option's price to the passage of time, also known as time decay. It indicates how much the price of an option is expected to decrease as the option approaches its expiration date."
+      ],
+      "id": "df0eaa72"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.GreeksTheta\")\n",
+        "def calculate_theta(model_type, S0, T, r, N, M, strike=None, barrier=None, \n",
+        "                   sigma=None, v0=None, kappa=None, theta=None, xi=None, rho=None, \n",
+        "                   dt=1/365):  # dt is typically one day\n",
+        "    \"\"\"\n",
+        "    Calculate theta using finite difference method.\n",
+        "    Theta = (V(t + dt) - V(t)) / dt\n",
+        "    where V is the option price and dt is a small time increment (typically 1 day)\n",
+        "    \"\"\"\n",
+        "    # Initialize the models with T and T + dt\n",
+        "    if model_type == 'BS':\n",
+        "        model_current = BlackScholesModel(S0, strike, T, r, sigma)\n",
+        "        model_future = BlackScholesModel(S0, strike, T + dt, r, sigma)\n",
+        "    else:\n",
+        "        model_current = StochasticVolatilityModel(S0, strike, T, r, v0, kappa, theta, xi, rho)\n",
+        "        model_future = StochasticVolatilityModel(S0, strike, T + dt, r, v0, kappa, theta, xi, rho)\n",
+        "    \n",
+        "    # Calculate option prices for current and future time\n",
+        "    knockout_current = KnockoutOption(model_current, S0, strike, T, r, barrier)\n",
+        "    knockout_future = KnockoutOption(model_future, S0, strike, T + dt, r, barrier)\n",
+        "    \n",
+        "    price_current = knockout_current.price_knockout_option(N, M)\n",
+        "    price_future = knockout_future.price_knockout_option(N, M)\n",
+        "    \n",
+        "    # Calculate theta using forward difference\n",
+        "    # Note: We divide by dt and multiply by -1 since theta represents the negative rate of change\n",
+        "    theta_value = -1 * (price_future - price_current) / dt\n",
+        "    \n",
+        "    df = pd.DataFrame({\n",
+        "        \"Theta\": [theta_value], \n",
+        "        \"Price_Current\": [price_current],\n",
+        "        \"Price_Future\": [price_future],\n",
+        "        \"dt\": [dt]\n",
+        "    })\n",
+        "    return df\n",
+        "\n",
+        "# Example usage to analyze theta sensitivity across different underlying prices\n",
+        "result = run_test(\n",
+        "    \"my_custom_tests.GreeksTheta\",\n",
+        "    param_grid={\n",
+        "               \"model_type\": ['SV'],\n",
+        "        \"N\": [1000000],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\":[strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": [-0.5],\n",
+        "        \"dt\": [1/365]  # One day time step\n",
+        "    },\n",
+        "    post_process_fn=process_results  # Using the plotting function defined earlier\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0e9810b1"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_10__'></a>\n",
+        "\n",
+        "### Vega\n",
+        "Vega measures the sensitivity of the option's price to changes in the volatility of the underlying asset. It indicates how much the price of an option is expected to change with a 1% change in the underlying asset's volatility."
+      ],
+      "id": "28c60e1d"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.GreeksVega\")\n",
+        "def calculate_vega(model_type, S0, T, r, N, M, strike=None, barrier=None, \n",
+        "                  sigma=None, v0=None, kappa=None, theta=None, xi=None, rho=None, \n",
+        "                  h=0.001):  # h is the step size for finite difference\n",
+        "    \"\"\"\n",
+        "    Calculate vega using finite difference method.\n",
+        "    For Black-Scholes: Vega = (V(σ + h) - V(σ - h)) / (2h)\n",
+        "    For Stochastic Vol: Vega = (V(v0 + h) - V(v0 - h)) / (2h)\n",
+        "    where V is the option price and h is a small increment in volatility\n",
+        "    \"\"\"\n",
+        "    if model_type == 'BS':\n",
+        "        # For Black-Scholes, perturb sigma\n",
+        "        model_up = BlackScholesModel(S0, strike, T, r, sigma + h)\n",
+        "        model_down = BlackScholesModel(S0, strike, T, r, sigma - h)\n",
+        "    else:\n",
+        "        # For Stochastic Volatility, perturb v0\n",
+        "        model_up = StochasticVolatilityModel(S0, strike, T, r, v0 + h, kappa, theta, xi, rho)\n",
+        "        model_down = StochasticVolatilityModel(S0, strike, T, r, v0 - h, kappa, theta, xi, rho)\n",
+        "    \n",
+        "    # Calculate option prices for up and down moves in volatility\n",
+        "    knockout_up = KnockoutOption(model_up, S0, strike, T, r, barrier)\n",
+        "    knockout_down = KnockoutOption(model_down, S0, strike, T, r, barrier)\n",
+        "    \n",
+        "    price_up = knockout_up.price_knockout_option(N, M)\n",
+        "    price_down = knockout_down.price_knockout_option(N, M)\n",
+        "    \n",
+        "    # Calculate vega using central difference\n",
+        "    vega = (price_up - price_down) / (2 * h)\n",
+        "    \n",
+        "    df = pd.DataFrame({\n",
+        "        \"Vega\": [vega], \n",
+        "        \"Price_Up\": [price_up], \n",
+        "        \"Price_Down\": [price_down], \n",
+        "        \"h\": [h]\n",
+        "    })\n",
+        "    return df\n",
+        "\n",
+        "# Example usage to analyze vega sensitivity across different underlying prices\n",
+        "result = run_test(\n",
+        "    \"my_custom_tests.GreeksVega\",\n",
+        "    param_grid={\n",
+        "                \"model_type\": ['SV'],\n",
+        "        \"N\": [1000000],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\":[strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": [-0.5],\n",
+        "        \"h\": [0.0001]  # Small step size for better accuracy\n",
+        "    },\n",
+        "    post_process_fn=process_results  # Using the plotting function defined earlier\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "1dbc6632"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_11__'></a>\n",
+        "\n",
+        "### Rho\n",
+        "Rho measures the sensitivity of the option's price to changes in the interest rate. It indicates how much the price of an option is expected to change with a 1% change in interest rates."
+      ],
+      "id": "1ec51eba"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.GreeksRho\")\n",
+        "def calculate_rho(model_type, S0, T, r, N, M, strike=None, barrier=None, \n",
+        "                 sigma=None, v0=None, kappa=None, theta=None, xi=None, rho=None, \n",
+        "                 h=0.0001):  # h is the step size for finite difference\n",
+        "    \"\"\"\n",
+        "    Calculate rho using finite difference method.\n",
+        "    Rho = (V(r + h) - V(r - h)) / (2h)\n",
+        "    where V is the option price and h is a small increment in interest rate\n",
+        "    \"\"\"\n",
+        "    # Initialize the models with r + h and r - h\n",
+        "    if model_type == 'BS':\n",
+        "        model_up = BlackScholesModel(S0, strike, T, r + h, sigma)\n",
+        "        model_down = BlackScholesModel(S0, strike, T, r - h, sigma)\n",
+        "    else:\n",
+        "        model_up = StochasticVolatilityModel(S0, strike, T, r + h, v0, kappa, theta, xi, rho)\n",
+        "        model_down = StochasticVolatilityModel(S0, strike, T, r - h, v0, kappa, theta, xi, rho)\n",
+        "    \n",
+        "    # Calculate option prices for up and down moves in interest rate\n",
+        "    knockout_up = KnockoutOption(model_up, S0, strike, T, r + h, barrier)\n",
+        "    knockout_down = KnockoutOption(model_down, S0, strike, T, r - h, barrier)\n",
+        "    \n",
+        "    price_up = knockout_up.price_knockout_option(N, M)\n",
+        "    price_down = knockout_down.price_knockout_option(N, M)\n",
+        "    \n",
+        "    # Calculate rho using central difference\n",
+        "    rho_value = (price_up - price_down) / (2 * h)\n",
+        "    \n",
+        "    df = pd.DataFrame({\n",
+        "        \"Rho\": [rho_value], \n",
+        "        \"Price_Up\": [price_up], \n",
+        "        \"Price_Down\": [price_down], \n",
+        "        \"h\": [h]\n",
+        "    })\n",
+        "    return df\n",
+        "\n",
+        "# Example usage to analyze rho sensitivity across different underlying prices\n",
+        "result = run_test(\n",
+        "    \"my_custom_tests.GreeksRho\",\n",
+        "    param_grid={\n",
+        "               \"model_type\": ['SV'],\n",
+        "        \"N\": [1000000],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\":[strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": list(np.linspace(S0-20, S0+20, 20)),\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": [-0.5],\n",
+        "        \"h\": [0.0001]  # Small step size for better accuracy\n",
+        "    },\n",
+        "    post_process_fn=process_results  # Using the plotting function defined earlier\n",
+        ")\n",
+        "result.log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "2f497b5f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_11_1__'></a>\n",
+        "\n",
+        "#### Stress Testing"
+      ],
+      "id": "0cdd1b1b"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.Stressing\")\n",
+        "def sensitivity_test(model_type, S0, T, r, N, M, strike=None, barrier=None, sigma=None, v0=None, kappa=None,theta=None, xi=None, rho=None):\n",
+        "    \"\"\"\n",
+        "    This is stress test\n",
+        "    \"\"\"\n",
+        "    if model_type == 'BS':\n",
+        "        model = BlackScholesModel(S0, strike, T, r, sigma)\n",
+        "    else:\n",
+        "        model = StochasticVolatilityModel(S0, strike, T, r, v0, kappa, theta, xi, rho)\n",
+        "    \n",
+        "    knockout_option = KnockoutOption(model, S0, strike, T, r, barrier)\n",
+        "    price = knockout_option.price_knockout_option(N, M)\n",
+        "\n",
+        "    return pd.DataFrame({\"Option price\": [price]})"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "c98ff396"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Rho (correlation) and Theta (long term vol) stress test\n",
+        "First, we create a surface plot to visualize the option price with respect to two variables."
+      ],
+      "id": "b6f0a179"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def two_parameters_stress_surface_plot(result: TestResult):\n",
+        "    import plotly.graph_objects as go\n",
+        "    import numpy as np\n",
+        "    import pandas as pd\n",
+        "    # Convert to DataFrame\n",
+        "    data = pd.DataFrame(result.tables[0].data)\n",
+        "    \n",
+        "    # Get column names (first two columns are the x and y axes, third is the z value)\n",
+        "    z_col = data.columns[2]\n",
+        "    x_col = data.columns[0]\n",
+        "    y_col = data.columns[1]\n",
+        "    \n",
+        "    # Get unique values for x and y\n",
+        "    x_unique = np.sort(data[x_col].unique())\n",
+        "    y_unique = np.sort(data[y_col].unique())\n",
+        "    \n",
+        "    # Create meshgrid\n",
+        "    X, Y = np.meshgrid(x_unique, y_unique)\n",
+        "    \n",
+        "    # Create Z matrix\n",
+        "    Z = np.zeros_like(X)\n",
+        "    for i, x_val in enumerate(x_unique):\n",
+        "        for j, y_val in enumerate(y_unique):\n",
+        "            mask = (data[x_col] == x_val) & (data[y_col] == y_val)\n",
+        "            if mask.any():\n",
+        "                Z[j, i] = data.loc[mask, z_col].iloc[0]\n",
+        "    \n",
+        "    # Create the 3D surface plot\n",
+        "    fig = go.Figure(data=[go.Surface(x=X, y=Y, z=Z)])\n",
+        "    \n",
+        "    # Update the layout\n",
+        "    fig.update_layout(\n",
+        "        title=f'3D Surface Plot of {z_col}',\n",
+        "        scene=dict(\n",
+        "            xaxis_title=x_col,\n",
+        "            yaxis_title=y_col,\n",
+        "            zaxis_title=z_col,\n",
+        "            camera=dict(\n",
+        "                up=dict(x=0, y=0, z=1),\n",
+        "                center=dict(x=0, y=0, z=0),\n",
+        "                eye=dict(x=1.5, y=1.5, z=1.5)\n",
+        "            )\n",
+        "        ),\n",
+        "        width=900,\n",
+        "        height=700,\n",
+        "        margin=dict(l=65, r=50, b=65, t=90)\n",
+        "    )\n",
+        "\n",
+        "    result.add_figure(\n",
+        "        Figure(\n",
+        "            figure=fig,\n",
+        "            key=\"sensitivity_plot_\" + str(random.randint(0, 1000000)),\n",
+        "            ref_id=result.ref_id,\n",
+        "        )\n",
+        "    )\n",
+        "\n",
+        "    return result"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "b408de0f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's evaluate the sensitivity of a model's output to changes in the correlation parameter (rho) and the long-term variance parameter (theta) within a stochastic volatility framework.\n",
+        "\n",
+        "This test is useful for understanding how variations in these parameters affect the model's valuation, which is crucial for risk management and model validation."
+      ],
+      "id": "87289ee6"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "\n",
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheRhoAndThetaParameters\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [N],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\": [strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": [S0],\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": list(np.linspace(0,0.8, 10)),\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": list(np.linspace(-1,0.8, 10)),\n",
+        "    },\n",
+        "    post_process_fn=two_parameters_stress_surface_plot\n",
+        ")\n",
+        "result.log()\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "5c0ec52d"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Rho (correlation) and Xi (vol of vol) stress test"
+      ],
+      "id": "44be4c61"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "\n",
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheRhoAndXiParameters\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [N],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\": [strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": [S0],\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": list(np.linspace(0,0.8, 10)),\n",
+        "        \"rho\": list(np.linspace(-1,0.8, 10)),\n",
+        "    },\n",
+        "    post_process_fn=two_parameters_stress_surface_plot\n",
+        ")\n",
+        "result.log()\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e0a2996e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Sigma stress test\n",
+        "The sigma stress test evaluates the sensitivity of a model's output to changes in the volatility parameter, sigma. This test is crucial for understanding how variations in market volatility impact the model's valuation of financial instruments, particularly options.\n",
+        "\n",
+        "This test is useful for risk management and model validation, as it helps identify the robustness of the model under different market conditions. By analyzing the changes in the model's output as sigma varies, stakeholders can assess the model's stability and reliability."
+      ],
+      "id": "5fed568d"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheSigmaParameter\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['BS'],\n",
+        "        \"N\": [N],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\": [strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": [S0],\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"sigma\": list(np.linspace(0.2, 0.8, 10)),\n",
+        "    },\n",
+        "    post_process_fn=process_results\n",
+        ")\n",
+        "result.log()\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "d49e2e37"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Stress kappa\n",
+        "Let's evaluate the sensitivity of a model's output to changes in the kappa parameter, which is the mean-reversion rate in stochastic volatility models."
+      ],
+      "id": "4e7a1f00"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheKappaParameter\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [N],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\": [strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": [S0],\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": list(np.linspace(0, 8, 10)),\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": [-0.5],\n",
+        "    },\n",
+        "    post_process_fn=process_results\n",
+        ")\n",
+        "result.log()\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e995f6ae"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Stress theta\n",
+        "Stress Theta evaluates the sensitivity of a model's output to changes in the parameter theta, which represents the long-term variance in a stochastic volatility model."
+      ],
+      "id": "40d1c9e2"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheThetaParameter\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [N],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\": [strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": [S0],\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": list(np.linspace(0, 0.8, 10)),\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": [-0.5],\n",
+        "    },\n",
+        "    post_process_fn=process_results\n",
+        ")\n",
+        "result.log()\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "7e371aee"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Stress xi\n",
+        "Stress Xi evaluates the sensitivity of a model's output to changes in the parameter xi, which represents the volatility of volatility in a stochastic volatility model. This test is crucial for understanding how variations in xi impact the model's valuation, particularly in financial derivatives pricing."
+      ],
+      "id": "e20d074f"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheXiParameter\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [N],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\": [strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": [S0],\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": list(np.linspace(0.05, 0.95, 10)),\n",
+        "        \"rho\": [-0.5],\n",
+        "    },\n",
+        "    post_process_fn=process_results\n",
+        ")\n",
+        "result.log()\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "9c545090"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Stress rho\n",
+        "The stress rho test evaluates the sensitivity of a model's output to changes in the correlation parameter, rho, within a stochastic volatility (SV) model framework. This test is crucial for understanding how variations in rho, which represents the correlation between the asset price and its volatility, impact the model's valuation output."
+      ],
+      "id": "f0360e20"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheRhoParameter\",\n",
+        "    param_grid={\n",
+        "        \"model_type\": ['SV'],\n",
+        "        \"N\": [N],\n",
+        "        \"M\": [M],\n",
+        "        \"strike\": [strike_range[0]],\n",
+        "        \"barrier\": [barrier_range[0]],\n",
+        "        \"S0\": [S0],\n",
+        "        \"T\": [T],\n",
+        "        \"r\": [r],\n",
+        "        \"v0\": [0.2],\n",
+        "        \"kappa\": [2],\n",
+        "        \"theta\": [0.2],\n",
+        "        \"xi\": [0.1],\n",
+        "        \"rho\": list(np.linspace(-1.0, 1.0, 20)),\n",
+        "    },\n",
+        "    post_process_fn=process_results\n",
+        ")\n",
+        "result.log()\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e2c5dfb1"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ],
+      "id": "61d4e596"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-a23adf093a60485ea005cf8fc18545a5"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "validmind-1QuffXMV-py3.10",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.14"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
 }
diff --git a/site/notebooks/use_cases/capital_markets/quickstart_option_pricing_models_quantlib.ipynb b/site/notebooks/use_cases/capital_markets/quickstart_option_pricing_models_quantlib.ipynb
index 17471d33c4..eccfb8fc3b 100644
--- a/site/notebooks/use_cases/capital_markets/quickstart_option_pricing_models_quantlib.ipynb
+++ b/site/notebooks/use_cases/capital_markets/quickstart_option_pricing_models_quantlib.ipynb
@@ -1,1348 +1,1360 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "id": "1e2a4689",
-   "metadata": {},
-   "source": [
-    "# Quickstart for Heston option pricing model using QuantLib\n",
-    "\n",
-    "Welcome! Let's get you started with the basic process of documenting models with ValidMind.\n",
-    "\n",
-    "The Heston option pricing model is a popular stochastic volatility model used to price options. Developed by Steven Heston in 1993, the model assumes that the asset's volatility follows a mean-reverting square-root process, allowing it to capture the empirical observation of volatility \"clustering\" in financial markets. This model is particularly useful for assets where volatility is not constant, making it a favored approach in quantitative finance for pricing complex derivatives.\n",
-    "\n",
-    "Here’s an overview of the Heston model as implemented in QuantLib, a powerful library for quantitative finance:\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Model Assumptions and Characteristics\n",
-    "1. **Stochastic Volatility**: The volatility is modeled as a stochastic process, following a mean-reverting square-root process (Cox-Ingersoll-Ross process).\n",
-    "2. **Correlated Asset and Volatility Processes**: The asset price and volatility are assumed to be correlated, allowing the model to capture the \"smile\" effect observed in implied volatilities.\n",
-    "3. **Risk-Neutral Dynamics**: The Heston model is typically calibrated under a risk-neutral measure, which allows for direct application to pricing.\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### Heston Model Parameters\n",
-    "The model is governed by a set of key parameters:\n",
-    "- **S0**: Initial stock price\n",
-    "- **v0**: Initial variance of the asset price\n",
-    "- **kappa**: Speed of mean reversion of the variance\n",
-    "- **theta**: Long-term mean level of variance\n",
-    "- **sigma**: Volatility of volatility (vol of vol)\n",
-    "- **rho**: Correlation between the asset price and variance processes\n",
-    "\n",
-    "The dynamics of the asset price \\( S \\) and the variance \\( v \\) under the Heston model are given by:\n",
-    "\n",
-    "$$\n",
-    "dS_t = r S_t \\, dt + \\sqrt{v_t} S_t \\, dW^S_t\n",
-    "$$\n",
-    "\n",
-    "$$\n",
-    "dv_t = \\kappa (\\theta - v_t) \\, dt + \\sigma \\sqrt{v_t} \\, dW^v_t\n",
-    "$$\n",
-    "\n",
-    "where \\( $dW^S$ \\) and \\( $dW^v$ \\) are Wiener processes with correlation \\( $\\rho$ \\).\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Advantages and Limitations\n",
-    "- **Advantages**:\n",
-    "  - Ability to capture volatility smiles and skews.\n",
-    "  - More realistic pricing for options on assets with stochastic volatility.\n",
-    "- **Limitations**:\n",
-    "  - Calibration can be complex due to the number of parameters.\n",
-    "  - Computationally intensive compared to simpler models like Black-Scholes.\n",
-    "\n",
-    "This setup provides a robust framework for pricing and analyzing options with stochastic volatility dynamics. QuantLib’s implementation makes it easy to experiment with different parameter configurations and observe their effects on pricing.\n",
-    "\n",
-    "You will learn how to initialize the ValidMind Library, develop a option pricing model, and then write custom tests that can be used for sensitivity and stress testing to quickly generate documentation about model."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "69ec219a",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "  - [Model Assumptions and Characteristics](#toc1_1__)    \n",
-    "  - [Heston Model Parameters](#toc1_2__)    \n",
-    "  - [Advantages and Limitations](#toc1_3__)    \n",
-    "- [About ValidMind](#toc2__)    \n",
-    "  - [Before you begin](#toc2_1__)    \n",
-    "  - [New to ValidMind?](#toc2_2__)    \n",
-    "  - [Key concepts](#toc2_3__)    \n",
-    "- [Setting up](#toc3__)    \n",
-    "  - [Install the ValidMind Library](#toc3_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc3_2__)    \n",
-    "    - [Register sample model](#toc3_2_1__)    \n",
-    "    - [Apply documentation template](#toc3_2_2__)    \n",
-    "    - [Get your code snippet](#toc3_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc3_3__)    \n",
-    "  - [Preview the documentation template](#toc3_4__)    \n",
-    "- [Data Preparation](#toc4__)    \n",
-    "    - [Helper functions](#toc4_1_1__)    \n",
-    "  - [Market Data Quality and Availability](#toc4_2__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc4_3__)    \n",
-    "  - [Data Quality](#toc4_4__)    \n",
-    "    - [Isolation Forest Outliers Test](#toc4_4_1__)    \n",
-    "    - [Model parameters](#toc4_4_2__)    \n",
-    "- [Model development - Heston Option price](#toc5__)    \n",
-    "  - [Model Calibration](#toc5_1__)    \n",
-    "  - [Model Evaluation](#toc5_2__)    \n",
-    "    - [Benchmark Testing](#toc5_2_1__)    \n",
-    "    - [Sensitivity Testing](#toc5_2_2__)    \n",
-    "    - [Stress Testing](#toc5_2_3__)    \n",
-    "- [Next steps](#toc6__)    \n",
-    "  - [Work with your model documentation](#toc6_1__)    \n",
-    "  - [Discover more learning resources](#toc6_2__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b9fb5d17",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "f2dccf35",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5a5ce085",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "409352bf",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "65e870b2",
-   "metadata": {},
-   "source": [
-    "To install the QuantLib library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "3a34debf",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q QuantLib"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "fb30ae07",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c6f87017",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "cbb2e2c9",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Capital Markets`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "41c4edca",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Can't select this template?</b></span>\n",
-    "<br></br>\n",
-    "Your organization administrators may need to add it to your template library:\n",
-    "<ul>\n",
-    "<li><a href=\"capital_markets_template.yaml\" style=\"color: #DE257E;\"><b>Download Template YAML</b></a></li>\n",
-    "<li><a href=\"https://docs.validmind.ai/guide/templates/customize-document-templates.html\" style=\"color: #DE257E;\"><b>Customize Document Templates</b></a></li>\n",
-    "</ul>\n",
-    "</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2012eb82",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0cd3f67e",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "6d944cc9",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "f8cf2746",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%matplotlib inline\n",
-    "\n",
-    "import pandas as pd\n",
-    "import numpy as np\n",
-    "import matplotlib.pyplot as plt\n",
-    "from scipy.optimize import minimize\n",
-    "import yfinance as yf\n",
-    "import QuantLib as ql\n",
-    "from validmind.tests import run_test"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "bc431ee0",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_4__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "7e844028",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0c0ee8b9",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Data Preparation"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "5a4d2c36",
-   "metadata": {},
-   "source": [
-    "### Market Data Sources\n",
-    "\n",
-    "<a id='toc4_1_1__'></a>\n",
-    "\n",
-    "#### Helper functions\n",
-    "Let's define helper function retrieve to option data from Yahoo Finance."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b96a500f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def get_market_data(ticker, expiration_date_str):\n",
-    "    \"\"\"\n",
-    "    Fetch option market data from Yahoo Finance for the given ticker and expiration date.\n",
-    "    Returns a list of tuples: (strike, maturity, option_price).\n",
-    "    \"\"\"\n",
-    "    # Create a Ticker object for the specified stock\n",
-    "    stock = yf.Ticker(ticker)\n",
-    "\n",
-    "    # Get all available expiration dates for options\n",
-    "    option_dates = stock.options\n",
-    "\n",
-    "    # Check if the requested expiration date is available\n",
-    "    if expiration_date_str not in option_dates:\n",
-    "        raise ValueError(f\"Expiration date {expiration_date_str} not available for {ticker}. Available dates: {option_dates}\")\n",
-    "\n",
-    "    # Get the option chain for the specified expiration date\n",
-    "    option_chain = stock.option_chain(expiration_date_str)\n",
-    "\n",
-    "    # Get call options (or you can use puts as well based on your requirement)\n",
-    "    calls = option_chain.calls\n",
-    "\n",
-    "    # Convert expiration_date_str to QuantLib Date\n",
-    "    expiry_date_parts = list(map(int, expiration_date_str.split('-')))  # Split YYYY-MM-DD\n",
-    "    maturity_date = ql.Date(expiry_date_parts[2], expiry_date_parts[1], expiry_date_parts[0])  # Convert to QuantLib Date\n",
-    "\n",
-    "    # Create a list to store strike prices, maturity dates, and option prices\n",
-    "    market_data = []\n",
-    "    for index, row in calls.iterrows():\n",
-    "        strike = row['strike']\n",
-    "        option_price = row['lastPrice']  # You can also use 'bid', 'ask', 'mid', etc.\n",
-    "        market_data.append((strike, maturity_date, option_price))\n",
-    "    df = pd.DataFrame(market_data, columns = ['strike', 'maturity_date', 'option_price'])\n",
-    "    return df"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c7769b73",
-   "metadata": {},
-   "source": [
-    "Let's define helper function retrieve to stock data from Yahoo Finance. This helper function to calculate spot price, dividend yield, volatility and risk free rate using the underline stock data."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "dc44c448",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def get_option_parameters(ticker):\n",
-    "    # Fetch historical data for the stock\n",
-    "    stock_data = yf.Ticker(ticker)\n",
-    "    \n",
-    "    # Get the current spot price\n",
-    "    spot_price = stock_data.history(period=\"1d\")['Close'].iloc[-1]\n",
-    "    \n",
-    "    # Get dividend yield\n",
-    "    dividend_rate = stock_data.dividends.mean() / spot_price if not stock_data.dividends.empty else 0.0\n",
-    "    \n",
-    "    # Estimate volatility (standard deviation of log returns)\n",
-    "    hist_data = stock_data.history(period=\"1y\")['Close']\n",
-    "    log_returns = np.log(hist_data / hist_data.shift(1)).dropna()\n",
-    "    volatility = np.std(log_returns) * np.sqrt(252)  # Annualized volatility\n",
-    "    \n",
-    "    # Assume a risk-free rate from some known data (can be fetched from market data, here we use 0.001)\n",
-    "    risk_free_rate = 0.001\n",
-    "    \n",
-    "    # Return the calculated parameters\n",
-    "    return {\n",
-    "        \"spot_price\": spot_price,\n",
-    "        \"volatility\": volatility,\n",
-    "        \"dividend_rate\": dividend_rate,\n",
-    "        \"risk_free_rate\": risk_free_rate\n",
-    "    }"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c7b739d3",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Market Data Quality and Availability\n",
-    "Next, let's specify ticker and expiration date to get market data."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "50225fde",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "ticker = \"MSFT\"\n",
-    "expiration_date =  \"2024-12-13\" # Example expiration date in 'YYYY-MM-DD' form\n",
-    "\n",
-    "market_data = get_market_data(ticker=ticker, expiration_date_str=expiration_date)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "c539b95e",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "113f9c17",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_market_data = vm.init_dataset(\n",
-    "    dataset=market_data,\n",
-    "    input_id=\"market_data\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "185beb24",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4__'></a>\n",
-    "\n",
-    "### Data Quality\n",
-    "Let's check quality of the data using outliers and missing data tests."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "7f14464c",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4_1__'></a>\n",
-    "\n",
-    "#### Isolation Forest Outliers Test\n",
-    "Let's detects anomalies in the dataset using the Isolation Forest algorithm, visualized through scatter plots."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "56c919ec",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"validmind.data_validation.IsolationForestOutliers\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_market_data,\n",
-    "    },\n",
-    "    title=\"Outliers detection using Isolation Forest\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e4d0e5ca",
-   "metadata": {},
-   "source": [
-    "##### Missing Values Test\n",
-    "Let's evaluates dataset quality by ensuring the missing value ratio across all features does not exceed a set threshold."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e95c825f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"validmind.data_validation.MissingValues\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_market_data,\n",
-    "    },\n",
-    "    title=\"Missing Values detection\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "829403a3",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4_2__'></a>\n",
-    "\n",
-    "#### Model parameters\n",
-    "Let's calculate the model parameters using from stock data "
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "25936449",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "option_params = get_option_parameters(ticker=ticker)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "0a0948b6",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Model development - Heston Option price"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e15b8221",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "class HestonModel:\n",
-    "\n",
-    "    def __init__(self, ticker, expiration_date_str, calculation_date, spot_price, dividend_rate, risk_free_rate):\n",
-    "        self.ticker = ticker\n",
-    "        self.expiration_date_str = expiration_date_str,\n",
-    "        self.calculation_date = calculation_date\n",
-    "        self.spot_price = spot_price\n",
-    "        self.dividend_rate = dividend_rate\n",
-    "        self.risk_free_rate = risk_free_rate\n",
-    "    \n",
-    "    def predict_option_price(self, strike, maturity_date, spot_price, v0=None, theta=None, kappa=None, sigma=None, rho=None):\n",
-    "        # Set the evaluation date\n",
-    "        ql.Settings.instance().evaluationDate = self.calculation_date\n",
-    "\n",
-    "        # Construct the European Option\n",
-    "        payoff = ql.PlainVanillaPayoff(ql.Option.Call, strike)\n",
-    "        exercise = ql.EuropeanExercise(maturity_date)\n",
-    "        european_option = ql.VanillaOption(payoff, exercise)\n",
-    "\n",
-    "        # Yield term structures for risk-free rate and dividend\n",
-    "        riskFreeTS = ql.YieldTermStructureHandle(ql.FlatForward(calculation_date, self.risk_free_rate, ql.Actual365Fixed()))\n",
-    "        dividendTS = ql.YieldTermStructureHandle(ql.FlatForward(calculation_date, self.dividend_rate, ql.Actual365Fixed()))\n",
-    "\n",
-    "        # Initial stock price\n",
-    "        initialValue = ql.QuoteHandle(ql.SimpleQuote(spot_price))\n",
-    "\n",
-    "        # Heston process parameters\n",
-    "        heston_process = ql.HestonProcess(riskFreeTS, dividendTS, initialValue, v0, kappa, theta, sigma, rho)\n",
-    "        hestonModel = ql.HestonModel(heston_process)\n",
-    "\n",
-    "        # Use the Heston analytic engine\n",
-    "        engine = ql.AnalyticHestonEngine(hestonModel)\n",
-    "        european_option.setPricingEngine(engine)\n",
-    "\n",
-    "        # Calculate the Heston model price\n",
-    "        h_price = european_option.NPV()\n",
-    "\n",
-    "        return h_price\n",
-    "\n",
-    "    def predict_american_option_price(self, strike, maturity_date, spot_price, v0=None, theta=None, kappa=None, sigma=None, rho=None):\n",
-    "        # Set the evaluation date\n",
-    "        ql.Settings.instance().evaluationDate = self.calculation_date\n",
-    "\n",
-    "        # Construct the American Option\n",
-    "        payoff = ql.PlainVanillaPayoff(ql.Option.Call, strike)\n",
-    "        exercise = ql.AmericanExercise(self.calculation_date, maturity_date)\n",
-    "        american_option = ql.VanillaOption(payoff, exercise)\n",
-    "\n",
-    "        # Yield term structures for risk-free rate and dividend\n",
-    "        riskFreeTS = ql.YieldTermStructureHandle(ql.FlatForward(self.calculation_date, self.risk_free_rate, ql.Actual365Fixed()))\n",
-    "        dividendTS = ql.YieldTermStructureHandle(ql.FlatForward(self.calculation_date, self.dividend_rate, ql.Actual365Fixed()))\n",
-    "\n",
-    "        # Initial stock price\n",
-    "        initialValue = ql.QuoteHandle(ql.SimpleQuote(spot_price))\n",
-    "\n",
-    "        # Heston process parameters\n",
-    "        heston_process = ql.HestonProcess(riskFreeTS, dividendTS, initialValue, v0, kappa, theta, sigma, rho)\n",
-    "        heston_model = ql.HestonModel(heston_process)\n",
-    "\n",
-    "\n",
-    "        payoff = ql.PlainVanillaPayoff(ql.Option.Call, strike)\n",
-    "        exercise = ql.AmericanExercise(self.calculation_date, maturity_date)\n",
-    "        american_option = ql.VanillaOption(payoff, exercise)\n",
-    "        heston_fd_engine = ql.FdHestonVanillaEngine(heston_model)\n",
-    "        american_option.setPricingEngine(heston_fd_engine)\n",
-    "        option_price = american_option.NPV()\n",
-    "\n",
-    "        return option_price\n",
-    "\n",
-    "    def objective_function(self, params, market_data, spot_price, dividend_rate, risk_free_rate):\n",
-    "        v0, theta, kappa, sigma, rho = params\n",
-    "\n",
-    "        # Sum of squared differences between market prices and model prices\n",
-    "        error = 0.0\n",
-    "        for i, row in market_data.iterrows():\n",
-    "            model_price = self.predict_option_price(row['strike'], row['maturity_date'], spot_price, \n",
-    "                                            v0, theta, kappa, sigma, rho)\n",
-    "            error += (model_price - row['option_price']) ** 2\n",
-    "        \n",
-    "        return error\n",
-    "\n",
-    "    def calibrate_model(self, ticker, expiration_date_str):\n",
-    "        # Get the option market data dynamically from Yahoo Finance\n",
-    "        market_data = get_market_data(ticker, expiration_date_str)\n",
-    "\n",
-    "        # Initial guesses for Heston parameters\n",
-    "        initial_params = [0.04, 0.04, 0.1, 0.1, -0.75]\n",
-    "\n",
-    "        # Bounds for the parameters to ensure realistic values\n",
-    "        bounds = [(0.0001, 1.0),  # v0\n",
-    "                (0.0001, 1.0),  # theta\n",
-    "                (0.001, 2.0),   # kappa\n",
-    "                (0.001, 1.0),   # sigma\n",
-    "                (-0.75, 0.0)]    # rho\n",
-    "\n",
-    "        # Optimize the parameters to minimize the error between model and market prices\n",
-    "        result = minimize(self.objective_function, initial_params, args=(market_data, self.spot_price, self.dividend_rate, self.risk_free_rate),\n",
-    "                        bounds=bounds, method='L-BFGS-B')\n",
-    "\n",
-    "        # Optimized Heston parameters\n",
-    "        v0_opt, theta_opt, kappa_opt, sigma_opt, rho_opt = result.x\n",
-    "\n",
-    "        return v0_opt, theta_opt, kappa_opt, sigma_opt, rho_opt\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "a941aa32",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Model Calibration\n",
-    "* The calibration process aims to optimize the Heston model parameters (v0, theta, kappa, sigma, rho) by minimizing the difference between model-predicted option prices and observed market prices.\n",
-    "* In this implementation, the model is calibrated to current market data, specifically using option prices from the selected ticker and expiration date.\n",
-    "\n",
-    "Let's specify `calculation_date` and `strike_price` as input parameters for the model to verify its functionality and confirm it operates as expected."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "1d61dfca",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "calculation_date = ql.Date(26, 11, 2024)\n",
-    "# Convert expiration date string to QuantLib.Date\n",
-    "expiry_date_parts = list(map(int, expiration_date.split('-')))\n",
-    "maturity_date = ql.Date(expiry_date_parts[2], expiry_date_parts[1], expiry_date_parts[0])\n",
-    "strike_price = 460.0\n",
-    "\n",
-    "hm = HestonModel(\n",
-    "    ticker=ticker,\n",
-    "    expiration_date_str= expiration_date,\n",
-    "    calculation_date= calculation_date,\n",
-    "    spot_price= option_params['spot_price'],\n",
-    "    dividend_rate = option_params['dividend_rate'],\n",
-    "    risk_free_rate = option_params['risk_free_rate']\n",
-    ")\n",
-    "\n",
-    "# Let's calibrate model\n",
-    "v0_opt, theta_opt, kappa_opt, sigma_opt, rho_opt = hm.calibrate_model(ticker, expiration_date)\n",
-    "print(f\"Optimized Heston parameters: v0={v0_opt}, theta={theta_opt}, kappa={kappa_opt}, sigma={sigma_opt}, rho={rho_opt}\")\n",
-    "\n",
-    "\n",
-    "# option price\n",
-    "h_price = hm.predict_option_price(strike_price, maturity_date, option_params['spot_price'], v0_opt, theta_opt, kappa_opt, sigma_opt, rho_opt)\n",
-    "print(\"The Heston model price for the option is:\", h_price)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "75313272",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Model Evaluation"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "2e6471ef",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2_1__'></a>\n",
-    "\n",
-    "#### Benchmark Testing\n",
-    "The benchmark testing framework provides a robust way to validate the Heston model implementation and understand the relationships between European and American option prices under stochastic volatility conditions.\n",
-    "Let's compares European and American option prices using the Heston model."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 15,
-   "id": "810cf887",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.BenchmarkTest\")\n",
-    "def benchmark_test(hm_model, strikes, maturity_date, spot_price, v0=None, theta=None, kappa=None, sigma=None, rho=None):\n",
-    "    \"\"\"\n",
-    "    Compares European and American option prices using the Heston model.\n",
-    "\n",
-    "    This test evaluates the price differences between European and American options\n",
-    "    across multiple strike prices while keeping other parameters constant. The comparison\n",
-    "    helps understand the early exercise premium of American options over their European\n",
-    "    counterparts under stochastic volatility conditions.\n",
-    "\n",
-    "    Args:\n",
-    "        hm_model: HestonModel instance for option pricing calculations\n",
-    "        strikes (list[float]): List of strike prices to test\n",
-    "        maturity_date (ql.Date): Option expiration date in QuantLib format\n",
-    "        spot_price (float): Current price of the underlying asset\n",
-    "        v0 (float, optional): Initial variance. Defaults to None.\n",
-    "        theta (float, optional): Long-term variance. Defaults to None.\n",
-    "        kappa (float, optional): Mean reversion rate. Defaults to None.\n",
-    "        sigma (float, optional): Volatility of variance. Defaults to None.\n",
-    "        rho (float, optional): Correlation between asset and variance. Defaults to None.\n",
-    "\n",
-    "    Returns:\n",
-    "        dict: Contains a DataFrame with the following columns:\n",
-    "            - Strike: Strike prices tested\n",
-    "            - Maturity date: Expiration date for all options\n",
-    "            - Spot price: Current underlying price\n",
-    "            - european model price: Prices for European options\n",
-    "            - american model price: Prices for American options\n",
-    "\"\"\"\n",
-    "    american_derived_prices = []\n",
-    "    european_derived_prices = []\n",
-    "    for K in strikes:\n",
-    "        european_derived_prices.append(hm_model.predict_option_price(K, maturity_date, spot_price, v0, theta, kappa, sigma, rho))\n",
-    "        american_derived_prices.append(hm_model.predict_american_option_price(K, maturity_date, spot_price, v0, theta, kappa, sigma, rho))\n",
-    "\n",
-    "    data = {\n",
-    "        \"Strike\": strikes,\n",
-    "        \"Maturity date\": [maturity_date] * len(strikes),\n",
-    "        \"Spot price\": [spot_price] * len(strikes),\n",
-    "        \"european model price\": european_derived_prices,\n",
-    "        \"american model price\": american_derived_prices,\n",
-    "\n",
-    "    }\n",
-    "    df1 = pd.DataFrame(data)\n",
-    "    return {\"strikes variation benchmarking\": df1}"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "3fdd6705",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.BenchmarkTest\",\n",
-    "    params={\n",
-    "        \"hm_model\": hm,\n",
-    "        \"strikes\": [400, 425, 460, 495, 520],\n",
-    "        \"maturity_date\": maturity_date,\n",
-    "        \"spot_price\": option_params['spot_price'],\n",
-    "        \"v0\":v0_opt,\n",
-    "        \"theta\": theta_opt,\n",
-    "        \"kappa\":kappa_opt ,\n",
-    "        \"sigma\": sigma_opt,\n",
-    "        \"rho\":rho_opt\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "e359b503",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2_2__'></a>\n",
-    "\n",
-    "#### Sensitivity Testing\n",
-    "The sensitivity testing framework provides a systematic approach to understanding how the Heston model responds to parameter changes, which is crucial for both model validation and practical application in trading and risk management."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "51922313",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_test_provider.Sensitivity\")\n",
-    "def SensitivityTest(\n",
-    "    model,\n",
-    "    strike_price,\n",
-    "    maturity_date,\n",
-    "    spot_price,\n",
-    "    v0_opt,\n",
-    "    theta_opt,\n",
-    "    kappa_opt,\n",
-    "    sigma_opt,\n",
-    "    rho_opt,\n",
-    "):\n",
-    "    \"\"\"\n",
-    "    Evaluates the sensitivity of American option prices to changes in model parameters.\n",
-    "\n",
-    "    This test calculates option prices using the Heston model with optimized parameters.\n",
-    "    It's designed to analyze how changes in various model inputs affect the option price,\n",
-    "    which is crucial for understanding model behavior and risk management.\n",
-    "\n",
-    "    Args:\n",
-    "        model (HestonModel): Initialized Heston model instance wrapped in ValidMind model object\n",
-    "        strike_price (float): Strike price of the option\n",
-    "        maturity_date (ql.Date): Expiration date of the option in QuantLib format\n",
-    "        spot_price (float): Current price of the underlying asset\n",
-    "        v0_opt (float): Optimized initial variance parameter\n",
-    "        theta_opt (float): Optimized long-term variance parameter\n",
-    "        kappa_opt (float): Optimized mean reversion rate parameter\n",
-    "        sigma_opt (float): Optimized volatility of variance parameter\n",
-    "        rho_opt (float): Optimized correlation parameter between asset price and variance\n",
-    "    \"\"\"\n",
-    "    price = model.model.predict_american_option_price(\n",
-    "        strike_price,\n",
-    "        maturity_date,\n",
-    "        spot_price,\n",
-    "        v0_opt,\n",
-    "        theta_opt,\n",
-    "        kappa_opt,\n",
-    "        sigma_opt,\n",
-    "        rho_opt,\n",
-    "    )\n",
-    "\n",
-    "    return price\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "408a05ef",
-   "metadata": {},
-   "source": [
-    "##### Common plot function"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "104ca6dd",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def plot_results(df, params: dict = None):\n",
-    "        fig2 =  plt.figure(figsize=(10, 6))\n",
-    "        plt.plot(df[params[\"x\"]], df[params[\"y\"]], label=params[\"label\"])\n",
-    "        plt.xlabel(params[\"xlabel\"])\n",
-    "        plt.ylabel(params[\"ylabel\"])\n",
-    "        \n",
-    "        plt.title(params[\"title\"])\n",
-    "        plt.legend()\n",
-    "        plt.grid(True)\n",
-    "        plt.show()  # close the plot to avoid displaying it"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "ca72b9e5",
-   "metadata": {},
-   "source": [
-    "Let's create ValidMind model object"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "ae7093fa",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "hm_model = vm.init_model(model=hm, input_id=\"HestonModel\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b2141640",
-   "metadata": {},
-   "source": [
-    "##### Strike sensitivity\n",
-    "Let's analyzes how option prices change as the strike price varies. We create a range of strike prices around the current strike (460) and observe the impact on option prices while keeping all other parameters constant."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "ea7f1cbe",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_test_provider.Sensitivity:ToStrike\",\n",
-    "    inputs = {\n",
-    "        \"model\": hm_model\n",
-    "    },\n",
-    "    param_grid={\n",
-    "        \"strike_price\": list(np.linspace(460-50, 460+50, 10)),\n",
-    "        \"maturity_date\": [maturity_date],\n",
-    "        \"spot_price\": [option_params[\"spot_price\"]],\n",
-    "        \"v0_opt\": [v0_opt],\n",
-    "        \"theta_opt\": [theta_opt],\n",
-    "        \"kappa_opt\": [kappa_opt],\n",
-    "        \"sigma_opt\": [sigma_opt],\n",
-    "        \"rho_opt\":[rho_opt]\n",
-    "    },\n",
-    ")\n",
-    "result.log()\n",
-    "# Visualize how option prices change with different strike prices\n",
-    "plot_results(\n",
-    "    pd.DataFrame(result.tables[0].data),\n",
-    "    params={\n",
-    "        \"x\": \"strike_price\",\n",
-    "        \"y\":\"Value\",\n",
-    "        \"label\":\"Strike price\",\n",
-    "        \"xlabel\":\"Strike price\",\n",
-    "        \"ylabel\":\"option price\",\n",
-    "        \"title\":\"Heston option - Strike price Sensitivity\",\n",
-    "    }\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "be143012",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2_3__'></a>\n",
-    "\n",
-    "#### Stress Testing\n",
-    "This stress testing framework provides a comprehensive view of how the Heston model behaves under different market conditions and helps identify potential risks in option pricing."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "f2f01a40",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "@vm.test(\"my_custom_tests.Stressing\")\n",
-    "def StressTest(\n",
-    "    model,\n",
-    "    strike_price,\n",
-    "    maturity_date,\n",
-    "    spot_price,\n",
-    "    v0_opt,\n",
-    "    theta_opt,\n",
-    "    kappa_opt,\n",
-    "    sigma_opt,\n",
-    "    rho_opt,\n",
-    "):\n",
-    "    \"\"\"\n",
-    "    Performs stress testing on Heston model parameters to evaluate option price sensitivity.\n",
-    "\n",
-    "    This test evaluates how the American option price responds to stressed market conditions\n",
-    "    by varying key model parameters. It's designed to:\n",
-    "    1. Identify potential model vulnerabilities\n",
-    "    2. Understand price behavior under extreme scenarios\n",
-    "    3. Support risk management decisions\n",
-    "    4. Validate model stability across parameter ranges\n",
-    "\n",
-    "    Args:\n",
-    "        model (HestonModel): Initialized Heston model instance wrapped in ValidMind model object\n",
-    "        strike_price (float): Option strike price\n",
-    "        maturity_date (ql.Date): Option expiration date in QuantLib format\n",
-    "        spot_price (float): Current price of the underlying asset\n",
-    "        v0_opt (float): Initial variance parameter under stress testing\n",
-    "        theta_opt (float): Long-term variance parameter under stress testing\n",
-    "        kappa_opt (float): Mean reversion rate parameter under stress testing\n",
-    "        sigma_opt (float): Volatility of variance parameter under stress testing\n",
-    "        rho_opt (float): Correlation parameter under stress testing\n",
-    "    \"\"\"\n",
-    "    price = model.model.predict_american_option_price(\n",
-    "        strike_price,\n",
-    "        maturity_date,\n",
-    "        spot_price,\n",
-    "        v0_opt,\n",
-    "        theta_opt,\n",
-    "        kappa_opt,\n",
-    "        sigma_opt,\n",
-    "        rho_opt,\n",
-    "    )\n",
-    "\n",
-    "    return price\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "31fcbe9c",
-   "metadata": {},
-   "source": [
-    "##### Rho (correlation) and Theta (long term vol) stress test\n",
-    "Next, let's evaluates the sensitivity of a model's output to changes in the correlation parameter (rho) and the long-term variance parameter (theta) within a stochastic volatility framework."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "6119b5d9",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheRhoAndThetaParameters\",\n",
-    "    inputs = {\n",
-    "        \"model\": hm_model,\n",
-    "    },\n",
-    "    param_grid={\n",
-    "        \"strike_price\": [460],\n",
-    "        \"maturity_date\": [maturity_date],\n",
-    "        \"spot_price\": [option_params[\"spot_price\"]],\n",
-    "        \"v0_opt\": [v0_opt],\n",
-    "        \"theta_opt\": list(np.linspace(0.1, theta_opt+0.4, 5)),\n",
-    "        \"kappa_opt\": [kappa_opt],\n",
-    "        \"sigma_opt\": [sigma_opt],\n",
-    "        \"rho_opt\":list(np.linspace(rho_opt-0.2, rho_opt+0.2, 5))\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "be39cb3a",
-   "metadata": {},
-   "source": [
-    "##### Sigma stress test\n",
-    "Let's evaluates the sensitivity of a model's output to changes in the volatility parameter, sigma. This test is crucial for understanding how variations in market volatility impact the model's valuation of financial instruments, particularly options."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "0dc189b7",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheSigmaParameter\",\n",
-    "    inputs = {\n",
-    "        \"model\": hm_model,\n",
-    "    },\n",
-    "    param_grid={\n",
-    "        \"strike_price\": [460],\n",
-    "        \"maturity_date\": [maturity_date],\n",
-    "        \"spot_price\": [option_params[\"spot_price\"]],\n",
-    "        \"v0_opt\": [v0_opt],\n",
-    "        \"theta_opt\": [theta_opt],\n",
-    "        \"kappa_opt\": [kappa_opt],\n",
-    "        \"sigma_opt\": list(np.linspace(0.1, sigma_opt+0.6, 5)),\n",
-    "        \"rho_opt\": [rho_opt]\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "173a5294",
-   "metadata": {},
-   "source": [
-    "##### Stress kappa\n",
-    "Let's evaluates the sensitivity of a model's output to changes in the kappa parameter, which is a mean reversion rate in stochastic volatility models."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "dae9714f",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheKappaParameter\",\n",
-    "    inputs = {\n",
-    "        \"model\": hm_model,\n",
-    "    },\n",
-    "    param_grid={\n",
-    "        \"strike_price\": [460],\n",
-    "        \"maturity_date\": [maturity_date],\n",
-    "        \"spot_price\": [option_params[\"spot_price\"]],\n",
-    "        \"v0_opt\": [v0_opt],\n",
-    "        \"theta_opt\": [theta_opt],\n",
-    "        \"kappa_opt\": list(np.linspace(kappa_opt, kappa_opt+0.2, 5)),\n",
-    "        \"sigma_opt\": [sigma_opt],\n",
-    "        \"rho_opt\": [rho_opt]\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "b4d1d968",
-   "metadata": {},
-   "source": [
-    "##### Stress theta\n",
-    "Let's evaluates the sensitivity of a model's output to changes in the parameter theta, which represents the long-term variance in a stochastic volatility model."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "e68df3db",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheThetaParameter\",\n",
-    "    inputs = {\n",
-    "        \"model\": hm_model,\n",
-    "    },\n",
-    "    param_grid={\n",
-    "        \"strike_price\": [460],\n",
-    "        \"maturity_date\": [maturity_date],\n",
-    "        \"spot_price\": [option_params[\"spot_price\"]],\n",
-    "        \"v0_opt\": [v0_opt],\n",
-    "        \"theta_opt\": list(np.linspace(0.1, theta_opt+0.9, 5)),\n",
-    "        \"kappa_opt\": [kappa_opt],\n",
-    "        \"sigma_opt\": [sigma_opt],\n",
-    "        \"rho_opt\": [rho_opt]\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "32e70456",
-   "metadata": {},
-   "source": [
-    "##### Stress rho\n",
-    "Let's evaluates the sensitivity of a model's output to changes in the correlation parameter, rho, within a stochastic volatility (SV) model framework. This test is crucial for understanding how variations in rho, which represents the correlation between the asset price and its volatility, impact the model's valuation output."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "id": "b5ca3fc2",
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_test(\n",
-    "    \"my_custom_tests.Stressing:TheRhoParameter\",\n",
-    "    inputs = {\n",
-    "        \"model\": hm_model,\n",
-    "    },\n",
-    "    param_grid={\n",
-    "        \"strike_price\": [460],\n",
-    "        \"maturity_date\": [maturity_date],\n",
-    "        \"spot_price\": [option_params[\"spot_price\"]],\n",
-    "        \"v0_opt\": [v0_opt],\n",
-    "        \"theta_opt\": [theta_opt],\n",
-    "        \"kappa_opt\": [kappa_opt],\n",
-    "        \"sigma_opt\": [sigma_opt],\n",
-    "        \"rho_opt\": list(np.linspace(rho_opt-0.2, rho_opt+0.2, 5))\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "892c5347",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-de5d1e182b09403abddabc2850f2dd05",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "validmind-1QuffXMV-py3.10",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.14"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 5
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Quickstart for Heston option pricing model using QuantLib\n",
+        "\n",
+        "Welcome! Let's get you started with the basic process of documenting models with ValidMind.\n",
+        "\n",
+        "The Heston option pricing model is a popular stochastic volatility model used to price options. Developed by Steven Heston in 1993, the model assumes that the asset's volatility follows a mean-reverting square-root process, allowing it to capture the empirical observation of volatility \"clustering\" in financial markets. This model is particularly useful for assets where volatility is not constant, making it a favored approach in quantitative finance for pricing complex derivatives.\n",
+        "\n",
+        "Here’s an overview of the Heston model as implemented in QuantLib, a powerful library for quantitative finance:\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Model Assumptions and Characteristics\n",
+        "1. **Stochastic Volatility**: The volatility is modeled as a stochastic process, following a mean-reverting square-root process (Cox-Ingersoll-Ross process).\n",
+        "2. **Correlated Asset and Volatility Processes**: The asset price and volatility are assumed to be correlated, allowing the model to capture the \"smile\" effect observed in implied volatilities.\n",
+        "3. **Risk-Neutral Dynamics**: The Heston model is typically calibrated under a risk-neutral measure, which allows for direct application to pricing.\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### Heston Model Parameters\n",
+        "The model is governed by a set of key parameters:\n",
+        "- **S0**: Initial stock price\n",
+        "- **v0**: Initial variance of the asset price\n",
+        "- **kappa**: Speed of mean reversion of the variance\n",
+        "- **theta**: Long-term mean level of variance\n",
+        "- **sigma**: Volatility of volatility (vol of vol)\n",
+        "- **rho**: Correlation between the asset price and variance processes\n",
+        "\n",
+        "The dynamics of the asset price $S$ and the variance $v$ under the Heston model are given by:\n",
+        "\n",
+        "$$\n",
+        "dS_t = r S_t \\, dt + \\sqrt{v_t} S_t \\, dW^S_t\n",
+        "$$\n",
+        "\n",
+        "$$\n",
+        "dv_t = \\kappa (\\theta - v_t) \\, dt + \\sigma \\sqrt{v_t} \\, dW^v_t\n",
+        "$$\n",
+        "\n",
+        "where $dW^S$ and $dW^v$ are Wiener processes with correlation $\\rho$.\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Advantages and Limitations\n",
+        "- **Advantages**:\n",
+        "  - Ability to capture volatility smiles and skews.\n",
+        "  - More realistic pricing for options on assets with stochastic volatility.\n",
+        "- **Limitations**:\n",
+        "  - Calibration can be complex due to the number of parameters.\n",
+        "  - Computationally intensive compared to simpler models like Black-Scholes.\n",
+        "\n",
+        "This setup provides a robust framework for pricing and analyzing options with stochastic volatility dynamics. QuantLib’s implementation makes it easy to experiment with different parameter configurations and observe their effects on pricing.\n",
+        "\n",
+        "You will learn how to initialize the ValidMind Library, develop an option pricing model, and then write custom tests that can be used for sensitivity and stress testing to quickly generate documentation about the model."
+      ],
+      "id": "1e2a4689"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "  - [Model Assumptions and Characteristics](#toc1_1__)    \n",
+        "  - [Heston Model Parameters](#toc1_2__)    \n",
+        "  - [Advantages and Limitations](#toc1_3__)    \n",
+        "- [About ValidMind](#toc2__)    \n",
+        "  - [Before you begin](#toc2_1__)    \n",
+        "  - [New to ValidMind?](#toc2_2__)    \n",
+        "  - [Key concepts](#toc2_3__)    \n",
+        "- [Setting up](#toc3__)    \n",
+        "  - [Install the ValidMind Library](#toc3_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc3_2__)    \n",
+        "    - [Register sample model](#toc3_2_1__)    \n",
+        "    - [Apply documentation template](#toc3_2_2__)    \n",
+        "    - [Get your code snippet](#toc3_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc3_3__)    \n",
+        "  - [Preview the documentation template](#toc3_4__)    \n",
+        "- [Data Preparation](#toc4__)    \n",
+        "    - [Helper functions](#toc4_1_1__)    \n",
+        "  - [Market Data Quality and Availability](#toc4_2__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc4_3__)    \n",
+        "  - [Data Quality](#toc4_4__)    \n",
+        "    - [Isolation Forest Outliers Test](#toc4_4_1__)    \n",
+        "    - [Model parameters](#toc4_4_2__)    \n",
+        "- [Model development - Heston Option price](#toc5__)    \n",
+        "  - [Model Calibration](#toc5_1__)    \n",
+        "  - [Model Evaluation](#toc5_2__)    \n",
+        "    - [Benchmark Testing](#toc5_2_1__)    \n",
+        "    - [Sensitivity Testing](#toc5_2_2__)    \n",
+        "    - [Stress Testing](#toc5_2_3__)    \n",
+        "- [Next steps](#toc6__)    \n",
+        "  - [Work with your model documentation](#toc6_1__)    \n",
+        "  - [Discover more learning resources](#toc6_2__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ],
+      "id": "69ec219a"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ],
+      "id": "b9fb5d17"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Setting up"
+      ],
+      "id": "f2dccf35"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ],
+      "id": "5a5ce085"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "409352bf"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "To install the QuantLib library:"
+      ],
+      "id": "65e870b2"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q QuantLib"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "3a34debf"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ],
+      "id": "fb30ae07"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ],
+      "id": "c6f87017"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Capital Markets`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ],
+      "id": "cbb2e2c9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Can't select this template?</b></span>\n",
+        "<br></br>\n",
+        "Your organization administrators may need to add it to your template library:\n",
+        "<ul>\n",
+        "<li><a href=\"capital_markets_template.yaml\" style=\"color: #DE257E;\"><b>Download Template YAML</b></a></li>\n",
+        "<li><a href=\"https://docs.validmind.ai/guide/templates/customize-document-templates.html\" style=\"color: #DE257E;\"><b>Customize Document Templates</b></a></li>\n",
+        "</ul>\n",
+        "</div>"
+      ],
+      "id": "41c4edca"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ],
+      "id": "2012eb82"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0cd3f67e"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ],
+      "id": "6d944cc9"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%matplotlib inline\n",
+        "\n",
+        "import pandas as pd\n",
+        "import numpy as np\n",
+        "import matplotlib.pyplot as plt\n",
+        "from scipy.optimize import minimize\n",
+        "import yfinance as yf\n",
+        "import QuantLib as ql\n",
+        "from validmind.tests import run_test"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "f8cf2746"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_4__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
+      ],
+      "id": "bc431ee0"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "7e844028"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Data Preparation"
+      ],
+      "id": "0c0ee8b9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "### Market Data Sources\n",
+        "\n",
+        "<a id='toc4_1_1__'></a>\n",
+        "\n",
+        "#### Helper functions\n",
+        "Let's define a helper function to retrieve option data from Yahoo Finance."
+      ],
+      "id": "5a4d2c36"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def get_market_data(ticker, expiration_date_str):\n",
+        "    \"\"\"\n",
+        "    Fetch option market data from Yahoo Finance for the given ticker and expiration date.\n",
+        "    Returns a list of tuples: (strike, maturity, option_price).\n",
+        "    \"\"\"\n",
+        "    # Create a Ticker object for the specified stock\n",
+        "    stock = yf.Ticker(ticker)\n",
+        "\n",
+        "    # Get all available expiration dates for options\n",
+        "    option_dates = stock.options\n",
+        "\n",
+        "    # Check if the requested expiration date is available\n",
+        "    if expiration_date_str not in option_dates:\n",
+        "        raise ValueError(f\"Expiration date {expiration_date_str} not available for {ticker}. Available dates: {option_dates}\")\n",
+        "\n",
+        "    # Get the option chain for the specified expiration date\n",
+        "    option_chain = stock.option_chain(expiration_date_str)\n",
+        "\n",
+        "    # Get call options (or you can use puts as well based on your requirement)\n",
+        "    calls = option_chain.calls\n",
+        "\n",
+        "    # Convert expiration_date_str to QuantLib Date\n",
+        "    expiry_date_parts = list(map(int, expiration_date_str.split('-')))  # Split YYYY-MM-DD\n",
+        "    maturity_date = ql.Date(expiry_date_parts[2], expiry_date_parts[1], expiry_date_parts[0])  # Convert to QuantLib Date\n",
+        "\n",
+        "    # Create a list to store strike prices, maturity dates, and option prices\n",
+        "    market_data = []\n",
+        "    for index, row in calls.iterrows():\n",
+        "        strike = row['strike']\n",
+        "        option_price = row['lastPrice']  # You can also use 'bid', 'ask', 'mid', etc.\n",
+        "        market_data.append((strike, maturity_date, option_price))\n",
+        "    df = pd.DataFrame(market_data, columns = ['strike', 'maturity_date', 'option_price'])\n",
+        "    return df"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "b96a500f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's define a helper function to retrieve stock data from Yahoo Finance. This helper function calculates the spot price, dividend yield, volatility, and risk-free rate using the underlying stock data."
+      ],
+      "id": "c7769b73"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def get_option_parameters(ticker):\n",
+        "    # Fetch historical data for the stock\n",
+        "    stock_data = yf.Ticker(ticker)\n",
+        "    \n",
+        "    # Get the current spot price\n",
+        "    spot_price = stock_data.history(period=\"1d\")['Close'].iloc[-1]\n",
+        "    \n",
+        "    # Get dividend yield\n",
+        "    dividend_rate = stock_data.dividends.mean() / spot_price if not stock_data.dividends.empty else 0.0\n",
+        "    \n",
+        "    # Estimate volatility (standard deviation of log returns)\n",
+        "    hist_data = stock_data.history(period=\"1y\")['Close']\n",
+        "    log_returns = np.log(hist_data / hist_data.shift(1)).dropna()\n",
+        "    volatility = np.std(log_returns) * np.sqrt(252)  # Annualized volatility\n",
+        "    \n",
+        "    # Assume a risk-free rate from some known data (can be fetched from market data, here we use 0.001)\n",
+        "    risk_free_rate = 0.001\n",
+        "    \n",
+        "    # Return the calculated parameters\n",
+        "    return {\n",
+        "        \"spot_price\": spot_price,\n",
+        "        \"volatility\": volatility,\n",
+        "        \"dividend_rate\": dividend_rate,\n",
+        "        \"risk_free_rate\": risk_free_rate\n",
+        "    }"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "dc44c448"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Market Data Quality and Availability\n",
+        "Next, let's specify the ticker and expiration date to get market data."
+      ],
+      "id": "c7b739d3"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "ticker = \"MSFT\"\n",
+        "expiration_date =  \"2024-12-13\" # Example expiration date in 'YYYY-MM-DD' form\n",
+        "\n",
+        "market_data = get_market_data(ticker=ticker, expiration_date_str=expiration_date)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "50225fde"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module."
+      ],
+      "id": "c539b95e"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_market_data = vm.init_dataset(\n",
+        "    dataset=market_data,\n",
+        "    input_id=\"market_data\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "113f9c17"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4__'></a>\n",
+        "\n",
+        "### Data Quality\n",
+        "Let's check the quality of the data using outlier and missing-value tests."
+      ],
+      "id": "185beb24"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4_1__'></a>\n",
+        "\n",
+        "#### Isolation Forest Outliers Test\n",
+        "Let's detect anomalies in the dataset using the Isolation Forest algorithm, visualized through scatter plots."
+      ],
+      "id": "7f14464c"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"validmind.data_validation.IsolationForestOutliers\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_market_data,\n",
+        "    },\n",
+        "    title=\"Outliers detection using Isolation Forest\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "56c919ec"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Missing Values Test\n",
+        "Let's evaluate dataset quality by ensuring the missing value ratio across all features does not exceed a set threshold."
+      ],
+      "id": "e4d0e5ca"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"validmind.data_validation.MissingValues\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_market_data,\n",
+        "    },\n",
+        "    title=\"Missing Values detection\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e95c825f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4_2__'></a>\n",
+        "\n",
+        "#### Model parameters\n",
+        "Let's calculate the model parameters from the stock data."
+      ],
+      "id": "829403a3"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "option_params = get_option_parameters(ticker=ticker)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "25936449"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Model development - Heston Option price"
+      ],
+      "id": "0a0948b6"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "class HestonModel:\n",
+        "\n",
+        "    def __init__(self, ticker, expiration_date_str, calculation_date, spot_price, dividend_rate, risk_free_rate):\n",
+        "        self.ticker = ticker\n",
+        "        self.expiration_date_str = expiration_date_str,\n",
+        "        self.calculation_date = calculation_date\n",
+        "        self.spot_price = spot_price\n",
+        "        self.dividend_rate = dividend_rate\n",
+        "        self.risk_free_rate = risk_free_rate\n",
+        "    \n",
+        "    def predict_option_price(self, strike, maturity_date, spot_price, v0=None, theta=None, kappa=None, sigma=None, rho=None):\n",
+        "        # Set the evaluation date\n",
+        "        ql.Settings.instance().evaluationDate = self.calculation_date\n",
+        "\n",
+        "        # Construct the European Option\n",
+        "        payoff = ql.PlainVanillaPayoff(ql.Option.Call, strike)\n",
+        "        exercise = ql.EuropeanExercise(maturity_date)\n",
+        "        european_option = ql.VanillaOption(payoff, exercise)\n",
+        "\n",
+        "        # Yield term structures for risk-free rate and dividend\n",
+        "        riskFreeTS = ql.YieldTermStructureHandle(ql.FlatForward(calculation_date, self.risk_free_rate, ql.Actual365Fixed()))\n",
+        "        dividendTS = ql.YieldTermStructureHandle(ql.FlatForward(calculation_date, self.dividend_rate, ql.Actual365Fixed()))\n",
+        "\n",
+        "        # Initial stock price\n",
+        "        initialValue = ql.QuoteHandle(ql.SimpleQuote(spot_price))\n",
+        "\n",
+        "        # Heston process parameters\n",
+        "        heston_process = ql.HestonProcess(riskFreeTS, dividendTS, initialValue, v0, kappa, theta, sigma, rho)\n",
+        "        hestonModel = ql.HestonModel(heston_process)\n",
+        "\n",
+        "        # Use the Heston analytic engine\n",
+        "        engine = ql.AnalyticHestonEngine(hestonModel)\n",
+        "        european_option.setPricingEngine(engine)\n",
+        "\n",
+        "        # Calculate the Heston model price\n",
+        "        h_price = european_option.NPV()\n",
+        "\n",
+        "        return h_price\n",
+        "\n",
+        "    def predict_american_option_price(self, strike, maturity_date, spot_price, v0=None, theta=None, kappa=None, sigma=None, rho=None):\n",
+        "        # Set the evaluation date\n",
+        "        ql.Settings.instance().evaluationDate = self.calculation_date\n",
+        "\n",
+        "        # Construct the American Option\n",
+        "        payoff = ql.PlainVanillaPayoff(ql.Option.Call, strike)\n",
+        "        exercise = ql.AmericanExercise(self.calculation_date, maturity_date)\n",
+        "        american_option = ql.VanillaOption(payoff, exercise)\n",
+        "\n",
+        "        # Yield term structures for risk-free rate and dividend\n",
+        "        riskFreeTS = ql.YieldTermStructureHandle(ql.FlatForward(self.calculation_date, self.risk_free_rate, ql.Actual365Fixed()))\n",
+        "        dividendTS = ql.YieldTermStructureHandle(ql.FlatForward(self.calculation_date, self.dividend_rate, ql.Actual365Fixed()))\n",
+        "\n",
+        "        # Initial stock price\n",
+        "        initialValue = ql.QuoteHandle(ql.SimpleQuote(spot_price))\n",
+        "\n",
+        "        # Heston process parameters\n",
+        "        heston_process = ql.HestonProcess(riskFreeTS, dividendTS, initialValue, v0, kappa, theta, sigma, rho)\n",
+        "        heston_model = ql.HestonModel(heston_process)\n",
+        "\n",
+        "\n",
+        "        payoff = ql.PlainVanillaPayoff(ql.Option.Call, strike)\n",
+        "        exercise = ql.AmericanExercise(self.calculation_date, maturity_date)\n",
+        "        american_option = ql.VanillaOption(payoff, exercise)\n",
+        "        heston_fd_engine = ql.FdHestonVanillaEngine(heston_model)\n",
+        "        american_option.setPricingEngine(heston_fd_engine)\n",
+        "        option_price = american_option.NPV()\n",
+        "\n",
+        "        return option_price\n",
+        "\n",
+        "    def objective_function(self, params, market_data, spot_price, dividend_rate, risk_free_rate):\n",
+        "        v0, theta, kappa, sigma, rho = params\n",
+        "\n",
+        "        # Sum of squared differences between market prices and model prices\n",
+        "        error = 0.0\n",
+        "        for i, row in market_data.iterrows():\n",
+        "            model_price = self.predict_option_price(row['strike'], row['maturity_date'], spot_price, \n",
+        "                                            v0, theta, kappa, sigma, rho)\n",
+        "            error += (model_price - row['option_price']) ** 2\n",
+        "        \n",
+        "        return error\n",
+        "\n",
+        "    def calibrate_model(self, ticker, expiration_date_str):\n",
+        "        # Get the option market data dynamically from Yahoo Finance\n",
+        "        market_data = get_market_data(ticker, expiration_date_str)\n",
+        "\n",
+        "        # Initial guesses for Heston parameters\n",
+        "        initial_params = [0.04, 0.04, 0.1, 0.1, -0.75]\n",
+        "\n",
+        "        # Bounds for the parameters to ensure realistic values\n",
+        "        bounds = [(0.0001, 1.0),  # v0\n",
+        "                (0.0001, 1.0),  # theta\n",
+        "                (0.001, 2.0),   # kappa\n",
+        "                (0.001, 1.0),   # sigma\n",
+        "                (-0.75, 0.0)]    # rho\n",
+        "\n",
+        "        # Optimize the parameters to minimize the error between model and market prices\n",
+        "        result = minimize(self.objective_function, initial_params, args=(market_data, self.spot_price, self.dividend_rate, self.risk_free_rate),\n",
+        "                        bounds=bounds, method='L-BFGS-B')\n",
+        "\n",
+        "        # Optimized Heston parameters\n",
+        "        v0_opt, theta_opt, kappa_opt, sigma_opt, rho_opt = result.x\n",
+        "\n",
+        "        return v0_opt, theta_opt, kappa_opt, sigma_opt, rho_opt\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e15b8221"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Model Calibration\n",
+        "* The calibration process aims to optimize the Heston model parameters (v0, theta, kappa, sigma, rho) by minimizing the difference between model-predicted option prices and observed market prices.\n",
+        "* In this implementation, the model is calibrated to current market data, specifically using option prices from the selected ticker and expiration date.\n",
+        "\n",
+        "Let's specify `calculation_date` and `strike_price` as input parameters for the model to verify its functionality and confirm it operates as expected."
+      ],
+      "id": "a941aa32"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "calculation_date = ql.Date(26, 11, 2024)\n",
+        "# Convert expiration date string to QuantLib.Date\n",
+        "expiry_date_parts = list(map(int, expiration_date.split('-')))\n",
+        "maturity_date = ql.Date(expiry_date_parts[2], expiry_date_parts[1], expiry_date_parts[0])\n",
+        "strike_price = 460.0\n",
+        "\n",
+        "hm = HestonModel(\n",
+        "    ticker=ticker,\n",
+        "    expiration_date_str= expiration_date,\n",
+        "    calculation_date= calculation_date,\n",
+        "    spot_price= option_params['spot_price'],\n",
+        "    dividend_rate = option_params['dividend_rate'],\n",
+        "    risk_free_rate = option_params['risk_free_rate']\n",
+        ")\n",
+        "\n",
+        "# Let's calibrate model\n",
+        "v0_opt, theta_opt, kappa_opt, sigma_opt, rho_opt = hm.calibrate_model(ticker, expiration_date)\n",
+        "print(f\"Optimized Heston parameters: v0={v0_opt}, theta={theta_opt}, kappa={kappa_opt}, sigma={sigma_opt}, rho={rho_opt}\")\n",
+        "\n",
+        "\n",
+        "# option price\n",
+        "h_price = hm.predict_option_price(strike_price, maturity_date, option_params['spot_price'], v0_opt, theta_opt, kappa_opt, sigma_opt, rho_opt)\n",
+        "print(\"The Heston model price for the option is:\", h_price)"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "1d61dfca"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Model Evaluation"
+      ],
+      "id": "75313272"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2_1__'></a>\n",
+        "\n",
+        "#### Benchmark Testing\n",
+        "The benchmark testing framework provides a robust way to validate the Heston model implementation and understand the relationships between European and American option prices under stochastic volatility conditions.\n",
+        "Let's compare European and American option prices using the Heston model."
+      ],
+      "id": "2e6471ef"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.BenchmarkTest\")\n",
+        "def benchmark_test(hm_model, strikes, maturity_date, spot_price, v0=None, theta=None, kappa=None, sigma=None, rho=None):\n",
+        "    \"\"\"\n",
+        "    Compares European and American option prices using the Heston model.\n",
+        "\n",
+        "    This test evaluates the price differences between European and American options\n",
+        "    across multiple strike prices while keeping other parameters constant. The comparison\n",
+        "    helps understand the early exercise premium of American options over their European\n",
+        "    counterparts under stochastic volatility conditions.\n",
+        "\n",
+        "    Args:\n",
+        "        hm_model: HestonModel instance for option pricing calculations\n",
+        "        strikes (list[float]): List of strike prices to test\n",
+        "        maturity_date (ql.Date): Option expiration date in QuantLib format\n",
+        "        spot_price (float): Current price of the underlying asset\n",
+        "        v0 (float, optional): Initial variance. Defaults to None.\n",
+        "        theta (float, optional): Long-term variance. Defaults to None.\n",
+        "        kappa (float, optional): Mean reversion rate. Defaults to None.\n",
+        "        sigma (float, optional): Volatility of variance. Defaults to None.\n",
+        "        rho (float, optional): Correlation between asset and variance. Defaults to None.\n",
+        "\n",
+        "    Returns:\n",
+        "        dict: Contains a DataFrame with the following columns:\n",
+        "            - Strike: Strike prices tested\n",
+        "            - Maturity date: Expiration date for all options\n",
+        "            - Spot price: Current underlying price\n",
+        "            - european model price: Prices for European options\n",
+        "            - american model price: Prices for American options\n",
+        "\"\"\"\n",
+        "    american_derived_prices = []\n",
+        "    european_derived_prices = []\n",
+        "    for K in strikes:\n",
+        "        european_derived_prices.append(hm_model.predict_option_price(K, maturity_date, spot_price, v0, theta, kappa, sigma, rho))\n",
+        "        american_derived_prices.append(hm_model.predict_american_option_price(K, maturity_date, spot_price, v0, theta, kappa, sigma, rho))\n",
+        "\n",
+        "    data = {\n",
+        "        \"Strike\": strikes,\n",
+        "        \"Maturity date\": [maturity_date] * len(strikes),\n",
+        "        \"Spot price\": [spot_price] * len(strikes),\n",
+        "        \"european model price\": european_derived_prices,\n",
+        "        \"american model price\": american_derived_prices,\n",
+        "\n",
+        "    }\n",
+        "    df1 = pd.DataFrame(data)\n",
+        "    return {\"strikes variation benchmarking\": df1}"
+      ],
+      "execution_count": 15,
+      "outputs": [],
+      "id": "810cf887"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.BenchmarkTest\",\n",
+        "    params={\n",
+        "        \"hm_model\": hm,\n",
+        "        \"strikes\": [400, 425, 460, 495, 520],\n",
+        "        \"maturity_date\": maturity_date,\n",
+        "        \"spot_price\": option_params['spot_price'],\n",
+        "        \"v0\":v0_opt,\n",
+        "        \"theta\": theta_opt,\n",
+        "        \"kappa\":kappa_opt ,\n",
+        "        \"sigma\": sigma_opt,\n",
+        "        \"rho\":rho_opt\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "3fdd6705"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2_2__'></a>\n",
+        "\n",
+        "#### Sensitivity Testing\n",
+        "The sensitivity testing framework provides a systematic approach to understanding how the Heston model responds to parameter changes, which is crucial for both model validation and practical application in trading and risk management."
+      ],
+      "id": "e359b503"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_test_provider.Sensitivity\")\n",
+        "def SensitivityTest(\n",
+        "    model,\n",
+        "    strike_price,\n",
+        "    maturity_date,\n",
+        "    spot_price,\n",
+        "    v0_opt,\n",
+        "    theta_opt,\n",
+        "    kappa_opt,\n",
+        "    sigma_opt,\n",
+        "    rho_opt,\n",
+        "):\n",
+        "    \"\"\"\n",
+        "    Evaluates the sensitivity of American option prices to changes in model parameters.\n",
+        "\n",
+        "    This test calculates option prices using the Heston model with optimized parameters.\n",
+        "    It's designed to analyze how changes in various model inputs affect the option price,\n",
+        "    which is crucial for understanding model behavior and risk management.\n",
+        "\n",
+        "    Args:\n",
+        "        model (HestonModel): Initialized Heston model instance wrapped in ValidMind model object\n",
+        "        strike_price (float): Strike price of the option\n",
+        "        maturity_date (ql.Date): Expiration date of the option in QuantLib format\n",
+        "        spot_price (float): Current price of the underlying asset\n",
+        "        v0_opt (float): Optimized initial variance parameter\n",
+        "        theta_opt (float): Optimized long-term variance parameter\n",
+        "        kappa_opt (float): Optimized mean reversion rate parameter\n",
+        "        sigma_opt (float): Optimized volatility of variance parameter\n",
+        "        rho_opt (float): Optimized correlation parameter between asset price and variance\n",
+        "    \"\"\"\n",
+        "    price = model.model.predict_american_option_price(\n",
+        "        strike_price,\n",
+        "        maturity_date,\n",
+        "        spot_price,\n",
+        "        v0_opt,\n",
+        "        theta_opt,\n",
+        "        kappa_opt,\n",
+        "        sigma_opt,\n",
+        "        rho_opt,\n",
+        "    )\n",
+        "\n",
+        "    return price\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "51922313"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Common plot function"
+      ],
+      "id": "408a05ef"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def plot_results(df, params: dict = None):\n",
+        "        fig2 =  plt.figure(figsize=(10, 6))\n",
+        "        plt.plot(df[params[\"x\"]], df[params[\"y\"]], label=params[\"label\"])\n",
+        "        plt.xlabel(params[\"xlabel\"])\n",
+        "        plt.ylabel(params[\"ylabel\"])\n",
+        "        \n",
+        "        plt.title(params[\"title\"])\n",
+        "        plt.legend()\n",
+        "        plt.grid(True)\n",
+        "        plt.show()  # display the plot"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "104ca6dd"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's create a ValidMind model object:"
+      ],
+      "id": "ca72b9e5"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "hm_model = vm.init_model(model=hm, input_id=\"HestonModel\")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "ae7093fa"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Strike sensitivity\n",
+        "Let's analyze how option prices change as the strike price varies. We create a range of strike prices around the current strike (460) and observe the impact on option prices while keeping all other parameters constant."
+      ],
+      "id": "b2141640"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_test_provider.Sensitivity:ToStrike\",\n",
+        "    inputs = {\n",
+        "        \"model\": hm_model\n",
+        "    },\n",
+        "    param_grid={\n",
+        "        \"strike_price\": list(np.linspace(460-50, 460+50, 10)),\n",
+        "        \"maturity_date\": [maturity_date],\n",
+        "        \"spot_price\": [option_params[\"spot_price\"]],\n",
+        "        \"v0_opt\": [v0_opt],\n",
+        "        \"theta_opt\": [theta_opt],\n",
+        "        \"kappa_opt\": [kappa_opt],\n",
+        "        \"sigma_opt\": [sigma_opt],\n",
+        "        \"rho_opt\":[rho_opt]\n",
+        "    },\n",
+        ")\n",
+        "result.log()\n",
+        "# Visualize how option prices change with different strike prices\n",
+        "plot_results(\n",
+        "    pd.DataFrame(result.tables[0].data),\n",
+        "    params={\n",
+        "        \"x\": \"strike_price\",\n",
+        "        \"y\":\"Value\",\n",
+        "        \"label\":\"Strike price\",\n",
+        "        \"xlabel\":\"Strike price\",\n",
+        "        \"ylabel\":\"option price\",\n",
+        "        \"title\":\"Heston option - Strike price Sensitivity\",\n",
+        "    }\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "ea7f1cbe"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2_3__'></a>\n",
+        "\n",
+        "#### Stress Testing\n",
+        "This stress testing framework provides a comprehensive view of how the Heston model behaves under different market conditions and helps identify potential risks in option pricing."
+      ],
+      "id": "be143012"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "@vm.test(\"my_custom_tests.Stressing\")\n",
+        "def StressTest(\n",
+        "    model,\n",
+        "    strike_price,\n",
+        "    maturity_date,\n",
+        "    spot_price,\n",
+        "    v0_opt,\n",
+        "    theta_opt,\n",
+        "    kappa_opt,\n",
+        "    sigma_opt,\n",
+        "    rho_opt,\n",
+        "):\n",
+        "    \"\"\"\n",
+        "    Performs stress testing on Heston model parameters to evaluate option price sensitivity.\n",
+        "\n",
+        "    This test evaluates how the American option price responds to stressed market conditions\n",
+        "    by varying key model parameters. It's designed to:\n",
+        "    1. Identify potential model vulnerabilities\n",
+        "    2. Understand price behavior under extreme scenarios\n",
+        "    3. Support risk management decisions\n",
+        "    4. Validate model stability across parameter ranges\n",
+        "\n",
+        "    Args:\n",
+        "        model (HestonModel): Initialized Heston model instance wrapped in ValidMind model object\n",
+        "        strike_price (float): Option strike price\n",
+        "        maturity_date (ql.Date): Option expiration date in QuantLib format\n",
+        "        spot_price (float): Current price of the underlying asset\n",
+        "        v0_opt (float): Initial variance parameter under stress testing\n",
+        "        theta_opt (float): Long-term variance parameter under stress testing\n",
+        "        kappa_opt (float): Mean reversion rate parameter under stress testing\n",
+        "        sigma_opt (float): Volatility of variance parameter under stress testing\n",
+        "        rho_opt (float): Correlation parameter under stress testing\n",
+        "    \"\"\"\n",
+        "    price = model.model.predict_american_option_price(\n",
+        "        strike_price,\n",
+        "        maturity_date,\n",
+        "        spot_price,\n",
+        "        v0_opt,\n",
+        "        theta_opt,\n",
+        "        kappa_opt,\n",
+        "        sigma_opt,\n",
+        "        rho_opt,\n",
+        "    )\n",
+        "\n",
+        "    return price\n"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "f2f01a40"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Rho (correlation) and Theta (long term vol) stress test\n",
+        "Next, let's evaluate the sensitivity of a model's output to changes in the correlation parameter (rho) and the long-term variance parameter (theta) within a stochastic volatility framework."
+      ],
+      "id": "31fcbe9c"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheRhoAndThetaParameters\",\n",
+        "    inputs = {\n",
+        "        \"model\": hm_model,\n",
+        "    },\n",
+        "    param_grid={\n",
+        "        \"strike_price\": [460],\n",
+        "        \"maturity_date\": [maturity_date],\n",
+        "        \"spot_price\": [option_params[\"spot_price\"]],\n",
+        "        \"v0_opt\": [v0_opt],\n",
+        "        \"theta_opt\": list(np.linspace(0.1, theta_opt+0.4, 5)),\n",
+        "        \"kappa_opt\": [kappa_opt],\n",
+        "        \"sigma_opt\": [sigma_opt],\n",
+        "        \"rho_opt\":list(np.linspace(rho_opt-0.2, rho_opt+0.2, 5))\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "6119b5d9"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Sigma stress test\n",
+        "Let's evaluate the sensitivity of a model's output to changes in the volatility parameter, sigma. This test is crucial for understanding how variations in market volatility impact the model's valuation of financial instruments, particularly options."
+      ],
+      "id": "be39cb3a"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheSigmaParameter\",\n",
+        "    inputs = {\n",
+        "        \"model\": hm_model,\n",
+        "    },\n",
+        "    param_grid={\n",
+        "        \"strike_price\": [460],\n",
+        "        \"maturity_date\": [maturity_date],\n",
+        "        \"spot_price\": [option_params[\"spot_price\"]],\n",
+        "        \"v0_opt\": [v0_opt],\n",
+        "        \"theta_opt\": [theta_opt],\n",
+        "        \"kappa_opt\": [kappa_opt],\n",
+        "        \"sigma_opt\": list(np.linspace(0.1, sigma_opt+0.6, 5)),\n",
+        "        \"rho_opt\": [rho_opt]\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "0dc189b7"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Stress kappa\n",
+        "Let's evaluate the sensitivity of a model's output to changes in the kappa parameter, which is the mean reversion rate in stochastic volatility models."
+      ],
+      "id": "173a5294"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheKappaParameter\",\n",
+        "    inputs = {\n",
+        "        \"model\": hm_model,\n",
+        "    },\n",
+        "    param_grid={\n",
+        "        \"strike_price\": [460],\n",
+        "        \"maturity_date\": [maturity_date],\n",
+        "        \"spot_price\": [option_params[\"spot_price\"]],\n",
+        "        \"v0_opt\": [v0_opt],\n",
+        "        \"theta_opt\": [theta_opt],\n",
+        "        \"kappa_opt\": list(np.linspace(kappa_opt, kappa_opt+0.2, 5)),\n",
+        "        \"sigma_opt\": [sigma_opt],\n",
+        "        \"rho_opt\": [rho_opt]\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "dae9714f"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Stress theta\n",
+        "Let's evaluate the sensitivity of a model's output to changes in the parameter theta, which represents the long-term variance in a stochastic volatility model."
+      ],
+      "id": "b4d1d968"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheThetaParameter\",\n",
+        "    inputs = {\n",
+        "        \"model\": hm_model,\n",
+        "    },\n",
+        "    param_grid={\n",
+        "        \"strike_price\": [460],\n",
+        "        \"maturity_date\": [maturity_date],\n",
+        "        \"spot_price\": [option_params[\"spot_price\"]],\n",
+        "        \"v0_opt\": [v0_opt],\n",
+        "        \"theta_opt\": list(np.linspace(0.1, theta_opt+0.9, 5)),\n",
+        "        \"kappa_opt\": [kappa_opt],\n",
+        "        \"sigma_opt\": [sigma_opt],\n",
+        "        \"rho_opt\": [rho_opt]\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "e68df3db"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "##### Stress rho\n",
+        "Let's evaluate the sensitivity of a model's output to changes in the correlation parameter, rho, within a stochastic volatility (SV) model framework. This test is crucial for understanding how variations in rho, which represents the correlation between the asset price and its volatility, impact the model's valuation output."
+      ],
+      "id": "32e70456"
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_test(\n",
+        "    \"my_custom_tests.Stressing:TheRhoParameter\",\n",
+        "    inputs = {\n",
+        "        \"model\": hm_model,\n",
+        "    },\n",
+        "    param_grid={\n",
+        "        \"strike_price\": [460],\n",
+        "        \"maturity_date\": [maturity_date],\n",
+        "        \"spot_price\": [option_params[\"spot_price\"]],\n",
+        "        \"v0_opt\": [v0_opt],\n",
+        "        \"theta_opt\": [theta_opt],\n",
+        "        \"kappa_opt\": [kappa_opt],\n",
+        "        \"sigma_opt\": [sigma_opt],\n",
+        "        \"rho_opt\": list(np.linspace(rho_opt-0.2, rho_opt+0.2, 5))\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": [],
+      "id": "b5ca3fc2"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ],
+      "id": "892c5347"
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-de5d1e182b09403abddabc2850f2dd05"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "validmind-1QuffXMV-py3.10",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.14"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 5
 }
diff --git a/site/notebooks/use_cases/code_explainer/customer_churn_full_suite.py b/site/notebooks/use_cases/code_explainer/customer_churn_full_suite.py
index 3f7c828092..ce052801d9 100644
--- a/site/notebooks/use_cases/code_explainer/customer_churn_full_suite.py
+++ b/site/notebooks/use_cases/code_explainer/customer_churn_full_suite.py
@@ -3,7 +3,7 @@
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
 
 """
-Quickstart for model documentation
+Quickstart for documentation
 
 Welcome! Let's get you started with the basic process of documenting models with ValidMind.
 
diff --git a/site/notebooks/use_cases/code_explainer/quickstart_code_explainer_demo.ipynb b/site/notebooks/use_cases/code_explainer/quickstart_code_explainer_demo.ipynb
index b1d91a6572..4f912501fe 100644
--- a/site/notebooks/use_cases/code_explainer/quickstart_code_explainer_demo.ipynb
+++ b/site/notebooks/use_cases/code_explainer/quickstart_code_explainer_demo.ipynb
@@ -1,876 +1,888 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Quickstart for model code documentation\n",
-    "\n",
-    "Welcome! This notebook demonstrates how to use the ValidMind code explainer to automatically generate comprehensive documentation for your codebase. The code explainer analyzes your source code and provides detailed explanations across various aspects of your implementation.\n",
-    "\n",
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About Code Explainer\n",
-    "The ValidMind code explainer is a powerful tool that automatically analyzes your source code and generates comprehensive documentation. It helps you:\n",
-    "\n",
-    "- Understand the structure and organization of your codebase\n",
-    "- Document dependencies and environment setup\n",
-    "- Explain data processing and model implementation details\n",
-    "- Document training, evaluation, and inference pipelines\n",
-    "- Track configuration, testing, and security measures\n",
-    "\n",
-    "This tool is particularly useful for:\n",
-    "- Onboarding new team members\n",
-    "- Maintaining up-to-date documentation\n",
-    "- Ensuring code quality and best practices\n",
-    "- Facilitating code reviews and audits"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About Code Explainer](#toc1__)    \n",
-    "- [About ValidMind](#toc2__)    \n",
-    "  - [Before you begin](#toc2_1__)    \n",
-    "  - [New to ValidMind?](#toc2_2__)    \n",
-    "  - [Key concepts](#toc2_3__)    \n",
-    "- [Setting up](#toc3__)    \n",
-    "  - [Install the ValidMind Library](#toc3_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc3_2__)    \n",
-    "    - [Register sample model](#toc3_2_1__)    \n",
-    "    - [Apply documentation template](#toc3_2_2__)    \n",
-    "    - [Get your code snippet](#toc3_2_3__)    \n",
-    "  - [Preview the documentation template](#toc3_3__)    \n",
-    "- [Common function](#toc4__)    \n",
-    "- [Default Behavior](#toc5__)    \n",
-    "- [Codebase Overview](#toc6__)    \n",
-    "- [Environment and Dependencies ('environment_setup')](#toc7__)    \n",
-    "- [Data Ingestion and Preprocessing](#toc8__)    \n",
-    "- [Model Implementation Details](#toc9__)    \n",
-    "- [Model Training Pipeline](#toc10__)    \n",
-    "- [Evaluation and Validation Code](#toc11__)    \n",
-    "- [Inference and Scoring Logic](#toc12__)    \n",
-    "- [Configuration and Parameters](#toc13__)    \n",
-    "- [Unit and Integration Testing](#toc14__)    \n",
-    "- [Logging and Monitoring Hooks](#toc15__)    \n",
-    "- [Code and Model Versioning](#toc16__)    \n",
-    "- [Security and Access Control](#toc17__)    \n",
-    "- [Example Runs and Scripts](#toc18__)    \n",
-    "- [Known Issues and Future Improvements](#toc19__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Model Source Code Documentation`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Can't select this template?</b></span>\n",
-    "<br></br>\n",
-    "Your organization administrators may need to add it to your template library:\n",
-    "<ul>\n",
-    "<li><a href=\"model_source_code_documentation_template.yaml\" style=\"color: #DE257E;\"><b>Download Template YAML</b></a></li>\n",
-    "<li><a href=\"https://docs.validmind.ai/guide/templates/customize-document-templates.html\" style=\"color: #DE257E;\"><b>Customize Document Templates</b></a></li>\n",
-    "</ul>\n",
-    "</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Common function\n",
-    "The code above defines two key functions:\n",
-    "1. A function to read source code from 'customer_churn_full_suite.py' file\n",
-    "2. An 'explain_code' function that uses ValidMind's experimental agents to analyze and explain code."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "source_code=\"\"\n",
-    "with open(\"customer_churn_full_suite.py\", \"r\") as f:\n",
-    "    source_code = f.read()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "The `vm.experimental.agents.run_task` function is used to execute AI agent tasks.\n",
-    "\n",
-    "It requires:\n",
-    "- task: The type of task to run (e.g. `code_explainer`)\n",
-    "- input: A dictionary containing task-specific parameters\n",
-    "   - For `code_explainer`, this includes:\n",
-    "      - **source_code** (str): The code to be analyzed\n",
-    "      - **user_instructions** (str): Instructions for how to analyze the code"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def explain_code(content_id: str, user_instructions: str):\n",
-    "    \"\"\"Run code explanation task and log the results.\n",
-    "    By default, the code explainer includes sections for:\n",
-    "    - Main Purpose and Overall Functionality\n",
-    "    - Breakdown of Key Functions or Components\n",
-    "    - Potential Risks or Failure Points  \n",
-    "    - Assumptions or Limitations\n",
-    "    If you want default sections, specify user_instructions as an empty string.\n",
-    "    \n",
-    "    Args:\n",
-    "        user_instructions (str): Instructions for how to analyze the code\n",
-    "        content_id (str): ID to use when logging the results\n",
-    "    \n",
-    "    Returns:\n",
-    "        The result object from running the code explanation task\n",
-    "    \"\"\"\n",
-    "    result = vm.experimental.agents.run_task(\n",
-    "        task=\"code_explainer\",\n",
-    "        input={\n",
-    "            \"source_code\": source_code,\n",
-    "            \"user_instructions\": user_instructions\n",
-    "        }\n",
-    "    )\n",
-    "    result.log(content_id=content_id)\n",
-    "    return result"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='defaultBehavior'></a>\n",
-    "\n",
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Default Behavior"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "By default, the code explainer includes sections for:\n",
-    "- Main Purpose and Overall Functionality\n",
-    "- Breakdown of Key Functions or Components\n",
-    "- Potential Risks or Failure Points  \n",
-    "- Assumptions or Limitations\n",
-    "\n",
-    "If you want default sections, specify `user_instructions` as an empty string. For example:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.experimental.agents.run_task(\n",
-    "    task=\"code_explainer\",\n",
-    "    input={\n",
-    "        \"source_code\": source_code,\n",
-    "        \"user_instructions\": \"\"\n",
-    "    }\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='overview'></a>\n",
-    "\n",
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Codebase Overview\n",
-    "\n",
-    "Let's analyze your codebase structure to understand the main modules, components, entry points and their relationships. We'll also examine the technology stack and frameworks that are being utilized in the implementation."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "        Please provide a summary of the following bullet points only.\n",
-    "        - Describe the overall structure of the source code repository.\n",
-    "        - Identify main modules, folders, and scripts.\n",
-    "        - Highlight entry points for training, inference, and evaluation.\n",
-    "        - State the main programming languages and frameworks used.\n",
-    "        \"\"\",\n",
-    "    content_id=\"code_structure_summary\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\",\n",
-    "    content_id=\"code_structure_summary\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='environment'></a>\n",
-    "\n",
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Environment and Dependencies ('environment_setup')\n",
-    "Let's document the technical requirements and setup needed to run your code, including Python packages, system dependencies, and environment configuration files. Understanding these requirements is essential for proper development environment setup and consistent deployments across different environments."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "    - List Python packages and system dependencies (OS, compilers, etc.).\n",
-    "    - Reference environment files (requirements.txt, environment.yml, Dockerfile).\n",
-    "    - Include setup instructions using Conda, virtualenv, or containers.\n",
-    "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"setup_instructions\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='data'></a>\n",
-    "\n",
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Data Ingestion and Preprocessing\n",
-    "Let's document how your code handles data, including data sources, validation procedures, and preprocessing steps. We'll examine the data pipeline architecture, covering everything from initial data loading through feature engineering and quality checks."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "    - Specify data input formats and sources.\n",
-    "    - Document ingestion, validation, and transformation logic.\n",
-    "    - Explain how raw data is preprocessed and features are generated.\n",
-    "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.    \"\"\",\n",
-    "    content_id=\"data_handling_notes\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='model'> </a>\n",
-    "\n",
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## Model Implementation Details\n",
-    "Let's document the core implementation details of your model, including its architecture, components, and key algorithms. Understanding the technical implementation is crucial for maintenance, debugging, and future improvements to the codebase. We'll examine how theoretical concepts are translated into working code."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "    - Describe the core model code structure (classes, functions).\n",
-    "    - Link code to theoretical models or equations when applicable.\n",
-    "    - Note custom components like loss functions or feature selectors.\n",
-    "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"model_code_description\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='training'></a>\n",
-    "\n",
-    "<a id='toc10__'></a>\n",
-    "\n",
-    "## Model Training Pipeline\n",
-    "\n",
-    "Let's document the training pipeline implementation, including how models are trained, optimized and evaluated. We'll examine the training process workflow, hyperparameter tuning approach, and model checkpointing mechanisms. This section provides insights into how the model learns from data and achieves optimal performance."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "    - Explain the training process, optimization strategy, and hyperparameters.\n",
-    "    - Describe logging, checkpointing, and early stopping mechanisms.\n",
-    "    - Include references to training config files or tuning logic.\n",
-    "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"training_logic_details\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='evaluation'></a>\n",
-    "\n",
-    "<a id='toc11__'></a>\n",
-    "\n",
-    "## Evaluation and Validation Code\n",
-    "Let's examine how the model's validation and evaluation code is implemented, including the metrics calculation and validation processes. We'll explore the diagnostic tools and visualization methods used to assess model performance. This section will also cover how validation results are logged and stored for future reference."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "    - Describe how validation is implemented and metrics are calculated.\n",
-    "    - Include plots and diagnostic tools (e.g., ROC, SHAP, confusion matrix).\n",
-    "    - State how outputs are logged and persisted.\n",
-    "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"evaluation_logic_notes\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='inference'></a>\n",
-    "\n",
-    "<a id='toc12__'></a>\n",
-    "\n",
-    "## Inference and Scoring Logic\n",
-    "Let's examine how the model performs inference and scoring on new data. This section will cover the implementation details of loading trained models, making predictions, and any required pre/post-processing steps. We'll also look at the APIs and interfaces available for both real-time serving and batch scoring scenarios."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "    - Detail how the trained model is loaded and used for predictions.\n",
-    "    - Explain I/O formats and APIs for serving or batch scoring.\n",
-    "    - Include any preprocessing/postprocessing logic required.\n",
-    "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"inference_mechanism\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='config'></a>\n",
-    "\n",
-    "<a id='toc13__'></a>\n",
-    "\n",
-    "## Configuration and Parameters\n",
-    "Let's explore how configuration and parameters are managed in the codebase. We'll examine the configuration files, command-line arguments, environment variables, and other mechanisms used to control model behavior. This section will also cover parameter versioning and how different configurations are tracked across model iterations."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "    - Describe configuration management (files, CLI args, env vars).\n",
-    "    - Highlight default parameters and override mechanisms.\n",
-    "    - Reference versioning practices for config files.\n",
-    "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"config_control_notes\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='testing'></a>\n",
-    "\n",
-    "<a id='toc14__'></a>\n",
-    "\n",
-    "## Unit and Integration Testing\n",
-    "Let's examine the testing strategy and implementation in the codebase. We'll analyze the unit tests, integration tests, and testing frameworks used to ensure code quality and reliability. This section will also cover test coverage metrics and continuous integration practices."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "    - List unit and integration tests and what they cover.\n",
-    "    - Mention testing frameworks and coverage tools used.\n",
-    "    - Explain testing strategy for production-readiness.\n",
-    "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"test_strategy_overview\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='logging'></a>\n",
-    "\n",
-    "<a id='toc15__'></a>\n",
-    "\n",
-    "## Logging and Monitoring Hooks\n",
-    "Let's analyze how logging and monitoring are implemented in the codebase. We'll examine the logging configuration, monitoring hooks, and key metrics being tracked. This section will also cover any real-time observability integrations and alerting mechanisms in place."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "    - Describe logging configuration and structure.\n",
-    "    - Highlight real-time monitoring or observability integrations.\n",
-    "    - List key events, metrics, or alerts tracked.\n",
-    "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"logging_monitoring_notes\"\n",
-    ")\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='versioning'></a>\n",
-    "\n",
-    "<a id='toc16__'></a>\n",
-    "\n",
-    "## Code and Model Versioning\n",
-    "Let's examine how code and model versioning is managed in the codebase. This section will cover version control practices, including Git workflows and model artifact versioning tools like DVC or MLflow. We'll also look at how versioning integrates with the CI/CD pipeline."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "      - Describe Git usage, branching, tagging, and commit standards.\n",
-    "      - Include model artifact versioning practices (e.g., DVC, MLflow).\n",
-    "      - Reference any automation in CI/CD.\n",
-    "    Please remove the following sections: \n",
-    "      - Potential Risks or Failure Points\n",
-    "      - Assumptions or Limitations\n",
-    "      - Breakdown of Key Functions or Components\n",
-    "    Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"version_tracking_description\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='security'></a>\n",
-    "\n",
-    "<a id='toc17__'></a>\n",
-    "\n",
-    "## Security and Access Control\n",
-    "Let's analyze the security and access control measures implemented in the codebase. We'll examine how sensitive data and code are protected through access controls, encryption, and compliance measures. Additionally, we'll review secure deployment practices and any specific handling of PII data."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "      - Document access controls for source code and data.\n",
-    "      - Include any encryption, PII handling, or compliance measures.\n",
-    "      - Mention secure deployment practices.\n",
-    "    Please remove the following sections: \n",
-    "      - Potential Risks or Failure Points\n",
-    "      - Assumptions or Limitations\n",
-    "      - Breakdown of Key Functions or Components\n",
-    "    Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"security_policies_notes\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='examples'></a>\n",
-    "\n",
-    "<a id='toc18__'></a>\n",
-    "\n",
-    "## Example Runs and Scripts\n",
-    "Let's explore example runs and scripts that demonstrate how to use this codebase in practice. We'll look at working examples, command-line usage, and sample notebooks that showcase the core functionality. This section will also point to demo datasets and test scenarios that can help new users get started quickly."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "      - Provide working script examples.\n",
-    "      - Include CLI usage instructions or sample notebooks.\n",
-    "      - Link to demo datasets or test scenarios.\n",
-    "    Please remove the following sections: \n",
-    "      - Potential Risks or Failure Points\n",
-    "      - Assumptions or Limitations\n",
-    "      - Breakdown of Key Functions or Components\n",
-    "    Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"runnable_examples\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='issues'></a>\n",
-    "\n",
-    "<a id='toc19__'></a>\n",
-    "\n",
-    "## Known Issues and Future Improvements\n",
-    "Let's examine the current limitations and areas for improvement in the codebase. This section will document known technical debt, bugs, and feature gaps that need to be addressed. We'll also outline proposed enhancements and reference any existing tickets or GitHub issues tracking these improvements."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = explain_code(\n",
-    "    user_instructions=\"\"\"\n",
-    "    Please provide a summary of the following bullet points only.\n",
-    "      - List current limitations or technical debt.\n",
-    "      - Outline proposed enhancements or refactors.\n",
-    "      - Reference relevant tickets, GitHub issues, or roadmap items.\n",
-    "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
-    "    \"\"\",\n",
-    "    content_id=\"issues_and_improvements_log\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-72ed6e2a48984af3aca5888b96d1f6b6",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "validmind-1QuffXMV-py3.11",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.11.9"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 4
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Quickstart for model code documentation\n",
+        "\n",
+        "Welcome! This notebook demonstrates how to use the ValidMind code explainer to automatically generate comprehensive documentation for your codebase. The code explainer analyzes your source code and provides detailed explanations across various aspects of your implementation.\n",
+        "\n",
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About Code Explainer\n",
+        "The ValidMind code explainer is a powerful tool that automatically analyzes your source code and generates comprehensive documentation. It helps you:\n",
+        "\n",
+        "- Understand the structure and organization of your codebase\n",
+        "- Document dependencies and environment setup\n",
+        "- Explain data processing and model implementation details\n",
+        "- Document training, evaluation, and inference pipelines\n",
+        "- Track configuration, testing, and security measures\n",
+        "\n",
+        "This tool is particularly useful for:\n",
+        "- Onboarding new team members\n",
+        "- Maintaining up-to-date documentation\n",
+        "- Ensuring code quality and best practices\n",
+        "- Facilitating code reviews and audits"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About Code Explainer](#toc1__)    \n",
+        "- [About ValidMind](#toc2__)    \n",
+        "  - [Before you begin](#toc2_1__)    \n",
+        "  - [New to ValidMind?](#toc2_2__)    \n",
+        "  - [Key concepts](#toc2_3__)    \n",
+        "- [Setting up](#toc3__)    \n",
+        "  - [Install the ValidMind Library](#toc3_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc3_2__)    \n",
+        "    - [Register sample model](#toc3_2_1__)    \n",
+        "    - [Apply documentation template](#toc3_2_2__)    \n",
+        "    - [Get your code snippet](#toc3_2_3__)    \n",
+        "  - [Preview the documentation template](#toc3_3__)    \n",
+        "- [Common function](#toc4__)    \n",
+        "- [Default Behavior](#toc5__)    \n",
+        "- [Codebase Overview](#toc6__)    \n",
+        "- [Environment and Dependencies ('environment_setup')](#toc7__)    \n",
+        "- [Data Ingestion and Preprocessing](#toc8__)    \n",
+        "- [Model Implementation Details](#toc9__)    \n",
+        "- [Model Training Pipeline](#toc10__)    \n",
+        "- [Evaluation and Validation Code](#toc11__)    \n",
+        "- [Inference and Scoring Logic](#toc12__)    \n",
+        "- [Configuration and Parameters](#toc13__)    \n",
+        "- [Unit and Integration Testing](#toc14__)    \n",
+        "- [Logging and Monitoring Hooks](#toc15__)    \n",
+        "- [Code and Model Versioning](#toc16__)    \n",
+        "- [Security and Access Control](#toc17__)    \n",
+        "- [Example Runs and Scripts](#toc18__)    \n",
+        "- [Known Issues and Future Improvements](#toc19__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Model Source Code Documentation`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Can't select this template?</b></span>\n",
+        "<br></br>\n",
+        "Your organization administrators may need to add it to your template library:\n",
+        "<ul>\n",
+        "<li><a href=\"model_source_code_documentation_template.yaml\" style=\"color: #DE257E;\"><b>Download Template YAML</b></a></li>\n",
+        "<li><a href=\"https://docs.validmind.ai/guide/templates/customize-document-templates.html\" style=\"color: #DE257E;\"><b>Customize Document Templates</b></a></li>\n",
+        "</ul>\n",
+        "</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Common function\n",
+        "The code cells below do two things:\n",
+        "1. Read the source code from the `customer_churn_full_suite.py` file into a `source_code` variable\n",
+        "2. Define an `explain_code` function that uses ValidMind's experimental agents to analyze and explain code."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "source_code=\"\"\n",
+        "with open(\"customer_churn_full_suite.py\", \"r\") as f:\n",
+        "    source_code = f.read()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "The `vm.experimental.agents.run_task` function is used to execute AI agent tasks.\n",
+        "\n",
+        "It requires:\n",
+        "- task: The type of task to run (e.g. `code_explainer`)\n",
+        "- input: A dictionary containing task-specific parameters\n",
+        "   - For `code_explainer`, this includes:\n",
+        "      - **source_code** (str): The code to be analyzed\n",
+        "      - **user_instructions** (str): Instructions for how to analyze the code"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def explain_code(content_id: str, user_instructions: str):\n",
+        "    \"\"\"Run code explanation task and log the results.\n",
+        "    By default, the code explainer includes sections for:\n",
+        "    - Main Purpose and Overall Functionality\n",
+        "    - Breakdown of Key Functions or Components\n",
+        "    - Potential Risks or Failure Points  \n",
+        "    - Assumptions or Limitations\n",
+        "    If you want default sections, specify user_instructions as an empty string.\n",
+        "    \n",
+        "    Args:\n",
+        "        user_instructions (str): Instructions for how to analyze the code\n",
+        "        content_id (str): ID to use when logging the results\n",
+        "    \n",
+        "    Returns:\n",
+        "        The result object from running the code explanation task\n",
+        "    \"\"\"\n",
+        "    result = vm.experimental.agents.run_task(\n",
+        "        task=\"code_explainer\",\n",
+        "        input={\n",
+        "            \"source_code\": source_code,\n",
+        "            \"user_instructions\": user_instructions\n",
+        "        }\n",
+        "    )\n",
+        "    result.log(content_id=content_id)\n",
+        "    return result"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='defaultBehavior'></a>\n",
+        "\n",
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Default Behavior"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "By default, the code explainer includes sections for:\n",
+        "- Main Purpose and Overall Functionality\n",
+        "- Breakdown of Key Functions or Components\n",
+        "- Potential Risks or Failure Points  \n",
+        "- Assumptions or Limitations\n",
+        "\n",
+        "If you want default sections, specify `user_instructions` as an empty string. For example:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = vm.experimental.agents.run_task(\n",
+        "    task=\"code_explainer\",\n",
+        "    input={\n",
+        "        \"source_code\": source_code,\n",
+        "        \"user_instructions\": \"\"\n",
+        "    }\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='overview'></a>\n",
+        "\n",
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Codebase Overview\n",
+        "\n",
+        "Let's analyze your codebase structure to understand the main modules, components, entry points and their relationships. We'll also examine the technology stack and frameworks that are being utilized in the implementation."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "        Please provide a summary of the following bullet points only.\n",
+        "        - Describe the overall structure of the source code repository.\n",
+        "        - Identify main modules, folders, and scripts.\n",
+        "        - Highlight entry points for training, inference, and evaluation.\n",
+        "        - State the main programming languages and frameworks used.\n",
+        "        \"\"\",\n",
+        "    content_id=\"code_structure_summary\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\",\n",
+        "    content_id=\"code_structure_summary\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='environment'></a>\n",
+        "\n",
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Environment and Dependencies ('environment_setup')\n",
+        "Let's document the technical requirements and setup needed to run your code, including Python packages, system dependencies, and environment configuration files. Understanding these requirements is essential for proper development environment setup and consistent deployments across different environments."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "    - List Python packages and system dependencies (OS, compilers, etc.).\n",
+        "    - Reference environment files (requirements.txt, environment.yml, Dockerfile).\n",
+        "    - Include setup instructions using Conda, virtualenv, or containers.\n",
+        "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"setup_instructions\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='data'></a>\n",
+        "\n",
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Data Ingestion and Preprocessing\n",
+        "Let's document how your code handles data, including data sources, validation procedures, and preprocessing steps. We'll examine the data pipeline architecture, covering everything from initial data loading through feature engineering and quality checks."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "    - Specify data input formats and sources.\n",
+        "    - Document ingestion, validation, and transformation logic.\n",
+        "    - Explain how raw data is preprocessed and features are generated.\n",
+        "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.    \"\"\",\n",
+        "    content_id=\"data_handling_notes\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='model'></a>\n",
+        "\n",
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Model Implementation Details\n",
+        "Let's document the core implementation details of your model, including its architecture, components, and key algorithms. Understanding the technical implementation is crucial for maintenance, debugging, and future improvements to the codebase. We'll examine how theoretical concepts are translated into working code."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "    - Describe the core model code structure (classes, functions).\n",
+        "    - Link code to theoretical models or equations when applicable.\n",
+        "    - Note custom components like loss functions or feature selectors.\n",
+        "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"model_code_description\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='training'></a>\n",
+        "\n",
+        "<a id='toc10__'></a>\n",
+        "\n",
+        "## Model Training Pipeline\n",
+        "\n",
+        "Let's document the training pipeline implementation, including how models are trained, optimized and evaluated. We'll examine the training process workflow, hyperparameter tuning approach, and model checkpointing mechanisms. This section provides insights into how the model learns from data and achieves optimal performance."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "    - Explain the training process, optimization strategy, and hyperparameters.\n",
+        "    - Describe logging, checkpointing, and early stopping mechanisms.\n",
+        "    - Include references to training config files or tuning logic.\n",
+        "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"training_logic_details\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='evaluation'></a>\n",
+        "\n",
+        "<a id='toc11__'></a>\n",
+        "\n",
+        "## Evaluation and Validation Code\n",
+        "Let's examine how the model's validation and evaluation code is implemented, including the metrics calculation and validation processes. We'll explore the diagnostic tools and visualization methods used to assess model performance. This section will also cover how validation results are logged and stored for future reference."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "    - Describe how validation is implemented and metrics are calculated.\n",
+        "    - Include plots and diagnostic tools (e.g., ROC, SHAP, confusion matrix).\n",
+        "    - State how outputs are logged and persisted.\n",
+        "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"evaluation_logic_notes\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='inference'></a>\n",
+        "\n",
+        "<a id='toc12__'></a>\n",
+        "\n",
+        "## Inference and Scoring Logic\n",
+        "Let's examine how the model performs inference and scoring on new data. This section will cover the implementation details of loading trained models, making predictions, and any required pre/post-processing steps. We'll also look at the APIs and interfaces available for both real-time serving and batch scoring scenarios."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "    - Detail how the trained model is loaded and used for predictions.\n",
+        "    - Explain I/O formats and APIs for serving or batch scoring.\n",
+        "    - Include any preprocessing/postprocessing logic required.\n",
+        "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"inference_mechanism\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='config'></a>\n",
+        "\n",
+        "<a id='toc13__'></a>\n",
+        "\n",
+        "## Configuration and Parameters\n",
+        "Let's explore how configuration and parameters are managed in the codebase. We'll examine the configuration files, command-line arguments, environment variables, and other mechanisms used to control model behavior. This section will also cover parameter versioning and how different configurations are tracked across model iterations."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "    - Describe configuration management (files, CLI args, env vars).\n",
+        "    - Highlight default parameters and override mechanisms.\n",
+        "    - Reference versioning practices for config files.\n",
+        "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"config_control_notes\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='testing'></a>\n",
+        "\n",
+        "<a id='toc14__'></a>\n",
+        "\n",
+        "## Unit and Integration Testing\n",
+        "Let's examine the testing strategy and implementation in the codebase. We'll analyze the unit tests, integration tests, and testing frameworks used to ensure code quality and reliability. This section will also cover test coverage metrics and continuous integration practices."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "    - List unit and integration tests and what they cover.\n",
+        "    - Mention testing frameworks and coverage tools used.\n",
+        "    - Explain testing strategy for production-readiness.\n",
+        "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"test_strategy_overview\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='logging'></a>\n",
+        "\n",
+        "<a id='toc15__'></a>\n",
+        "\n",
+        "## Logging and Monitoring Hooks\n",
+        "Let's analyze how logging and monitoring are implemented in the codebase. We'll examine the logging configuration, monitoring hooks, and key metrics being tracked. This section will also cover any real-time observability integrations and alerting mechanisms in place."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "    - Describe logging configuration and structure.\n",
+        "    - Highlight real-time monitoring or observability integrations.\n",
+        "    - List key events, metrics, or alerts tracked.\n",
+        "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"logging_monitoring_notes\"\n",
+        ")\n"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='versioning'></a>\n",
+        "\n",
+        "<a id='toc16__'></a>\n",
+        "\n",
+        "## Code and Model Versioning\n",
+        "Let's examine how code and model versioning is managed in the codebase. This section will cover version control practices, including Git workflows and model artifact versioning tools like DVC or MLflow. We'll also look at how versioning integrates with the CI/CD pipeline."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "      - Describe Git usage, branching, tagging, and commit standards.\n",
+        "      - Include model artifact versioning practices (e.g., DVC, MLflow).\n",
+        "      - Reference any automation in CI/CD.\n",
+        "    Please remove the following sections: \n",
+        "      - Potential Risks or Failure Points\n",
+        "      - Assumptions or Limitations\n",
+        "      - Breakdown of Key Functions or Components\n",
+        "    Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"version_tracking_description\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='security'></a>\n",
+        "\n",
+        "<a id='toc17__'></a>\n",
+        "\n",
+        "## Security and Access Control\n",
+        "Let's analyze the security and access control measures implemented in the codebase. We'll examine how sensitive data and code are protected through access controls, encryption, and compliance measures. Additionally, we'll review secure deployment practices and any specific handling of PII data."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "      - Document access controls for source code and data.\n",
+        "      - Include any encryption, PII handling, or compliance measures.\n",
+        "      - Mention secure deployment practices.\n",
+        "    Please remove the following sections: \n",
+        "      - Potential Risks or Failure Points\n",
+        "      - Assumptions or Limitations\n",
+        "      - Breakdown of Key Functions or Components\n",
+        "    Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"security_policies_notes\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='examples'></a>\n",
+        "\n",
+        "<a id='toc18__'></a>\n",
+        "\n",
+        "## Example Runs and Scripts\n",
+        "Let's explore example runs and scripts that demonstrate how to use this codebase in practice. We'll look at working examples, command-line usage, and sample notebooks that showcase the core functionality. This section will also point to demo datasets and test scenarios that can help new users get started quickly."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "      - Provide working script examples.\n",
+        "      - Include CLI usage instructions or sample notebooks.\n",
+        "      - Link to demo datasets or test scenarios.\n",
+        "    Please remove the following sections: \n",
+        "      - Potential Risks or Failure Points\n",
+        "      - Assumptions or Limitations\n",
+        "      - Breakdown of Key Functions or Components\n",
+        "    Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"runnable_examples\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='issues'></a>\n",
+        "\n",
+        "<a id='toc19__'></a>\n",
+        "\n",
+        "## Known Issues and Future Improvements\n",
+        "Let's examine the current limitations and areas for improvement in the codebase. This section will document known technical debt, bugs, and feature gaps that need to be addressed. We'll also outline proposed enhancements and reference any existing tickets or GitHub issues tracking these improvements."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = explain_code(\n",
+        "    user_instructions=\"\"\"\n",
+        "    Please provide a summary of the following bullet points only.\n",
+        "      - List current limitations or technical debt.\n",
+        "      - Outline proposed enhancements or refactors.\n",
+        "      - Reference relevant tickets, GitHub issues, or roadmap items.\n",
+        "    Please remove Potential Risks or Failure Points and Assumptions or Limitations sections. Please don't add any other sections.\n",
+        "    \"\"\",\n",
+        "    content_id=\"issues_and_improvements_log\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-72ed6e2a48984af3aca5888b96d1f6b6"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "validmind-1QuffXMV-py3.11",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.11.9"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 4
 }
diff --git a/site/notebooks/use_cases/credit_risk/application_scorecard_executive.ipynb b/site/notebooks/use_cases/credit_risk/application_scorecard_executive.ipynb
index cd6e4f1a19..50f2f0202e 100644
--- a/site/notebooks/use_cases/credit_risk/application_scorecard_executive.ipynb
+++ b/site/notebooks/use_cases/credit_risk/application_scorecard_executive.ipynb
@@ -1,385 +1,397 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Document an application scorecard model\n",
-    "\n",
-    "Build and document an *application scorecard model* with the ValidMind Library by using Kaggle's [Lending Club](https://www.kaggle.com/datasets/devanshi23/loan-data-2007-2014/data) sample dataset to build a simple application scorecard.\n",
-    "\n",
-    "An application scorecard model is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant — such as credit history, income, employment status, and other relevant financial data. \n",
-    "\n",
-    "- This score helps lenders make decisions about whether to approve or reject loan applications, as well as determine the terms of the loan, including interest rates and credit limits. \n",
-    "- Application scorecard models enable lenders to manage risk efficiently while making the loan application process faster and more transparent for applicants.\n",
-    "\n",
-    "This interactive notebook provides a step-by-step guide for loading a demo dataset, preprocessing the raw data, training a model for testing, setting up test inputs, initializing the required ValidMind objects, running the test, and then logging the results to ValidMind."
-   ]
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Document an application scorecard model\n",
+        "\n",
+        "Build and document an *application scorecard model* with the ValidMind Library by using Kaggle's [Lending Club](https://www.kaggle.com/datasets/devanshi23/loan-data-2007-2014/data) sample dataset to build a simple application scorecard.\n",
+        "\n",
+        "An application scorecard model is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant — such as credit history, income, employment status, and other relevant financial data. \n",
+        "\n",
+        "- This score helps lenders make decisions about whether to approve or reject loan applications, as well as determine the terms of the loan, including interest rates and credit limits. \n",
+        "- Application scorecard models enable lenders to manage risk efficiently while making the loan application process faster and more transparent for applicants.\n",
+        "\n",
+        "This interactive notebook provides a step-by-step guide for loading a demo dataset, preprocessing the raw data, training a model for testing, setting up test inputs, initializing the required ValidMind objects, running the test, and then logging the results to ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "- [Document the model](#toc3__)    \n",
+        "- [Next steps](#toc4__)    \n",
+        "  - [Work with your documentation](#toc4_1__)    \n",
+        "  - [Discover more learning resources](#toc4_2__)    \n",
+        "- [Upgrade ValidMind](#toc5__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br><br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "  # api_host = \"...\",\n",
+        "  # api_key = \"...\",\n",
+        "  # api_secret = \"...\",\n",
+        "  # model = \"...\",\n",
+        "  document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Document the model"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.datasets.credit_risk import lending_club\n",
+        "from validmind.utils import preview_test_config\n",
+        "\n",
+        "scorecard = lending_club.load_scorecard()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "lending_club.init_vm_objects(scorecard)"
+      ],
+      "execution_count": 4,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test_config = lending_club.load_test_config(scorecard)\n",
+        "preview_test_config(test_config)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.run_documentation_tests(config=test_config)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "3. Expand the following sections and take a look around:\n",
+        "\n",
+        "   - **2. Data Preparation**\n",
+        "   - **3. Model Development**\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation (hint: some of the tests in **2.3. Feature Selection and Engineering** look like they need some attention), view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-382e83e3fe1d4928ae90c3917480d27d"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "validmind-eEL8LtKG-py3.10",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
+    }
   },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "- [Document the model](#toc3__)    \n",
-    "- [Next steps](#toc4__)    \n",
-    "  - [Work with your model documentation](#toc4_1__)    \n",
-    "  - [Discover more learning resources](#toc4_2__)    \n",
-    "- [Upgrade ValidMind](#toc5__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "- **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "- **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "- **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "- **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: The [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **[template]{.smallcaps}**, select `Credit Risk Scorecard`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "  # api_host = \"...\",\n",
-    "  # api_key = \"...\",\n",
-    "  # api_secret = \"...\",\n",
-    "  # model = \"...\",\n",
-    "  document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Document the model"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.credit_risk import lending_club\n",
-    "from validmind.utils import preview_test_config\n",
-    "\n",
-    "scorecard = lending_club.load_scorecard()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": 4,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "lending_club.init_vm_objects(scorecard)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test_config = lending_club.load_test_config(scorecard)\n",
-    "preview_test_config(test_config)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.run_documentation_tests(config=test_config)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "3. Expand the following sections and take a look around:\n",
-    "\n",
-    "   - **2. Data Preparation**\n",
-    "   - **3. Model Development**\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation (hint: some of the tests in **2.3. Feature Selection and Engineering** look like they need some attention), view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-382e83e3fe1d4928ae90c3917480d27d",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "validmind-eEL8LtKG-py3.10",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/use_cases/credit_risk/application_scorecard_full_suite.ipynb b/site/notebooks/use_cases/credit_risk/application_scorecard_full_suite.ipynb
index e8e567a5b4..2b857a03bc 100644
--- a/site/notebooks/use_cases/credit_risk/application_scorecard_full_suite.ipynb
+++ b/site/notebooks/use_cases/credit_risk/application_scorecard_full_suite.ipynb
@@ -1,905 +1,922 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Document an application scorecard model\n",
-    "\n",
-    "Build and document an *application scorecard model* with the ValidMind Library by using Kaggle's [Lending Club](https://www.kaggle.com/datasets/devanshi23/loan-data-2007-2014/data) sample dataset to build a simple application scorecard.\n",
-    "\n",
-    "An application scorecard model is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant — such as credit history, income, employment status, and other relevant financial data. \n",
-    "\n",
-    "- This score helps lenders make decisions about whether to approve or reject loan applications, as well as determine the terms of the loan, including interest rates and credit limits. \n",
-    "- Application scorecard models enable lenders to manage risk efficiently while making the loan application process faster and more transparent for applicants.\n",
-    "\n",
-    "This interactive notebook provides a step-by-step guide for loading a demo dataset, preprocessing the raw data, training a model for testing, setting up test inputs, initializing the required ValidMind objects, running the test, and then logging the results to ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_4__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "  - [Prepocess the dataset](#toc3_1__)    \n",
-    "  - [Feature engineering](#toc3_2__)    \n",
-    "- [Train the model](#toc4__)    \n",
-    "  - [Compute probabilities](#toc4_1__)    \n",
-    "  - [Compute binary predictions](#toc4_2__)    \n",
-    "- [Document the model](#toc5__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc5_1__)    \n",
-    "  - [Initialize a model object](#toc5_2__)    \n",
-    "  - [Assign prediction values and probabilities to the datasets](#toc5_3__)    \n",
-    "  - [Compute credit risk scores](#toc5_4__)    \n",
-    "  - [Adding custom context to the LLM descriptions](#toc5_5__)    \n",
-    "  - [Run the full suite of tests](#toc5_6__)    \n",
-    "- [Next steps](#toc6__)    \n",
-    "  - [Work with your model documentation](#toc6_1__)    \n",
-    "  - [Discover more learning resources](#toc6_2__)    \n",
-    "- [Upgrade ValidMind](#toc7__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "- **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "- **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "- **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "- **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: The [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "  # api_host = \"...\",\n",
-    "  # api_key = \"...\",\n",
-    "  # api_secret = \"...\",\n",
-    "  # model = \"...\",\n",
-    "  document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost as xgb\n",
-    "from sklearn.ensemble import RandomForestClassifier\n",
-    "\n",
-    "from validmind.datasets.credit_risk import lending_club\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library. To be able to use it, you'll need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "df = lending_club.load_data(source=\"offline\")\n",
-    "\n",
-    "df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Prepocess the dataset\n",
-    "\n",
-    "In the preprocessing step we perform a number of operations to get ready for building our application scorecard. \n",
-    "\n",
-    "We use the `lending_club.preprocess` to simplify preprocessing. This function performs the following operations: \n",
-    "- Filters the dataset to include only loans for debt consolidation or credit card purposes\n",
-    "- Removes loans classified under the riskier grades \"F\" and \"G\"\n",
-    "- Excludes uncommon home ownership types and standardizes employment length and loan terms into numerical formats\n",
-    "- Discards unnecessary fields and any entries with missing information to maintain a clean and robust dataset for modeling"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "preprocess_df = lending_club.preprocess(df)\n",
-    "preprocess_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Feature engineering\n",
-    "\n",
-    "In the feature engineering phase, we apply specific transformations to optimize the dataset for predictive modeling in our application scorecard. \n",
-    "\n",
-    "Using the `ending_club.feature_engineering()` function, we conduct the following operations:\n",
-    "- **WoE encoding**: Converts both numerical and categorical features into Weight of Evidence (WoE) values. WoE is a statistical measure used in scorecard modeling that quantifies the relationship between a predictor variable and the binary target variable. It calculates the ratio of the distribution of good outcomes to the distribution of bad outcomes for each category or bin of a feature. This transformation helps to ensure that the features are predictive and consistent in their contribution to the model.\n",
-    "- **Integration of WoE bins**: Ensures that the WoE transformed values are integrated throughout the dataset, replacing the original feature values while excluding the target variable from this transformation. This transformation is used to maintain a consistent scale and impact of each variable within the model, which helps make the predictions more stable and accurate."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "fe_df = lending_club.feature_engineering(preprocess_df)\n",
-    "fe_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Train the model\n",
-    "\n",
-    "In this section, we focus on constructing and refining our predictive model. \n",
-    "- We begin by dividing our data, which is based on Weight of Evidence (WoE) features, into training and testing sets (`train_df`, `test_df`). \n",
-    "- With `lending_club.split`, we employ a simple random split, randomly allocating data points to each set to ensure a mix of examples in both."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Split the data\n",
-    "train_df, test_df = lending_club.split(fe_df, test_size=0.2)\n",
-    "\n",
-    "x_train = train_df.drop(lending_club.target_column, axis=1)\n",
-    "y_train = train_df[lending_club.target_column]\n",
-    "\n",
-    "x_test = test_df.drop(lending_club.target_column, axis=1)\n",
-    "y_test = test_df[lending_club.target_column]"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Define the XGBoost model\n",
-    "xgb_model = xgb.XGBClassifier(\n",
-    "    n_estimators=50, \n",
-    "    random_state=42, \n",
-    "    early_stopping_rounds=10\n",
-    ")\n",
-    "xgb_model.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "\n",
-    "# Fit the model\n",
-    "xgb_model.fit(\n",
-    "    x_train, \n",
-    "    y_train,\n",
-    "    eval_set=[(x_test, y_test)],\n",
-    "    verbose=False\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Define the Random Forest model\n",
-    "rf_model = RandomForestClassifier(\n",
-    "    n_estimators=50, \n",
-    "    random_state=42,\n",
-    ")\n",
-    "\n",
-    "# Fit the model\n",
-    "rf_model.fit(x_train, y_train)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Compute probabilities"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_xgb_prob = xgb_model.predict_proba(x_train)[:, 1]\n",
-    "test_xgb_prob = xgb_model.predict_proba(x_test)[:, 1]\n",
-    "\n",
-    "train_rf_prob = rf_model.predict_proba(x_train)[:, 1]\n",
-    "test_rf_prob = rf_model.predict_proba(x_test)[:, 1]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Compute binary predictions"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "cut_off_threshold = 0.3\n",
-    "\n",
-    "train_xgb_binary_predictions = (train_xgb_prob > cut_off_threshold).astype(int)\n",
-    "test_xgb_binary_predictions = (test_xgb_prob > cut_off_threshold).astype(int)\n",
-    "\n",
-    "train_rf_binary_predictions = (train_rf_prob > cut_off_threshold).astype(int)\n",
-    "test_rf_binary_predictions = (test_rf_prob > cut_off_threshold).astype(int)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Document the model\n",
-    "\n",
-    "To document the model with the ValidMind Library, you'll need to:\n",
-    "1. Preprocess the raw dataset\n",
-    "2. Initialize some training and test datasets\n",
-    "3. Initialize a model object you can use for testing\n",
-    "4. Run the full suite of tests"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset`: The dataset that you want to provide as input to tests.\n",
-    "- `input_id`: A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- `target_column`: A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
-    "\n",
-    "With all datasets ready, you can now initialize the raw, processed, training and test datasets (`raw_df`, `preprocessed_df`, `fe_df`,  `train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_preprocess_dataset = vm.init_dataset(\n",
-    "    dataset=preprocess_df,\n",
-    "    input_id=\"preprocess_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_fe_dataset = vm.init_dataset(\n",
-    "    dataset=fe_df,\n",
-    "    input_id=\"fe_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    input_id=\"test_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Initialize a model object\n",
-    "\n",
-    "You will also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data. You simply intialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_xgb_model = vm.init_model(\n",
-    "    xgb_model,\n",
-    "    input_id=\"xgb_model\",\n",
-    ")\n",
-    "\n",
-    "vm_rf_model = vm.init_model(\n",
-    "    rf_model,\n",
-    "    input_id=\"rf_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_3__'></a>\n",
-    "\n",
-    "### Assign prediction values and probabilities to the datasets\n",
-    "\n",
-    "With our model now trained, we'll move on to assigning both the predictive probabilities coming directly from the model's predictions, and the binary prediction after applying the cutoff threshold described in the previous steps. \n",
-    "- These tasks are achieved through the use of the `assign_predictions()` method associated with the VM `dataset` object.\n",
-    "- This method links the model's class prediction values and probabilities to our VM train and test datasets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# XGBoost\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_xgb_model,\n",
-    "    prediction_values=train_xgb_binary_predictions,\n",
-    "    prediction_probabilities=train_xgb_prob,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_xgb_model,\n",
-    "    prediction_values=test_xgb_binary_predictions,\n",
-    "    prediction_probabilities=test_xgb_prob,\n",
-    ")\n",
-    "\n",
-    "# Random Forest\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_rf_model,\n",
-    "    prediction_values=train_rf_binary_predictions,\n",
-    "    prediction_probabilities=train_rf_prob,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_rf_model,\n",
-    "    prediction_values=test_rf_binary_predictions,\n",
-    "    prediction_probabilities=test_rf_prob,\n",
-    ")\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_4__'></a>\n",
-    "\n",
-    "### Compute credit risk scores\n",
-    "\n",
-    "In this phase, we translate model predictions into actionable scores using probability estimates generated by our trained model."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_xgb_scores = lending_club.compute_scores(train_xgb_prob)\n",
-    "test_xgb_scores = lending_club.compute_scores(test_xgb_prob)\n",
-    "\n",
-    "# Assign scores to the datasets\n",
-    "vm_train_ds.add_extra_column(\"xgb_scores\", train_xgb_scores)\n",
-    "vm_test_ds.add_extra_column(\"xgb_scores\", test_xgb_scores)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_5__'></a>\n",
-    "\n",
-    "### Adding custom context to the LLM descriptions\n",
-    "\n",
-    "To enable the LLM descriptions context, you need to set the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED` environment variable to `1`. This will enable the LLM descriptions context, which will be used to provide additional context to the LLM descriptions. This is a global setting that will affect all tests."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import os\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\"\n",
-    "\n",
-    "context = \"\"\"\n",
-    "FORMAT FOR THE LLM DESCRIPTIONS: \n",
-    "    **<Test Name>** is designed to <begin with a concise overview of what the test does and its primary purpose, \n",
-    "    extracted from the test description>.\n",
-    "\n",
-    "    The test operates by <write a paragraph about the test mechanism, explaining how it works and what it measures. \n",
-    "    Include any relevant formulas or methodologies mentioned in the test description.>\n",
-    "\n",
-    "    The primary advantages of this test include <write a paragraph about the test's strengths and capabilities, \n",
-    "    highlighting what makes it particularly useful for specific scenarios.>\n",
-    "\n",
-    "    Users should be aware that <write a paragraph about the test's limitations and potential risks. \n",
-    "    Include both technical limitations and interpretation challenges. \n",
-    "    If the test description includes specific signs of high risk, incorporate these here.>\n",
-    "\n",
-    "    **Key Insights:**\n",
-    "\n",
-    "    The test results reveal:\n",
-    "\n",
-    "    - **<insight title>**: <comprehensive description of one aspect of the results>\n",
-    "    - **<insight title>**: <comprehensive description of another aspect>\n",
-    "    ...\n",
-    "\n",
-    "    Based on these results, <conclude with a brief paragraph that ties together the test results with the test's \n",
-    "    purpose and provides any final recommendations or considerations.>\n",
-    "\n",
-    "ADDITIONAL INSTRUCTIONS:\n",
-    "    Present insights in order from general to specific, with each insight as a single bullet point with bold title.\n",
-    "\n",
-    "    For each metric in the test results, include in the test overview:\n",
-    "    - The metric's purpose and what it measures\n",
-    "    - Its mathematical formula\n",
-    "    - The range of possible values\n",
-    "    - What constitutes good/bad performance\n",
-    "    - How to interpret different values\n",
-    "\n",
-    "    Each insight should progressively cover:\n",
-    "    1. Overall scope and distribution\n",
-    "    2. Complete breakdown of all elements with specific values\n",
-    "    3. Natural groupings and patterns\n",
-    "    4. Comparative analysis between datasets/categories\n",
-    "    5. Stability and variations\n",
-    "    6. Notable relationships or dependencies\n",
-    "\n",
-    "    Remember:\n",
-    "    - Keep all insights at the same level (no sub-bullets or nested structures)\n",
-    "    - Make each insight complete and self-contained\n",
-    "    - Include specific numerical values and ranges\n",
-    "    - Cover all elements in the results comprehensively\n",
-    "    - Maintain clear, concise language\n",
-    "    - Use only \"- **Title**: Description\" format for insights\n",
-    "    - Progress naturally from general to specific observations\n",
-    "\n",
-    "\"\"\".strip()\n",
-    "\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT\"] = context"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_6__'></a>\n",
-    "\n",
-    "### Run the full suite of tests\n",
-    "\n",
-    "This is where it all comes together: you are now ready to run the documentation tests for the model as defined by the documentation template you looked at earlier.\n",
-    "\n",
-    "The [`vm.run_documentation_tests`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests) function finds and runs every test specified in the template and then uploads all the documentation and test artifacts that get generated to the ValidMind Platform.\n",
-    "\n",
-    "The function requires information about the inputs to use on every test. These inputs can be passed as an `inputs` argument if we want to use the same inputs for all tests. It's also possible to pass a `config` argument that has information about the `params` and `inputs` that each test requires. The `config` parameter is a dictionary with the following structure:\n",
-    "\n",
-    "```python\n",
-    "config = {\n",
-    "    \"<test-id>\": {\n",
-    "        \"params\": {\n",
-    "            \"param1\": \"value1\",\n",
-    "            \"param2\": \"value2\",\n",
-    "            ...\n",
-    "        },\n",
-    "        \"inputs\": {\n",
-    "            \"input1\": \"value1\",\n",
-    "            \"input2\": \"value2\",\n",
-    "            ...\n",
-    "        }\n",
-    "    },\n",
-    "    ...\n",
-    "}\n",
-    "```\n",
-    "\n",
-    "Each `<test-id>` above corresponds to the test driven block identifiers shown by `vm.preview_template()`. For this model, we will use the default parameters for all tests, but we'll need to specify the input configuration for each one. The method `get_demo_test_config()` below constructs the default input configuration for our demo."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.utils import preview_test_config\n",
-    "\n",
-    "test_config = lending_club.get_demo_test_config(x_test, y_test)\n",
-    "preview_test_config(test_config)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now we can pass the input configuration to `vm.run_documentation_tests()` and run the full suite of tests. The variable `full_suite` then holds the result of these tests."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = vm.run_documentation_tests(config=test_config)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "3. Expand the following sections and take a look around:\n",
-    "\n",
-    "   - **2. Data Preparation**\n",
-    "   - **3. Model Development**\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation (hint: some of the tests in **2.3. Feature Selection and Engineering** look like they need some attention), view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-11ff9f7bf7724930b1bc81a5585f4a94",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "validmind-eEL8LtKG-py3.10",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Document an application scorecard model\n",
+        "\n",
+        "Build and document an *application scorecard model* with the ValidMind Library by using Kaggle's [Lending Club](https://www.kaggle.com/datasets/devanshi23/loan-data-2007-2014/data) sample dataset to build a simple application scorecard.\n",
+        "\n",
+        "An application scorecard model is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant — such as credit history, income, employment status, and other relevant financial data. \n",
+        "\n",
+        "- This score helps lenders make decisions about whether to approve or reject loan applications, as well as determine the terms of the loan, including interest rates and credit limits. \n",
+        "- Application scorecard models enable lenders to manage risk efficiently while making the loan application process faster and more transparent for applicants.\n",
+        "\n",
+        "This interactive notebook provides a step-by-step guide for loading a demo dataset, preprocessing the raw data, training a model for testing, setting up test inputs, initializing the required ValidMind objects, running the test, and then logging the results to ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_4__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "  - [Preprocess the dataset](#toc3_1__)    \n",
+        "  - [Feature engineering](#toc3_2__)    \n",
+        "- [Train the model](#toc4__)    \n",
+        "  - [Compute probabilities](#toc4_1__)    \n",
+        "  - [Compute binary predictions](#toc4_2__)    \n",
+        "- [Document the model](#toc5__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc5_1__)    \n",
+        "  - [Initialize ValidMind models](#toc5_2__)    \n",
+        "  - [Assign prediction values and probabilities to the datasets](#toc5_3__)    \n",
+        "  - [Compute credit risk scores](#toc5_4__)    \n",
+        "  - [Adding custom context to the LLM descriptions](#toc5_5__)    \n",
+        "  - [Run the full suite of tests](#toc5_6__)    \n",
+        "- [Next steps](#toc6__)    \n",
+        "  - [Work with your documentation](#toc6_1__)    \n",
+        "  - [Discover more learning resources](#toc6_2__)    \n",
+        "- [Upgrade ValidMind](#toc7__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "  # api_host = \"...\",\n",
+        "  # api_key = \"...\",\n",
+        "  # api_secret = \"...\",\n",
+        "  # model = \"...\",\n",
+        "  document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import xgboost as xgb\n",
+        "from sklearn.ensemble import RandomForestClassifier\n",
+        "\n",
+        "from validmind.datasets.credit_risk import lending_club\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind library. To be able to use it, you'll need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "df = lending_club.load_data(source=\"offline\")\n",
+        "\n",
+        "df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Preprocess the dataset\n",
+        "\n",
+        "In the preprocessing step we perform a number of operations to get ready for building our application scorecard. \n",
+        "\n",
+        "We use the `lending_club.preprocess()` function to simplify preprocessing. This function performs the following operations:\n",
+        "- Filters the dataset to include only loans for debt consolidation or credit card purposes\n",
+        "- Removes loans classified under the riskier grades \"F\" and \"G\"\n",
+        "- Excludes uncommon home ownership types and standardizes employment length and loan terms into numerical formats\n",
+        "- Discards unnecessary fields and any entries with missing information to maintain a clean and robust dataset for modeling"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "preprocess_df = lending_club.preprocess(df)\n",
+        "preprocess_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Feature engineering\n",
+        "\n",
+        "In the feature engineering phase, we apply specific transformations to optimize the dataset for predictive modeling in our application scorecard. \n",
+        "\n",
+        "Using the `lending_club.feature_engineering()` function, we conduct the following operations:\n",
+        "- **WoE encoding**: Converts both numerical and categorical features into Weight of Evidence (WoE) values. WoE is a statistical measure used in scorecard modeling that quantifies the relationship between a predictor variable and the binary target variable. It calculates the ratio of the distribution of good outcomes to the distribution of bad outcomes for each category or bin of a feature. This transformation helps to ensure that the features are predictive and consistent in their contribution to the model.\n",
+        "- **Integration of WoE bins**: Ensures that the WoE transformed values are integrated throughout the dataset, replacing the original feature values while excluding the target variable from this transformation. This transformation is used to maintain a consistent scale and impact of each variable within the model, which helps make the predictions more stable and accurate."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "fe_df = lending_club.feature_engineering(preprocess_df)\n",
+        "fe_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Train the model\n",
+        "\n",
+        "In this section, we focus on constructing and refining our predictive model. \n",
+        "- We begin by dividing our data, which is based on Weight of Evidence (WoE) features, into training and testing sets (`train_df`, `test_df`). \n",
+        "- With `lending_club.split`, we employ a simple random split, randomly allocating data points to each set to ensure a mix of examples in both."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Split the data\n",
+        "train_df, test_df = lending_club.split(fe_df, test_size=0.2)\n",
+        "\n",
+        "x_train = train_df.drop(lending_club.target_column, axis=1)\n",
+        "y_train = train_df[lending_club.target_column]\n",
+        "\n",
+        "x_test = test_df.drop(lending_club.target_column, axis=1)\n",
+        "y_test = test_df[lending_club.target_column]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Define the XGBoost model\n",
+        "xgb_model = xgb.XGBClassifier(\n",
+        "    n_estimators=50, \n",
+        "    random_state=42, \n",
+        "    early_stopping_rounds=10\n",
+        ")\n",
+        "xgb_model.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "\n",
+        "# Fit the model\n",
+        "xgb_model.fit(\n",
+        "    x_train, \n",
+        "    y_train,\n",
+        "    eval_set=[(x_test, y_test)],\n",
+        "    verbose=False\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Define the Random Forest model\n",
+        "rf_model = RandomForestClassifier(\n",
+        "    n_estimators=50, \n",
+        "    random_state=42,\n",
+        ")\n",
+        "\n",
+        "# Fit the model\n",
+        "rf_model.fit(x_train, y_train)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Compute probabilities"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_xgb_prob = xgb_model.predict_proba(x_train)[:, 1]\n",
+        "test_xgb_prob = xgb_model.predict_proba(x_test)[:, 1]\n",
+        "\n",
+        "train_rf_prob = rf_model.predict_proba(x_train)[:, 1]\n",
+        "test_rf_prob = rf_model.predict_proba(x_test)[:, 1]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Compute binary predictions"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "cut_off_threshold = 0.3\n",
+        "\n",
+        "train_xgb_binary_predictions = (train_xgb_prob > cut_off_threshold).astype(int)\n",
+        "test_xgb_binary_predictions = (test_xgb_prob > cut_off_threshold).astype(int)\n",
+        "\n",
+        "train_rf_binary_predictions = (train_rf_prob > cut_off_threshold).astype(int)\n",
+        "test_rf_binary_predictions = (test_rf_prob > cut_off_threshold).astype(int)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Document the model\n",
+        "\n",
+        "To document the model with the ValidMind Library, you'll need to:\n",
+        "1. Preprocess the raw dataset\n",
+        "2. Initialize some training and test datasets\n",
+        "3. Initialize a model object you can use for testing\n",
+        "4. Run the full suite of tests"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset`: The dataset that you want to provide as input to tests.\n",
+        "- `input_id`: A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- `target_column`: A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
+        "\n",
+        "With all datasets ready, you can now initialize the raw, preprocessed, feature-engineered, training and test datasets (`df`, `preprocess_df`, `fe_df`, `train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_preprocess_dataset = vm.init_dataset(\n",
+        "    dataset=preprocess_df,\n",
+        "    input_id=\"preprocess_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_fe_dataset = vm.init_dataset(\n",
+        "    dataset=fe_df,\n",
+        "    input_id=\"fe_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    input_id=\"test_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Initialize ValidMind models\n",
+        "\n",
+        "You'll also need to initialize ValidMind model objects (`vm_model`) that can be passed to other functions for analysis and tests on the data for our models.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model objects with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_xgb_model = vm.init_model(\n",
+        "    xgb_model,\n",
+        "    input_id=\"xgb_model\",\n",
+        ")\n",
+        "\n",
+        "vm_rf_model = vm.init_model(\n",
+        "    rf_model,\n",
+        "    input_id=\"rf_model\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_3__'></a>\n",
+        "\n",
+        "### Assign prediction values and probabilities to the datasets\n",
+        "\n",
+        "With our model now trained, we'll move on to assigning both the predictive probabilities coming directly from the model's predictions, and the binary prediction after applying the cutoff threshold described in the previous steps. \n",
+        "- These tasks are achieved through the use of the `assign_predictions()` method associated with the VM `dataset` object.\n",
+        "- This method links the model's class prediction values and probabilities to our VM train and test datasets."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# XGBoost\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_xgb_model,\n",
+        "    prediction_values=train_xgb_binary_predictions,\n",
+        "    prediction_probabilities=train_xgb_prob,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_xgb_model,\n",
+        "    prediction_values=test_xgb_binary_predictions,\n",
+        "    prediction_probabilities=test_xgb_prob,\n",
+        ")\n",
+        "\n",
+        "# Random Forest\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_rf_model,\n",
+        "    prediction_values=train_rf_binary_predictions,\n",
+        "    prediction_probabilities=train_rf_prob,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_rf_model,\n",
+        "    prediction_values=test_rf_binary_predictions,\n",
+        "    prediction_probabilities=test_rf_prob,\n",
+        ")\n"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_4__'></a>\n",
+        "\n",
+        "### Compute credit risk scores\n",
+        "\n",
+        "In this phase, we translate model predictions into actionable scores using probability estimates generated by our trained model."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_xgb_scores = lending_club.compute_scores(train_xgb_prob)\n",
+        "test_xgb_scores = lending_club.compute_scores(test_xgb_prob)\n",
+        "\n",
+        "# Assign scores to the datasets\n",
+        "vm_train_ds.add_extra_column(\"xgb_scores\", train_xgb_scores)\n",
+        "vm_test_ds.add_extra_column(\"xgb_scores\", test_xgb_scores)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_5__'></a>\n",
+        "\n",
+        "### Adding custom context to the LLM descriptions\n",
+        "\n",
+        "To enable the LLM descriptions context, set the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED` environment variable to `1`. Once enabled, the custom context you define is used to provide additional context to the LLM descriptions. This is a global setting that will affect all tests."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import os\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\"\n",
+        "\n",
+        "context = \"\"\"\n",
+        "FORMAT FOR THE LLM DESCRIPTIONS: \n",
+        "    **<Test Name>** is designed to <begin with a concise overview of what the test does and its primary purpose, \n",
+        "    extracted from the test description>.\n",
+        "\n",
+        "    The test operates by <write a paragraph about the test mechanism, explaining how it works and what it measures. \n",
+        "    Include any relevant formulas or methodologies mentioned in the test description.>\n",
+        "\n",
+        "    The primary advantages of this test include <write a paragraph about the test's strengths and capabilities, \n",
+        "    highlighting what makes it particularly useful for specific scenarios.>\n",
+        "\n",
+        "    Users should be aware that <write a paragraph about the test's limitations and potential risks. \n",
+        "    Include both technical limitations and interpretation challenges. \n",
+        "    If the test description includes specific signs of high risk, incorporate these here.>\n",
+        "\n",
+        "    **Key Insights:**\n",
+        "\n",
+        "    The test results reveal:\n",
+        "\n",
+        "    - **<insight title>**: <comprehensive description of one aspect of the results>\n",
+        "    - **<insight title>**: <comprehensive description of another aspect>\n",
+        "    ...\n",
+        "\n",
+        "    Based on these results, <conclude with a brief paragraph that ties together the test results with the test's \n",
+        "    purpose and provides any final recommendations or considerations.>\n",
+        "\n",
+        "ADDITIONAL INSTRUCTIONS:\n",
+        "    Present insights in order from general to specific, with each insight as a single bullet point with bold title.\n",
+        "\n",
+        "    For each metric in the test results, include in the test overview:\n",
+        "    - The metric's purpose and what it measures\n",
+        "    - Its mathematical formula\n",
+        "    - The range of possible values\n",
+        "    - What constitutes good/bad performance\n",
+        "    - How to interpret different values\n",
+        "\n",
+        "    Each insight should progressively cover:\n",
+        "    1. Overall scope and distribution\n",
+        "    2. Complete breakdown of all elements with specific values\n",
+        "    3. Natural groupings and patterns\n",
+        "    4. Comparative analysis between datasets/categories\n",
+        "    5. Stability and variations\n",
+        "    6. Notable relationships or dependencies\n",
+        "\n",
+        "    Remember:\n",
+        "    - Keep all insights at the same level (no sub-bullets or nested structures)\n",
+        "    - Make each insight complete and self-contained\n",
+        "    - Include specific numerical values and ranges\n",
+        "    - Cover all elements in the results comprehensively\n",
+        "    - Maintain clear, concise language\n",
+        "    - Use only \"- **Title**: Description\" format for insights\n",
+        "    - Progress naturally from general to specific observations\n",
+        "\n",
+        "\"\"\".strip()\n",
+        "\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT\"] = context"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_6__'></a>\n",
+        "\n",
+        "### Run the full suite of tests\n",
+        "\n",
+        "This is where it all comes together: you are now ready to run the documentation tests for the model as defined by the documentation template you looked at earlier.\n",
+        "\n",
+        "The [`vm.run_documentation_tests`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests) function finds and runs every test specified in the template and then uploads all the documentation and test artifacts that get generated to the ValidMind Platform.\n",
+        "\n",
+        "The function requires information about the inputs to use on every test. These inputs can be passed as an `inputs` argument if we want to use the same inputs for all tests. It's also possible to pass a `config` argument that has information about the `params` and `inputs` that each test requires. The `config` parameter is a dictionary with the following structure:\n",
+        "\n",
+        "```python\n",
+        "config = {\n",
+        "    \"<test-id>\": {\n",
+        "        \"params\": {\n",
+        "            \"param1\": \"value1\",\n",
+        "            \"param2\": \"value2\",\n",
+        "            ...\n",
+        "        },\n",
+        "        \"inputs\": {\n",
+        "            \"input1\": \"value1\",\n",
+        "            \"input2\": \"value2\",\n",
+        "            ...\n",
+        "        }\n",
+        "    },\n",
+        "    ...\n",
+        "}\n",
+        "```\n",
+        "\n",
+        "Each `<test-id>` above corresponds to one of the test-driven block identifiers shown by `vm.preview_template()`. For this model, we will use the default parameters for all tests, but we'll need to specify the input configuration for each one. The method `get_demo_test_config()` below constructs the default input configuration for our demo."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.utils import preview_test_config\n",
+        "\n",
+        "test_config = lending_club.get_demo_test_config(x_test, y_test)\n",
+        "preview_test_config(test_config)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now we can pass the input configuration to `vm.run_documentation_tests()` and run the full suite of tests. The variable `full_suite` then holds the result of these tests."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "full_suite = vm.run_documentation_tests(config=test_config)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "3. Expand the following sections and take a look around:\n",
+        "\n",
+        "   - **2. Data Preparation**\n",
+        "   - **3. Model Development**\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation (hint: some of the tests in **2.3. Feature Selection and Engineering** look like they need some attention), view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-a658e3f1bece47cabc255c03460e255f"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "validmind-eEL8LtKG-py3.10",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/use_cases/credit_risk/application_scorecard_with_bias.ipynb b/site/notebooks/use_cases/credit_risk/application_scorecard_with_bias.ipynb
index e58e831ffc..6f6d23928e 100644
--- a/site/notebooks/use_cases/credit_risk/application_scorecard_with_bias.ipynb
+++ b/site/notebooks/use_cases/credit_risk/application_scorecard_with_bias.ipynb
@@ -1,1550 +1,1567 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Document a credit risk model\n",
-    "\n",
-    "Build and document an *application scorecard model* with the ValidMind Library by using Kaggle's [Lending Club](https://www.kaggle.com/datasets/devanshi23/loan-data-2007-2014/data) sample dataset to build a simple application scorecard.\n",
-    "\n",
-    "An application scorecard model is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant — such as credit history, income, employment status, and other relevant financial data. \n",
-    "\n",
-    "- This score helps lenders make decisions about whether to approve or reject loan applications, as well as determine the terms of the loan, including interest rates and credit limits. \n",
-    "- Application scorecard models enable lenders to manage risk efficiently while making the loan application process faster and more transparent for applicants.\n",
-    "\n",
-    "This interactive notebook provides a step-by-step guide for loading a demo dataset, preprocessing the raw data, training a model for testing, setting up test inputs, initializing the required ValidMind objects, running the test, and then logging the results to ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_4__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "  - [Prepocess the dataset](#toc3_1__)    \n",
-    "- [Train the model](#toc4__)    \n",
-    "  - [Compute probabilities](#toc4_1__)    \n",
-    "  - [Compute binary predictions](#toc4_2__)    \n",
-    "- [Postprocess the dataset](#toc5__)    \n",
-    "- [Document the model](#toc6__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc6_1__)    \n",
-    "  - [Initialize a model object](#toc6_2__)    \n",
-    "  - [Assign predictions](#toc6_3__)    \n",
-    "  - [Run tests](#toc6_4__)    \n",
-    "    - [Data description](#toc6_4_1__)    \n",
-    "    - [Data quality](#toc6_4_2__)    \n",
-    "    - [Correlations](#toc6_4_3__)    \n",
-    "    - [Model training](#toc6_4_4__)    \n",
-    "    - [Model validation](#toc6_4_5__)    \n",
-    "    - [Model explainability](#toc6_4_6__)    \n",
-    "    - [Bias and fairness](#toc6_4_7__)    \n",
-    "- [Next steps](#toc7__)    \n",
-    "  - [Work with your model documentation](#toc7_1__)    \n",
-    "  - [Discover more learning resources](#toc7_2__)    \n",
-    "- [Upgrade ValidMind](#toc8__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "- **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "- **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "- **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "- **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: The [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip -q install aequitas fairlearn vl-convert-python"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "from sklearn.ensemble import RandomForestClassifier\n",
-    "from sklearn.preprocessing import OneHotEncoder, StandardScaler\n",
-    "from sklearn.pipeline import Pipeline\n",
-    "from sklearn.impute import SimpleImputer\n",
-    "from sklearn.compose import ColumnTransformer\n",
-    "from sklearn.compose import make_column_selector as selector\n",
-    "\n",
-    "from validmind.tests import run_test\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library. To be able to use it, you'll need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.credit_risk import lending_club_bias as demo_dataset\n",
-    "\n",
-    "df = demo_dataset.load_data()\n",
-    "\n",
-    "df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Prepocess the dataset\n",
-    "\n",
-    "In the preprocessing step we perform a number of operations to get ready for building our credit decision model. \n",
-    "\n",
-    "We will in this example, create new feature, fill missing values and encode categorical variables."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "preprocess_df = demo_dataset.preprocess(df)\n",
-    "preprocess_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Train the model\n",
-    "\n",
-    "In this section, we focus on constructing and refining our predictive model. \n",
-    "- We begin by dividing our data into training and testing sets (`train_df`, `test_df`). \n",
-    "- We employ a simple random split, randomly allocating data points to each set to ensure a mix of examples in both."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Split the data into training and testing sets\n",
-    "train_df, test_df = demo_dataset.split(preprocess_df)\n",
-    "\n",
-    "X_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_train = train_df[demo_dataset.target_column]\n",
-    "X_test = test_df.drop(demo_dataset.target_column, axis=1)\n",
-    "y_test = test_df[demo_dataset.target_column]"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Train a Random Forest Classifier\n",
-    "model = RandomForestClassifier(n_estimators=50, random_state=42)\n",
-    "model.fit(X_train, y_train)\n",
-    "\n",
-    "# Print feature importances\n",
-    "feature_importances = pd.DataFrame({\n",
-    "    'feature': X_train.columns,\n",
-    "    'importance': model.feature_importances_\n",
-    "}).sort_values('importance', ascending=False)\n",
-    "\n",
-    "print(\"Feature Importances:\")\n",
-    "print(feature_importances)\n",
-    "\n",
-    "# Print model parameters\n",
-    "print(\"\\nModel Parameters:\")\n",
-    "print(model.get_params())\n",
-    "\n",
-    "# Print basic model information\n",
-    "print(f\"\\nNumber of trees: {model.n_estimators}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Compute probabilities"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_probabilities = model.predict_proba(X_train)[:,1]\n",
-    "test_probabilities = model.predict_proba(X_test)[:,1]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Compute binary predictions"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "cut_off_threshold = 0.5\n",
-    "train_binary_predictions = (train_probabilities > cut_off_threshold).astype(int)\n",
-    "test_binary_predictions = (test_probabilities > cut_off_threshold).astype(int)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Postprocess the dataset"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Save the original labels for the protected classes for visualizations and investigation of biased outcomes\n",
-    "protected_classes_df = df[demo_dataset.protected_classes]\n",
-    "\n",
-    "train_df = train_df.merge(\n",
-    "    protected_classes_df,\n",
-    "    left_index=True,\n",
-    "    right_index=True,\n",
-    ")\n",
-    "\n",
-    "test_df = test_df.merge(\n",
-    "    protected_classes_df,\n",
-    "    left_index=True,\n",
-    "    right_index=True,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Document the model\n",
-    "\n",
-    "To document the model with the ValidMind Library, you'll need to:\n",
-    "1. Preprocess the raw dataset\n",
-    "2. Initialize some training and test datasets\n",
-    "3. Initialize a model object you can use for testing\n",
-    "4. Run the full suite of tests"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset`: The dataset that you want to provide as input to tests.\n",
-    "- `input_id`: A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- `target_column`: A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
-    "\n",
-    "With all datasets ready, you can now initialize the raw, training and test datasets created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Extract feature columns\n",
-    "feature_columns = train_df.drop(\n",
-    "    columns=[demo_dataset.target_column] + demo_dataset.protected_classes\n",
-    ").columns.tolist()\n",
-    "feature_columns"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_ds= vm.init_dataset(\n",
-    "    dataset=df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    feature_columns=feature_columns\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    input_id=\"test_dataset\",\n",
-    "    target_column=demo_dataset.target_column,\n",
-    "    feature_columns=feature_columns\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Initialize a model object\n",
-    "\n",
-    "You will also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data. You simply intialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_model = vm.init_model(\n",
-    "    model,\n",
-    "    input_id=\"random_forest_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3__'></a>\n",
-    "\n",
-    "### Assign predictions\n",
-    "\n",
-    "With our model now trained, we'll move on to assigning both the predictive probabilities coming directly from the model's predictions, and the binary prediction after applying the cutoff threshold described in the previous steps. \n",
-    "- These tasks are achieved through the use of the `assign_predictions()` method associated with the VM `dataset` object.\n",
-    "- This method links the model's class prediction values and probabilities to our VM train and test datasets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    "    prediction_values=train_binary_predictions,\n",
-    "    prediction_probabilities=train_probabilities,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    "    prediction_values=test_binary_predictions,\n",
-    "    prediction_probabilities=test_probabilities,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4__'></a>\n",
-    "\n",
-    "### Run tests"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4_1__'></a>\n",
-    "\n",
-    "#### Data description"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.DatasetDescription\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.DescriptiveStatistics\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.TabularNumericalHistograms\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\"\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.TargetRateBarPlots\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\"\n",
-    "    },\n",
-    "    params={\n",
-    "        \"default_column\": demo_dataset.target_column,\n",
-    "        \"columns\": None,\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4_2__'></a>\n",
-    "\n",
-    "#### Data quality"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.ClassImbalance\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percent_threshold\": 10\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.Duplicates\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_threshold\": 1\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.HighCardinality\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"num_threshold\": 100,\n",
-    "        \"percent_threshold\": 0.1,\n",
-    "        \"threshold_type\": \"percent\"\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.MissingValues\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percentage_threshold\": 1,\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.Skewness\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"max_threshold\": 1,\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.UniqueRows\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percent_threshold\": 1,\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.TooManyZeroValues\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"max_percent_threshold\": 0.03,\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.IQROutliersTable\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"threshold\": 1.5,\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.IQROutliersBarPlot\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"threshold\": 1.5,\n",
-    "        \"fig_width\": 800,\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4_3__'></a>\n",
-    "\n",
-    "#### Correlations"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.PearsonCorrelationMatrix\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"raw_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"max_threshold\": 0.3\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4_4__'></a>\n",
-    "\n",
-    "#### Model training"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.ModelMetadata\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.DatasetSplit\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4_5__'></a>\n",
-    "\n",
-    "#### Model validation"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.PopulationStabilityIndex\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"num_bins\": 10,\n",
-    "        \"mode\": \"fixed\"\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:in_sample\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"dataset\": \"train_dataset\",\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:out_of_sample\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.PrecisionRecallCurve\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.TrainingTestDegradation\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"metrics\": [\"accuracy\", \"precision\", \"recall\", \"f1\"],\n",
-    "        \"max_threshold\": 0.1\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_threshold\": 0.7\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_threshold\": 0.7\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumROCAUCScore\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_threshold\": 0.5\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.statsmodels.GINITable\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_model],\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.statsmodels.PredictionProbabilitiesHistogram\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_model],\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.statsmodels.CumulativePredictionProbabilities\",\n",
-    "    input_grid={\n",
-    "        \"model\": [vm_model],\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4_6__'></a>\n",
-    "\n",
-    "#### Model explainability"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.PermutationFeatureImportance\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"fontsize\": None,\n",
-    "        \"figure_height\": 1000\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "\"validmind.model_validation.sklearn.SHAPGlobalImportance\",\n",
-    "inputs={\n",
-    "    \"model\": \"random_forest_model\",\n",
-    "    \"dataset\": \"train_dataset\",\n",
-    "    },\n",
-    "    params={\n",
-    "        \"kernel_explainer_samples\": 10,\n",
-    "        \"tree_or_linear_explainer_samples\": 200\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.WeakspotsDiagnosis\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"features_columns\": None,\n",
-    "        \"thresholds\": {\n",
-    "            \"accuracy\": 0.75,\n",
-    "            \"precision\": 0.5,\n",
-    "            \"recall\": 0.5,\n",
-    "            \"f1\": 0.7\n",
-    "        }\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.OverfitDiagnosis\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"metric\": None,\n",
-    "        \"cut_off_threshold\": 0.04\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.RobustnessDiagnosis\",\n",
-    "    inputs={\n",
-    "        \"model\": \"random_forest_model\",\n",
-    "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"metric\": None,\n",
-    "        \"scaling_factor_std_dev_list\": [0.1, 0.2, 0.3, 0.4, 0.5],\n",
-    "        \"performance_decay_threshold\": 0.05\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4_7__'></a>\n",
-    "\n",
-    "#### Bias and fairness"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = run_test(\n",
-    "    \"validmind.data_validation.ProtectedClassesDescription\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"test_dataset\"\n",
-    "    },\n",
-    "    params={\n",
-    "        'protected_classes': demo_dataset.protected_classes\n",
-    "    })\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now we are going to focus our analysis on the fairness metric(s) of interest in this case study: FNR/FPR across different groups. The `aequitas` plot module exposes the `disparities_metrics()` plot, which displays both the disparities and the group-wise metric results side by side."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = run_test(\n",
-    "    \"validmind.data_validation.ProtectedClassesDisparity\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "        \"model\": \"random_forest_model\"\n",
-    "    },\n",
-    "    params={\n",
-    "        \"protected_classes\": demo_dataset.protected_classes,\n",
-    "        \"disparity_tolerance\": 1.25,\n",
-    "        \"metrics\": [\"fnr\", \"fpr\", \"tpr\"]\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.ProtectedClassesCombination\",\n",
-    "    inputs={\n",
-    "        \"dataset\": \"test_dataset\",\n",
-    "        \"model\": \"random_forest_model\"\n",
-    "    },\n",
-    "    params={\n",
-    "        \"protected_classes\": demo_dataset.protected_classes\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "The following code defines a preprocessing `Pipeline` that handles both numeric and categorical features. Numeric data is imputed and scaled, while categorical data is imputed with the most frequent value and one-hot encoded. The pipelines are then combined using a `ColumnTransformer` and integrated with a classifier."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Define a pipeline for numeric features\n",
-    "numeric_transformer = Pipeline(\n",
-    "    steps=[\n",
-    "        (\"impute\", SimpleImputer()),  # Impute missing values\n",
-    "        (\"scaler\", StandardScaler()),  # Scale numeric features\n",
-    "    ]\n",
-    ")\n",
-    "\n",
-    "# Define a pipeline for categorical features\n",
-    "categorical_transformer = Pipeline(\n",
-    "    [\n",
-    "        (\"impute\", SimpleImputer(strategy=\"most_frequent\")),  # Impute missing values with most frequent\n",
-    "        (\"ohe\", OneHotEncoder(handle_unknown=\"ignore\")),  # One-hot encode categorical features\n",
-    "    ]\n",
-    ")\n",
-    "\n",
-    "# Combine numeric and categorical pipelines\n",
-    "preprocessor = ColumnTransformer(\n",
-    "    transformers=[\n",
-    "        (\"num\", numeric_transformer, selector(dtype_exclude=\"category\")),  # Apply numeric transformer to non-categorical columns\n",
-    "        (\"cat\", categorical_transformer, selector(dtype_include=\"category\")),  # Apply categorical transformer to categorical columns\n",
-    "    ]\n",
-    ")\n",
-    "\n",
-    "# Create the full pipeline including preprocessing and classification\n",
-    "pipeline = Pipeline(\n",
-    "    steps=[\n",
-    "        (\"preprocessor\", preprocessor),  # Apply the preprocessor\n",
-    "        (\n",
-    "            \"classifier\",\n",
-    "            model,  # Use the previously defined model for classification\n",
-    "        ),\n",
-    "    ]\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "sensitive_features = ['Gender_encoded','Race_encoded','Marital_Status_encoded']\n",
-    "\n",
-    "run_test(\n",
-    "    \"validmind.data_validation.ProtectedClassesThresholdOptimizer\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_ds\n",
-    "    },\n",
-    "    params={\n",
-    "        \"pipeline\":pipeline,\n",
-    "        \"protected_classes\": sensitive_features,\n",
-    "        \"X_train\":X_train,\n",
-    "        \"y_train\":y_train,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "3. Expand the following sections and take a look around:\n",
-    "\n",
-    "   - **2. Data Preparation**\n",
-    "   - **3. Model Development**\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation (hint: some of the tests in **2.3. Feature Selection and Engineering** look like they need some attention), view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc7_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-f527b18ca3b94779bf6194547accab31",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "validmind-eEL8LtKG-py3.10",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.8.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Document a credit risk model\n",
+        "\n",
+        "Build and document an *application scorecard model* with the ValidMind Library by using Kaggle's [Lending Club](https://www.kaggle.com/datasets/devanshi23/loan-data-2007-2014/data) sample dataset to build a simple application scorecard.\n",
+        "\n",
+        "An application scorecard model is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant — such as credit history, income, employment status, and other relevant financial data. \n",
+        "\n",
+        "- This score helps lenders make decisions about whether to approve or reject loan applications, as well as determine the terms of the loan, including interest rates and credit limits. \n",
+        "- Application scorecard models enable lenders to manage risk efficiently while making the loan application process faster and more transparent for applicants.\n",
+        "\n",
+        "This interactive notebook provides a step-by-step guide for loading a demo dataset, preprocessing the raw data, training a model for testing, setting up test inputs, initializing the required ValidMind objects, running the test, and then logging the results to ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_4__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "  - [Preprocess the dataset](#toc3_1__)    \n",
+        "- [Train the model](#toc4__)    \n",
+        "  - [Compute probabilities](#toc4_1__)    \n",
+        "  - [Compute binary predictions](#toc4_2__)    \n",
+        "- [Postprocess the dataset](#toc5__)    \n",
+        "- [Document the model](#toc6__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc6_1__)    \n",
+        "  - [Initialize the ValidMind model](#toc6_2__)    \n",
+        "  - [Assign predictions](#toc6_3__)    \n",
+        "  - [Run tests](#toc6_4__)    \n",
+        "    - [Data description](#toc6_4_1__)    \n",
+        "    - [Data quality](#toc6_4_2__)    \n",
+        "    - [Correlations](#toc6_4_3__)    \n",
+        "    - [Model training](#toc6_4_4__)    \n",
+        "    - [Model validation](#toc6_4_5__)    \n",
+        "    - [Model explainability](#toc6_4_6__)    \n",
+        "    - [Bias and fairness](#toc6_4_7__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Work with your documentation](#toc7_1__)    \n",
+        "  - [Discover more learning resources](#toc7_2__)    \n",
+        "- [Upgrade ValidMind](#toc8__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip -q install aequitas fairlearn vl-convert-python"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "from sklearn.ensemble import RandomForestClassifier\n",
+        "from sklearn.preprocessing import OneHotEncoder, StandardScaler\n",
+        "from sklearn.pipeline import Pipeline\n",
+        "from sklearn.impute import SimpleImputer\n",
+        "from sklearn.compose import ColumnTransformer\n",
+        "from sklearn.compose import make_column_selector as selector\n",
+        "\n",
+        "from validmind.tests import run_test\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind Library. To be able to use it, you'll need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.datasets.credit_risk import lending_club_bias as demo_dataset\n",
+        "\n",
+        "df = demo_dataset.load_data()\n",
+        "\n",
+        "df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Preprocess the dataset\n",
+        "\n",
+        "In the preprocessing step we perform a number of operations to get ready for building our credit decision model. \n",
+        "\n",
+        "In this example, we will create new features, fill missing values, and encode categorical variables."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "preprocess_df = demo_dataset.preprocess(df)\n",
+        "preprocess_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Train the model\n",
+        "\n",
+        "In this section, we focus on constructing and refining our predictive model. \n",
+        "- We begin by dividing our data into training and testing sets (`train_df`, `test_df`). \n",
+        "- We employ a simple random split, randomly allocating data points to each set to ensure a mix of examples in both."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Split the data into training and testing sets\n",
+        "train_df, test_df = demo_dataset.split(preprocess_df)\n",
+        "\n",
+        "X_train = train_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_train = train_df[demo_dataset.target_column]\n",
+        "X_test = test_df.drop(demo_dataset.target_column, axis=1)\n",
+        "y_test = test_df[demo_dataset.target_column]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Train a Random Forest Classifier\n",
+        "model = RandomForestClassifier(n_estimators=50, random_state=42)\n",
+        "model.fit(X_train, y_train)\n",
+        "\n",
+        "# Print feature importances\n",
+        "feature_importances = pd.DataFrame({\n",
+        "    'feature': X_train.columns,\n",
+        "    'importance': model.feature_importances_\n",
+        "}).sort_values('importance', ascending=False)\n",
+        "\n",
+        "print(\"Feature Importances:\")\n",
+        "print(feature_importances)\n",
+        "\n",
+        "# Print model parameters\n",
+        "print(\"\\nModel Parameters:\")\n",
+        "print(model.get_params())\n",
+        "\n",
+        "# Print basic model information\n",
+        "print(f\"\\nNumber of trees: {model.n_estimators}\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Compute probabilities"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_probabilities = model.predict_proba(X_train)[:,1]\n",
+        "test_probabilities = model.predict_proba(X_test)[:,1]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Compute binary predictions"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "cut_off_threshold = 0.5\n",
+        "train_binary_predictions = (train_probabilities > cut_off_threshold).astype(int)\n",
+        "test_binary_predictions = (test_probabilities > cut_off_threshold).astype(int)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Postprocess the dataset"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Save the original labels for the protected classes for visualizations and investigation of biased outcomes\n",
+        "protected_classes_df = df[demo_dataset.protected_classes]\n",
+        "\n",
+        "train_df = train_df.merge(\n",
+        "    protected_classes_df,\n",
+        "    left_index=True,\n",
+        "    right_index=True,\n",
+        ")\n",
+        "\n",
+        "test_df = test_df.merge(\n",
+        "    protected_classes_df,\n",
+        "    left_index=True,\n",
+        "    right_index=True,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Document the model\n",
+        "\n",
+        "To document the model with the ValidMind Library, you'll need to:\n",
+        "1. Preprocess the raw dataset\n",
+        "2. Initialize some training and test datasets\n",
+        "3. Initialize a ValidMind model object for use with testing\n",
+        "4. Run the full suite of tests"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset`: The dataset that you want to provide as input to tests.\n",
+        "- `input_id`: A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- `target_column`: A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
+        "\n",
+        "With all datasets ready, you can now initialize the raw, training and test datasets created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Extract feature columns\n",
+        "feature_columns = train_df.drop(\n",
+        "    columns=[demo_dataset.target_column] + demo_dataset.protected_classes\n",
+        ").columns.tolist()\n",
+        "feature_columns"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_ds= vm.init_dataset(\n",
+        "    dataset=df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    feature_columns=feature_columns\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    input_id=\"test_dataset\",\n",
+        "    target_column=demo_dataset.target_column,\n",
+        "    feature_columns=feature_columns\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind model\n",
+        "\n",
+        "You will also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_model = vm.init_model(\n",
+        "    model,\n",
+        "    input_id=\"random_forest_model\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_3__'></a>\n",
+        "\n",
+        "### Assign predictions\n",
+        "\n",
+        "With our model now trained, we'll move on to assigning both the predicted probabilities produced directly by the model and the binary predictions obtained by applying the cutoff threshold described in the previous steps. \n",
+        "- These tasks are achieved through the use of the `assign_predictions()` method associated with the VM `dataset` object.\n",
+        "- This method links the model's class prediction values and probabilities to our VM train and test datasets."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        "    prediction_values=train_binary_predictions,\n",
+        "    prediction_probabilities=train_probabilities,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        "    prediction_values=test_binary_predictions,\n",
+        "    prediction_probabilities=test_probabilities,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4__'></a>\n",
+        "\n",
+        "### Run tests"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4_1__'></a>\n",
+        "\n",
+        "#### Data description"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.DatasetDescription\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.DescriptiveStatistics\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.TabularNumericalHistograms\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\"\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.TargetRateBarPlots\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\"\n",
+        "    },\n",
+        "    params={\n",
+        "        \"default_column\": demo_dataset.target_column,\n",
+        "        \"columns\": None,\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4_2__'></a>\n",
+        "\n",
+        "#### Data quality"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.ClassImbalance\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percent_threshold\": 10\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.Duplicates\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_threshold\": 1\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.HighCardinality\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"num_threshold\": 100,\n",
+        "        \"percent_threshold\": 0.1,\n",
+        "        \"threshold_type\": \"percent\"\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.MissingValues\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percentage_threshold\": 1,\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.Skewness\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"max_threshold\": 1,\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.UniqueRows\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percent_threshold\": 1,\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.TooManyZeroValues\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"max_percent_threshold\": 0.03,\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.IQROutliersTable\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"threshold\": 1.5,\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.IQROutliersBarPlot\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"threshold\": 1.5,\n",
+        "        \"fig_width\": 800,\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4_3__'></a>\n",
+        "\n",
+        "#### Correlations"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.PearsonCorrelationMatrix\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"raw_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"max_threshold\": 0.3\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4_4__'></a>\n",
+        "\n",
+        "#### Model training"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.ModelMetadata\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.DatasetSplit\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4_5__'></a>\n",
+        "\n",
+        "#### Model validation"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.PopulationStabilityIndex\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"num_bins\": 10,\n",
+        "        \"mode\": \"fixed\"\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:in_sample\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"dataset\": \"train_dataset\",\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:out_of_sample\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.PrecisionRecallCurve\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.TrainingTestDegradation\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"metrics\": [\"accuracy\", \"precision\", \"recall\", \"f1\"],\n",
+        "        \"max_threshold\": 0.1\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_threshold\": 0.7\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_threshold\": 0.7\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumROCAUCScore\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_threshold\": 0.5\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.statsmodels.GINITable\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_model],\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.statsmodels.PredictionProbabilitiesHistogram\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_model],\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.statsmodels.CumulativePredictionProbabilities\",\n",
+        "    input_grid={\n",
+        "        \"model\": [vm_model],\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4_6__'></a>\n",
+        "\n",
+        "#### Model explainability"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.PermutationFeatureImportance\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"fontsize\": None,\n",
+        "        \"figure_height\": 1000\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "\"validmind.model_validation.sklearn.SHAPGlobalImportance\",\n",
+        "inputs={\n",
+        "    \"model\": \"random_forest_model\",\n",
+        "    \"dataset\": \"train_dataset\",\n",
+        "    },\n",
+        "    params={\n",
+        "        \"kernel_explainer_samples\": 10,\n",
+        "        \"tree_or_linear_explainer_samples\": 200\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.WeakspotsDiagnosis\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"features_columns\": None,\n",
+        "        \"thresholds\": {\n",
+        "            \"accuracy\": 0.75,\n",
+        "            \"precision\": 0.5,\n",
+        "            \"recall\": 0.5,\n",
+        "            \"f1\": 0.7\n",
+        "        }\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.OverfitDiagnosis\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"metric\": None,\n",
+        "        \"cut_off_threshold\": 0.04\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.RobustnessDiagnosis\",\n",
+        "    inputs={\n",
+        "        \"model\": \"random_forest_model\",\n",
+        "        \"datasets\": [\"train_dataset\", \"test_dataset\"],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"metric\": None,\n",
+        "        \"scaling_factor_std_dev_list\": [0.1, 0.2, 0.3, 0.4, 0.5],\n",
+        "        \"performance_decay_threshold\": 0.05\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4_7__'></a>\n",
+        "\n",
+        "#### Bias and fairness"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = run_test(\n",
+        "    \"validmind.data_validation.ProtectedClassesDescription\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"test_dataset\"\n",
+        "    },\n",
+        "    params={\n",
+        "        'protected_classes': demo_dataset.protected_classes\n",
+        "    })\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now we are going to focus our analysis on the fairness metric(s) of interest in this case study: FNR/FPR across different groups. The `aequitas` plot module exposes the `disparities_metrics()` plot, which displays both the disparities and the group-wise metric results side by side."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = run_test(\n",
+        "    \"validmind.data_validation.ProtectedClassesDisparity\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "        \"model\": \"random_forest_model\"\n",
+        "    },\n",
+        "    params={\n",
+        "        \"protected_classes\": demo_dataset.protected_classes,\n",
+        "        \"disparity_tolerance\": 1.25,\n",
+        "        \"metrics\": [\"fnr\", \"fpr\", \"tpr\"]\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.ProtectedClassesCombination\",\n",
+        "    inputs={\n",
+        "        \"dataset\": \"test_dataset\",\n",
+        "        \"model\": \"random_forest_model\"\n",
+        "    },\n",
+        "    params={\n",
+        "        \"protected_classes\": demo_dataset.protected_classes\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "The following code defines a preprocessing `Pipeline` that handles both numeric and categorical features. Numeric data is imputed and scaled, while categorical data is imputed with the most frequent value and one-hot encoded. The pipelines are then combined using a `ColumnTransformer` and integrated with a classifier."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Define a pipeline for numeric features\n",
+        "numeric_transformer = Pipeline(\n",
+        "    steps=[\n",
+        "        (\"impute\", SimpleImputer()),  # Impute missing values\n",
+        "        (\"scaler\", StandardScaler()),  # Scale numeric features\n",
+        "    ]\n",
+        ")\n",
+        "\n",
+        "# Define a pipeline for categorical features\n",
+        "categorical_transformer = Pipeline(\n",
+        "    [\n",
+        "        (\"impute\", SimpleImputer(strategy=\"most_frequent\")),  # Impute missing values with most frequent\n",
+        "        (\"ohe\", OneHotEncoder(handle_unknown=\"ignore\")),  # One-hot encode categorical features\n",
+        "    ]\n",
+        ")\n",
+        "\n",
+        "# Combine numeric and categorical pipelines\n",
+        "preprocessor = ColumnTransformer(\n",
+        "    transformers=[\n",
+        "        (\"num\", numeric_transformer, selector(dtype_exclude=\"category\")),  # Apply numeric transformer to non-categorical columns\n",
+        "        (\"cat\", categorical_transformer, selector(dtype_include=\"category\")),  # Apply categorical transformer to categorical columns\n",
+        "    ]\n",
+        ")\n",
+        "\n",
+        "# Create the full pipeline including preprocessing and classification\n",
+        "pipeline = Pipeline(\n",
+        "    steps=[\n",
+        "        (\"preprocessor\", preprocessor),  # Apply the preprocessor\n",
+        "        (\n",
+        "            \"classifier\",\n",
+        "            model,  # Use the previously defined model for classification\n",
+        "        ),\n",
+        "    ]\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "sensitive_features = ['Gender_encoded','Race_encoded','Marital_Status_encoded']\n",
+        "\n",
+        "run_test(\n",
+        "    \"validmind.data_validation.ProtectedClassesThresholdOptimizer\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_ds\n",
+        "    },\n",
+        "    params={\n",
+        "        \"pipeline\":pipeline,\n",
+        "        \"protected_classes\": sensitive_features,\n",
+        "        \"X_train\":X_train,\n",
+        "        \"y_train\":y_train,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (**Learn more:** [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "3. Expand the following sections and take a look around:\n",
+        "\n",
+        "   - **2. Data Preparation**\n",
+        "   - **3. Model Development**\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation (hint: some of the tests in **2.3. Feature Selection and Engineering** look like they need some attention), view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc7_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-6a74bc76beda4633a0cfff2eaa20949e"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "validmind-eEL8LtKG-py3.10",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.8.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/use_cases/credit_risk/application_scorecard_with_ml.ipynb b/site/notebooks/use_cases/credit_risk/application_scorecard_with_ml.ipynb
index dd04e2b6a2..a735cbf5b1 100644
--- a/site/notebooks/use_cases/credit_risk/application_scorecard_with_ml.ipynb
+++ b/site/notebooks/use_cases/credit_risk/application_scorecard_with_ml.ipynb
@@ -1,2000 +1,2017 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Document an application scorecard model\n",
-    "\n",
-    "Build and document an *application scorecard model* with the ValidMind Library by using Kaggle's [Lending Club](https://www.kaggle.com/datasets/devanshi23/loan-data-2007-2014/data) sample dataset to build a simple application scorecard.\n",
-    "\n",
-    "An application scorecard model is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant — such as credit history, income, employment status, and other relevant financial data. \n",
-    "\n",
-    "- This score helps lenders make decisions about whether to approve or reject loan applications, as well as determine the terms of the loan, including interest rates and credit limits. \n",
-    "- Application scorecard models enable lenders to manage risk efficiently while making the loan application process faster and more transparent for applicants.\n",
-    "\n",
-    "This interactive notebook provides a step-by-step guide for loading a demo dataset, preprocessing the raw data, training a model for testing, setting up test inputs, initializing the required ValidMind objects, running the test, and then logging the results to ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_4__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "  - [Prepocess the dataset](#toc3_1__)    \n",
-    "  - [Feature engineering](#toc3_2__)    \n",
-    "- [Train the model](#toc4__)    \n",
-    "  - [Compute probabilities](#toc4_1__)    \n",
-    "  - [Compute binary predictions](#toc4_2__)    \n",
-    "- [Document the model](#toc5__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc5_1__)    \n",
-    "  - [Initialize a model object](#toc5_2__)    \n",
-    "  - [Assign prediction values and probabilities to the datasets](#toc5_3__)    \n",
-    "  - [Compute credit risk scores](#toc5_4__)    \n",
-    "  - [Adding custom context to the LLM descriptions](#toc5_5__)    \n",
-    "  - [Raw data](#toc5_6__)    \n",
-    "  - [Pre-processed data](#toc5_7__)    \n",
-    "  - [Development data](#toc5_8__)    \n",
-    "  - [Feature selection](#toc5_9__)    \n",
-    "  - [Model training](#toc5_10__)    \n",
-    "  - [Model selection](#toc5_11__)    \n",
-    "  - [Class discrimination](#toc5_12__)    \n",
-    "  - [Classification accuracy](#toc5_13__)    \n",
-    "  - [Model diagnosis](#toc5_14__)    \n",
-    "  - [Model explainability](#toc5_15__)    \n",
-    "  - [Scoring evaluation](#toc5_16__)    \n",
-    "- [Custom tests](#toc6__)    \n",
-    "  - [In-line custom tests](#toc6_1__)    \n",
-    "  - [Local test provider](#toc6_2__)    \n",
-    "- [Next steps](#toc7__)    \n",
-    "  - [Work with your model documentation](#toc7_1__)    \n",
-    "  - [Discover more learning resources](#toc7_2__)    \n",
-    "- [Upgrade ValidMind](#toc8__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "- **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "- **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "- **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "- **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: The [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "  # api_host = \"...\",\n",
-    "  # api_key = \"...\",\n",
-    "  # api_secret = \"...\",\n",
-    "  # model = \"...\",\n",
-    "  document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost as xgb\n",
-    "from sklearn.ensemble import RandomForestClassifier\n",
-    "\n",
-    "from validmind.tests import run_test\n",
-    "from validmind.datasets.credit_risk import lending_club\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library. To be able to use it, you'll need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "df = lending_club.load_data(source=\"offline\")\n",
-    "\n",
-    "df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Preprocess the dataset\n",
-    "\n",
-    "In the preprocessing step we perform a number of operations to get ready for building our application scorecard. \n",
-    "\n",
-    "We use the `lending_club.preprocess()` function to simplify preprocessing. This function performs the following operations: \n",
-    "- Filters the dataset to include only loans for debt consolidation or credit card purposes\n",
-    "- Removes loans classified under the riskier grades \"F\" and \"G\"\n",
-    "- Excludes uncommon home ownership types and standardizes employment length and loan terms into numerical formats\n",
-    "- Discards unnecessary fields and any entries with missing information to maintain a clean and robust dataset for modeling"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "preprocess_df = lending_club.preprocess(df)\n",
-    "preprocess_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Feature engineering\n",
-    "\n",
-    "In the feature engineering phase, we apply specific transformations to optimize the dataset for predictive modeling in our application scorecard. \n",
-    "\n",
-    "Using the `lending_club.feature_engineering()` function, we conduct the following operations:\n",
-    "- **WoE encoding**: Converts both numerical and categorical features into Weight of Evidence (WoE) values. WoE is a statistical measure used in scorecard modeling that quantifies the relationship between a predictor variable and the binary target variable. It calculates the ratio of the distribution of good outcomes to the distribution of bad outcomes for each category or bin of a feature. This transformation helps to ensure that the features are predictive and consistent in their contribution to the model.\n",
-    "- **Integration of WoE bins**: Ensures that the WoE transformed values are integrated throughout the dataset, replacing the original feature values while excluding the target variable from this transformation. This transformation is used to maintain a consistent scale and impact of each variable within the model, which helps make the predictions more stable and accurate."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "fe_df = lending_club.feature_engineering(preprocess_df)\n",
-    "fe_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Train the model\n",
-    "\n",
-    "In this section, we focus on constructing and refining our predictive model. \n",
-    "- We begin by dividing our data, which is based on Weight of Evidence (WoE) features, into training and testing sets (`train_df`, `test_df`). \n",
-    "- With `lending_club.split`, we employ a simple random split, randomly allocating data points to each set to ensure a mix of examples in both."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Split the data\n",
-    "train_df, test_df = lending_club.split(fe_df, test_size=0.2)\n",
-    "\n",
-    "x_train = train_df.drop(lending_club.target_column, axis=1)\n",
-    "y_train = train_df[lending_club.target_column]\n",
-    "\n",
-    "x_test = test_df.drop(lending_club.target_column, axis=1)\n",
-    "y_test = test_df[lending_club.target_column]"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Define the XGBoost model\n",
-    "xgb_model = xgb.XGBClassifier(\n",
-    "    n_estimators=50, \n",
-    "    random_state=42, \n",
-    "    early_stopping_rounds=10\n",
-    ")\n",
-    "xgb_model.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "\n",
-    "# Fit the model\n",
-    "xgb_model.fit(\n",
-    "    x_train, \n",
-    "    y_train,\n",
-    "    eval_set=[(x_test, y_test)],\n",
-    "    verbose=False\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Define the Random Forest model\n",
-    "rf_model = RandomForestClassifier(\n",
-    "    n_estimators=50, \n",
-    "    random_state=42,\n",
-    ")\n",
-    "\n",
-    "# Fit the model\n",
-    "rf_model.fit(x_train, y_train)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Compute probabilities"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_xgb_prob = xgb_model.predict_proba(x_train)[:, 1]\n",
-    "test_xgb_prob = xgb_model.predict_proba(x_test)[:, 1]\n",
-    "\n",
-    "train_rf_prob = rf_model.predict_proba(x_train)[:, 1]\n",
-    "test_rf_prob = rf_model.predict_proba(x_test)[:, 1]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Compute binary predictions"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "cut_off_threshold = 0.3\n",
-    "\n",
-    "train_xgb_binary_predictions = (train_xgb_prob > cut_off_threshold).astype(int)\n",
-    "test_xgb_binary_predictions = (test_xgb_prob > cut_off_threshold).astype(int)\n",
-    "\n",
-    "train_rf_binary_predictions = (train_rf_prob > cut_off_threshold).astype(int)\n",
-    "test_rf_binary_predictions = (test_rf_prob > cut_off_threshold).astype(int)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Document the model\n",
-    "\n",
-    "To document the model with the ValidMind Library, you'll need to:\n",
-    "1. Preprocess the raw dataset\n",
-    "2. Initialize some training and test datasets\n",
-    "3. Initialize a model object you can use for testing\n",
-    "4. Run the full suite of tests"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset`: The dataset that you want to provide as input to tests.\n",
-    "- `input_id`: A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- `target_column`: A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
-    "\n",
-    "With all datasets ready, you can now initialize the raw, preprocessed, feature-engineered, training, and test datasets (`df`, `preprocess_df`, `fe_df`, `train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_preprocess_dataset = vm.init_dataset(\n",
-    "    dataset=preprocess_df,\n",
-    "    input_id=\"preprocess_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_fe_dataset = vm.init_dataset(\n",
-    "    dataset=fe_df,\n",
-    "    input_id=\"fe_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    input_id=\"test_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Initialize a model object\n",
-    "\n",
-    "You will also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data. You simply initialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_xgb_model = vm.init_model(\n",
-    "    xgb_model,\n",
-    "    input_id=\"xgb_model\",\n",
-    ")\n",
-    "\n",
-    "vm_rf_model = vm.init_model(\n",
-    "    rf_model,\n",
-    "    input_id=\"rf_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_3__'></a>\n",
-    "\n",
-    "### Assign prediction values and probabilities to the datasets\n",
-    "\n",
-    "With our model now trained, we'll move on to assigning both the predictive probabilities coming directly from the model's predictions, and the binary prediction after applying the cutoff threshold described in the previous steps. \n",
-    "- These tasks are achieved through the use of the `assign_predictions()` method associated with the VM `dataset` object.\n",
-    "- This method links the model's class prediction values and probabilities to our VM train and test datasets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# XGBoost\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_xgb_model,\n",
-    "    prediction_values=train_xgb_binary_predictions,\n",
-    "    prediction_probabilities=train_xgb_prob,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_xgb_model,\n",
-    "    prediction_values=test_xgb_binary_predictions,\n",
-    "    prediction_probabilities=test_xgb_prob,\n",
-    ")\n",
-    "\n",
-    "# Random Forest\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_rf_model,\n",
-    "    prediction_values=train_rf_binary_predictions,\n",
-    "    prediction_probabilities=train_rf_prob,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_rf_model,\n",
-    "    prediction_values=test_rf_binary_predictions,\n",
-    "    prediction_probabilities=test_rf_prob,\n",
-    ")\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_4__'></a>\n",
-    "\n",
-    "### Compute credit risk scores\n",
-    "\n",
-    "In this phase, we translate model predictions into actionable scores using probability estimates generated by our trained model."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_xgb_scores = lending_club.compute_scores(train_xgb_prob)\n",
-    "test_xgb_scores = lending_club.compute_scores(test_xgb_prob)\n",
-    "\n",
-    "# Assign scores to the datasets\n",
-    "vm_train_ds.add_extra_column(\"xgb_scores\", train_xgb_scores)\n",
-    "vm_test_ds.add_extra_column(\"xgb_scores\", test_xgb_scores)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_5__'></a>\n",
-    "\n",
-    "### Adding custom context to the LLM descriptions\n",
-    "\n",
-    "To add custom context to the LLM-generated test descriptions, set the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED` environment variable to `1` and provide the context text in the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT` environment variable. The context is then used to provide additional guidance to the LLM when it generates descriptions. This is a global setting that will affect all tests."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import os\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\"\n",
-    "\n",
-    "context = \"\"\"\n",
-    "FORMAT FOR THE LLM DESCRIPTIONS: \n",
-    "    **<Test Name>** is designed to <begin with a concise overview of what the test does and its primary purpose, \n",
-    "    extracted from the test description>.\n",
-    "\n",
-    "    The test operates by <write a paragraph about the test mechanism, explaining how it works and what it measures. \n",
-    "    Include any relevant formulas or methodologies mentioned in the test description.>\n",
-    "\n",
-    "    The primary advantages of this test include <write a paragraph about the test's strengths and capabilities, \n",
-    "    highlighting what makes it particularly useful for specific scenarios.>\n",
-    "\n",
-    "    Users should be aware that <write a paragraph about the test's limitations and potential risks. \n",
-    "    Include both technical limitations and interpretation challenges. \n",
-    "    If the test description includes specific signs of high risk, incorporate these here.>\n",
-    "\n",
-    "    **Key Insights:**\n",
-    "\n",
-    "    The test results reveal:\n",
-    "\n",
-    "    - **<insight title>**: <comprehensive description of one aspect of the results>\n",
-    "    - **<insight title>**: <comprehensive description of another aspect>\n",
-    "    ...\n",
-    "\n",
-    "    Based on these results, <conclude with a brief paragraph that ties together the test results with the test's \n",
-    "    purpose and provides any final recommendations or considerations.>\n",
-    "\n",
-    "ADDITIONAL INSTRUCTIONS:\n",
-    "    Present insights in order from general to specific, with each insight as a single bullet point with bold title.\n",
-    "\n",
-    "    For each metric in the test results, include in the test overview:\n",
-    "    - The metric's purpose and what it measures\n",
-    "    - Its mathematical formula\n",
-    "    - The range of possible values\n",
-    "    - What constitutes good/bad performance\n",
-    "    - How to interpret different values\n",
-    "\n",
-    "    Each insight should progressively cover:\n",
-    "    1. Overall scope and distribution\n",
-    "    2. Complete breakdown of all elements with specific values\n",
-    "    3. Natural groupings and patterns\n",
-    "    4. Comparative analysis between datasets/categories\n",
-    "    5. Stability and variations\n",
-    "    6. Notable relationships or dependencies\n",
-    "\n",
-    "    Remember:\n",
-    "    - Keep all insights at the same level (no sub-bullets or nested structures)\n",
-    "    - Make each insight complete and self-contained\n",
-    "    - Include specific numerical values and ranges\n",
-    "    - Cover all elements in the results comprehensively\n",
-    "    - Maintain clear, concise language\n",
-    "    - Use only \"- **Title**: Description\" format for insights\n",
-    "    - Progress naturally from general to specific observations\n",
-    "\n",
-    "\"\"\".strip()\n",
-    "\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT\"] = context"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_6__'></a>\n",
-    "\n",
-    "### Raw data"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.DatasetDescription:raw_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.DescriptiveStatistics:raw_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset,\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.MissingValues:raw_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percentage_threshold\": 1\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.ClassImbalance:raw_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percent_threshold\": 10\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.Duplicates:raw_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percentage_threshold\": 1\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.HighCardinality:raw_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"num_threshold\": 100,\n",
-    "        \"percent_threshold\": 0.1,\n",
-    "        \"threshold_type\": \"percent\"\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.Skewness:raw_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"max_threshold\": 1\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.UniqueRows:raw_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percent_threshold\": 1\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.TooManyZeroValues:raw_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"max_percent_threshold\": 0.03\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.IQROutliersTable:raw_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_raw_dataset,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"threshold\": 5\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_7__'></a>\n",
-    "\n",
-    "### Pre-processed data"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.DescriptiveStatistics:preprocessed_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_preprocess_dataset,\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.TabularDescriptionTables:preprocessed_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_preprocess_dataset\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.MissingValues:preprocessed_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_preprocess_dataset,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_threshold\": 1\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.TabularNumericalHistograms:preprocessed_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_preprocess_dataset\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.TabularCategoricalBarPlots:preprocessed_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_preprocess_dataset\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.TargetRateBarPlots:preprocessed_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_preprocess_dataset\n",
-    "    },\n",
-    "    params={\n",
-    "        \"default_column\": lending_club.target_column,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_8__'></a>\n",
-    "\n",
-    "### Development data"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.DescriptiveStatistics:development_data\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.TabularDescriptionTables:development_data\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.ClassImbalance:development_data\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percent_threshold\": 10\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.UniqueRows:development_data\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percent_threshold\": 1\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.TabularNumericalHistograms:development_data\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_9__'></a>\n",
-    "\n",
-    "### Feature selection"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.MutualInformation:development_data\",\n",
-    "    input_grid  ={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_threshold\": 0.01,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.PearsonCorrelationMatrix:development_data\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.HighPearsonCorrelation:development_data\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"max_threshold\": 0.3,\n",
-    "        \"top_n_correlations\": 10\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.WOEBinTable\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_preprocess_dataset]\n",
-    "    },\n",
-    "    params={\n",
-    "        \"breaks_adj\": lending_club.breaks_adj,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.WOEBinPlots\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_preprocess_dataset]\n",
-    "    },\n",
-    "    params={\n",
-    "        \"breaks_adj\": lending_club.breaks_adj,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_10__'></a>\n",
-    "\n",
-    "### Model training"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.DatasetSplit\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.ModelMetadata\",\n",
-    "    input_grid={\n",
-    "        \"model\": [vm_xgb_model, vm_rf_model],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.ModelParameters\",\n",
-    "    input_grid={\n",
-    "        \"model\": [vm_xgb_model, vm_rf_model],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_11__'></a>\n",
-    "\n",
-    "### Model selection"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.statsmodels.GINITable\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model, vm_rf_model],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model, vm_rf_model],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.TrainingTestDegradation:XGBoost\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"max_threshold\": 0.1\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.TrainingTestDegradation:RandomForest\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": vm_rf_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"max_threshold\": 0.1\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.HyperParametersTuning\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_xgb_model,\n",
-    "        \"dataset\": vm_train_ds,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"param_grid\": {'n_estimators': [50, 100]},\n",
-    "        \"scoring\": ['roc_auc', 'recall'],\n",
-    "        \"fit_params\": {'eval_set': [(x_test, y_test)], 'verbose': False},\n",
-    "        \"thresholds\": [0.3, 0.5],\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_12__'></a>\n",
-    "\n",
-    "### Class discrimination"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumROCAUCScore\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_threshold\": 0.5\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.statsmodels.PredictionProbabilitiesHistogram\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.statsmodels.CumulativePredictionProbabilities\",\n",
-    "    input_grid={\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.PopulationStabilityIndex\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"num_bins\": 10,\n",
-    "        \"mode\": \"fixed\"\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_13__'></a>\n",
-    "\n",
-    "### Classification accuracy"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.ClassifierThresholdOptimization\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_train_ds,\n",
-    "        \"model\": vm_xgb_model\n",
-    "    },\n",
-    "    params={\n",
-    "        \"target_recall\": 0.8 # Find a threshold that achieves a recall of 80%\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.CalibrationCurve\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_threshold\": 0.7\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_threshold\": 0.5\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.PrecisionRecallCurve\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model]\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_14__'></a>\n",
-    "\n",
-    "### Model diagnosis"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.WeakspotsDiagnosis\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.OverfitDiagnosis\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_xgb_model,\n",
-    "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"cut_off_threshold\": 0.04\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.RobustnessDiagnosis\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"scaling_factor_std_dev_list\": [\n",
-    "            0.1,\n",
-    "            0.2,\n",
-    "            0.3,\n",
-    "            0.4,\n",
-    "            0.5\n",
-    "        ],\n",
-    "        \"performance_decay_threshold\": 0.05\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_15__'></a>\n",
-    "\n",
-    "### Model explainability"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.PermutationFeatureImportance\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.FeaturesAUC\",\n",
-    "    input_grid={\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.SHAPGlobalImportance\",\n",
-    "    input_grid={\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"kernel_explainer_samples\": 10,\n",
-    "        \"tree_or_linear_explainer_samples\": 200,\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_16__'></a>\n",
-    "\n",
-    "### Scoring evaluation"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.statsmodels.ScorecardHistogram\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"score_column\": \"xgb_scores\",\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.ScoreBandDefaultRates\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds],\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "    },\n",
-    "    params = {\n",
-    "        \"score_column\": \"xgb_scores\",\n",
-    "        \"score_bands\": [500, 540, 570]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.ScoreProbabilityAlignment\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_train_ds],\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"score_column\": \"xgb_scores\",\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Custom tests\n",
-    "\n",
-    "Custom tests extend the functionality of ValidMind, allowing you to document any model or use case with added flexibility.\n",
-    "\n",
-    "ValidMind provides a comprehensive set of tests out-of-the-box to evaluate and document your models and datasets. We recognize there will be cases where the default tests do not support a model or dataset, or specific documentation is needed. In these cases, you can create and use your own custom code to accomplish what you need. To streamline custom code integration, we support the creation of custom test functions."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### In-line custom tests\n",
-    "\n",
-    "The `@vm.test` decorator is doing the work of creating a wrapper around the function that will allow it to be run by the ValidMind Library. It also registers the test so it can be found by the ID `my_custom_tests.ScoreToOdds\"`. The function `score_to_odds_analysis` takes three arguments `dataset`, `score_column`, and `score_bands`. This is a `VMDataset` and the rest are parameters that can be passed in."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import numpy as np\n",
-    "import pandas as pd\n",
-    "import plotly.graph_objects as go\n",
-    "\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.ScoreToOdds\")\n",
-    "def score_to_odds_analysis(dataset, score_column='score', score_bands=[410, 440, 470]):\n",
-    "    \"\"\"\n",
-    "    Analyzes the relationship between score bands and odds (good:bad ratio).\n",
-    "    Good odds = (1 - default_rate) / default_rate\n",
-    "    \n",
-    "    Higher scores should correspond to higher odds of being good.\n",
-    "    \"\"\"\n",
-    "    df = dataset.df\n",
-    "    \n",
-    "    # Create score bands\n",
-    "    df['score_band'] = pd.cut(\n",
-    "        df[score_column],\n",
-    "        bins=[-np.inf] + score_bands + [np.inf],\n",
-    "        labels=[f'<{score_bands[0]}'] + \n",
-    "               [f'{score_bands[i]}-{score_bands[i+1]}' for i in range(len(score_bands)-1)] +\n",
-    "               [f'>{score_bands[-1]}']\n",
-    "    )\n",
-    "    \n",
-    "    # Calculate metrics per band\n",
-    "    results = df.groupby('score_band').agg({\n",
-    "        dataset.target_column: ['mean', 'count']\n",
-    "    })\n",
-    "    \n",
-    "    results.columns = ['Default Rate', 'Total']\n",
-    "    results['Good Count'] = results['Total'] - (results['Default Rate'] * results['Total'])\n",
-    "    results['Bad Count'] = results['Default Rate'] * results['Total']\n",
-    "    results['Odds'] = results['Good Count'] / results['Bad Count']\n",
-    "    \n",
-    "    # Create visualization\n",
-    "    fig = go.Figure()\n",
-    "    \n",
-    "    # Add odds bars\n",
-    "    fig.add_trace(go.Bar(\n",
-    "        name='Odds (Good:Bad)',\n",
-    "        x=results.index,\n",
-    "        y=results['Odds'],\n",
-    "        marker_color='blue'\n",
-    "    ))\n",
-    "    \n",
-    "    fig.update_layout(\n",
-    "        title='Score-to-Odds Analysis',\n",
-    "        yaxis=dict(title='Odds Ratio (Good:Bad)'),\n",
-    "        showlegend=False\n",
-    "    )\n",
-    "    \n",
-    "    return fig"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"my_custom_tests.ScoreToOdds\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"score_column\": \"xgb_scores\",\n",
-    "        \"score_bands\": [500, 540, 570],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Local test provider\n",
-    "\n",
-    "The ValidMind Library offers the ability to extend the built-in library of tests with custom tests. A test \"Provider\" is a Python class that gets registered with the ValidMind Library and loads tests based on a test ID, for example `my_test_provider.my_test_id`. The built-in suite of tests that ValidMind offers is technically its own test provider. You can use one the built-in test provider offered by ValidMind (`validmind.tests.test_providers.LocalTestProvider`) or you can create your own. More than likely, you'll want to use the `LocalTestProvider` to add a directory of custom tests but there's flexibility to be able to load tests from any source."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.tests import LocalTestProvider\n",
-    "\n",
-    "# Define the folder where your tests are located\n",
-    "tests_folder = \"custom_tests\"\n",
-    "\n",
-    "# initialize the test provider with the tests folder we created earlier\n",
-    "my_test_provider = LocalTestProvider(tests_folder)\n",
-    "\n",
-    "vm.tests.register_test_provider(\n",
-    "    namespace=\"my_test_provider\",\n",
-    "    test_provider=my_test_provider,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now that we have our test provider set up, we can run any test that's located in our tests folder by using the `run_test()` method. This function is your entry point to running single tests in the ValidMind Library. It takes a test ID and runs the test associated with that ID. For our custom tests, the test ID will be the `namespace` specified when registering the provider, followed by the path to the test file relative to the tests folder. For example, the Confusion Matrix test we created earlier will have the test ID `my_test_provider.ConfusionMatrix`. You could organize the tests in subfolders, say `classification` and `regression`, and the test ID for the Confusion Matrix test would then be `my_test_provider.classification.ConfusionMatrix`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"my_test_provider.ScoreBandDiscriminationMetrics\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"score_column\": \"xgb_scores\",\n",
-    "        \"score_bands\": [500, 540, 570],\n",
-    "    }\n",
-    ").log(section_id=\"interpretability_insights\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "3. Expand the following sections and take a look around:\n",
-    "\n",
-    "   - **2. Data Preparation**\n",
-    "   - **3. Model Development**\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation (hint: some of the tests in **2.3. Feature Selection and Engineering** look like they need some attention), view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc7_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-ced6c79ffe99424fa8a48ed9ce2be9a5",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "validmind-eEL8LtKG-py3.10",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Document an application scorecard model\n",
+        "\n",
+        "Build and document an *application scorecard model* with the ValidMind Library by using Kaggle's [Lending Club](https://www.kaggle.com/datasets/devanshi23/loan-data-2007-2014/data) sample dataset to build a simple application scorecard.\n",
+        "\n",
+        "An application scorecard model is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant — such as credit history, income, employment status, and other relevant financial data. \n",
+        "\n",
+        "- This score helps lenders make decisions about whether to approve or reject loan applications, as well as determine the terms of the loan, including interest rates and credit limits. \n",
+        "- Application scorecard models enable lenders to manage risk efficiently while making the loan application process faster and more transparent for applicants.\n",
+        "\n",
+        "This interactive notebook provides a step-by-step guide for loading a demo dataset, preprocessing the raw data, training a model for testing, setting up test inputs, initializing the required ValidMind objects, running the test, and then logging the results to ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_4__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "  - [Preprocess the dataset](#toc3_1__)    \n",
+        "  - [Feature engineering](#toc3_2__)    \n",
+        "- [Train the model](#toc4__)    \n",
+        "  - [Compute probabilities](#toc4_1__)    \n",
+        "  - [Compute binary predictions](#toc4_2__)    \n",
+        "- [Document the model](#toc5__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc5_1__)    \n",
+        "  - [Initialize the ValidMind models](#toc5_2__)    \n",
+        "  - [Assign prediction values and probabilities to the datasets](#toc5_3__)    \n",
+        "  - [Compute credit risk scores](#toc5_4__)    \n",
+        "  - [Adding custom context to the LLM descriptions](#toc5_5__)    \n",
+        "  - [Raw data](#toc5_6__)    \n",
+        "  - [Pre-processed data](#toc5_7__)    \n",
+        "  - [Development data](#toc5_8__)    \n",
+        "  - [Feature selection](#toc5_9__)    \n",
+        "  - [Model training](#toc5_10__)    \n",
+        "  - [Model selection](#toc5_11__)    \n",
+        "  - [Class discrimination](#toc5_12__)    \n",
+        "  - [Classification accuracy](#toc5_13__)    \n",
+        "  - [Model diagnosis](#toc5_14__)    \n",
+        "  - [Model explainability](#toc5_15__)    \n",
+        "  - [Scoring evaluation](#toc5_16__)    \n",
+        "- [Custom tests](#toc6__)    \n",
+        "  - [In-line custom tests](#toc6_1__)    \n",
+        "  - [Local test provider](#toc6_2__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Work with your documentation](#toc7_1__)    \n",
+        "  - [Discover more learning resources](#toc7_2__)    \n",
+        "- [Upgrade ValidMind](#toc8__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br><br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "  # api_host = \"...\",\n",
+        "  # api_key = \"...\",\n",
+        "  # api_secret = \"...\",\n",
+        "  # model = \"...\",\n",
+        "  document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import xgboost as xgb\n",
+        "from sklearn.ensemble import RandomForestClassifier\n",
+        "\n",
+        "from validmind.tests import run_test\n",
+        "from validmind.datasets.credit_risk import lending_club\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind Library. To use it, you'll need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "df = lending_club.load_data(source=\"offline\")\n",
+        "\n",
+        "df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Preprocess the dataset\n",
+        "\n",
+        "In the preprocessing step we perform a number of operations to get ready for building our application scorecard. \n",
+        "\n",
+        "We use the `lending_club.preprocess()` function to simplify preprocessing. This function performs the following operations:\n",
+        "- Filters the dataset to include only loans for debt consolidation or credit card purposes\n",
+        "- Removes loans classified under the riskier grades \"F\" and \"G\"\n",
+        "- Excludes uncommon home ownership types and standardizes employment length and loan terms into numerical formats\n",
+        "- Discards unnecessary fields and any entries with missing information to maintain a clean and robust dataset for modeling"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "preprocess_df = lending_club.preprocess(df)\n",
+        "preprocess_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Feature engineering\n",
+        "\n",
+        "In the feature engineering phase, we apply specific transformations to optimize the dataset for predictive modeling in our application scorecard. \n",
+        "\n",
+        "Using the `lending_club.feature_engineering()` function, we conduct the following operations:\n",
+        "- **WoE encoding**: Converts both numerical and categorical features into Weight of Evidence (WoE) values. WoE is a statistical measure used in scorecard modeling that quantifies the relationship between a predictor variable and the binary target variable. It calculates the ratio of the distribution of good outcomes to the distribution of bad outcomes for each category or bin of a feature. This transformation helps to ensure that the features are predictive and consistent in their contribution to the model.\n",
+        "- **Integration of WoE bins**: Ensures that the WoE transformed values are integrated throughout the dataset, replacing the original feature values while excluding the target variable from this transformation. This transformation is used to maintain a consistent scale and impact of each variable within the model, which helps make the predictions more stable and accurate."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "fe_df = lending_club.feature_engineering(preprocess_df)\n",
+        "fe_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Train the model\n",
+        "\n",
+        "In this section, we focus on constructing and refining our predictive model. \n",
+        "- We begin by dividing our data, which is based on Weight of Evidence (WoE) features, into training and testing sets (`train_df`, `test_df`). \n",
+        "- With `lending_club.split`, we employ a simple random split, randomly allocating data points to each set to ensure a mix of examples in both."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Split the data\n",
+        "train_df, test_df = lending_club.split(fe_df, test_size=0.2)\n",
+        "\n",
+        "x_train = train_df.drop(lending_club.target_column, axis=1)\n",
+        "y_train = train_df[lending_club.target_column]\n",
+        "\n",
+        "x_test = test_df.drop(lending_club.target_column, axis=1)\n",
+        "y_test = test_df[lending_club.target_column]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Define the XGBoost model\n",
+        "xgb_model = xgb.XGBClassifier(\n",
+        "    n_estimators=50, \n",
+        "    random_state=42, \n",
+        "    early_stopping_rounds=10\n",
+        ")\n",
+        "xgb_model.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "\n",
+        "# Fit the model\n",
+        "xgb_model.fit(\n",
+        "    x_train, \n",
+        "    y_train,\n",
+        "    eval_set=[(x_test, y_test)],\n",
+        "    verbose=False\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Define the Random Forest model\n",
+        "rf_model = RandomForestClassifier(\n",
+        "    n_estimators=50, \n",
+        "    random_state=42,\n",
+        ")\n",
+        "\n",
+        "# Fit the model\n",
+        "rf_model.fit(x_train, y_train)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Compute probabilities"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_xgb_prob = xgb_model.predict_proba(x_train)[:, 1]\n",
+        "test_xgb_prob = xgb_model.predict_proba(x_test)[:, 1]\n",
+        "\n",
+        "train_rf_prob = rf_model.predict_proba(x_train)[:, 1]\n",
+        "test_rf_prob = rf_model.predict_proba(x_test)[:, 1]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Compute binary predictions"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "cut_off_threshold = 0.3\n",
+        "\n",
+        "train_xgb_binary_predictions = (train_xgb_prob > cut_off_threshold).astype(int)\n",
+        "test_xgb_binary_predictions = (test_xgb_prob > cut_off_threshold).astype(int)\n",
+        "\n",
+        "train_rf_binary_predictions = (train_rf_prob > cut_off_threshold).astype(int)\n",
+        "test_rf_binary_predictions = (test_rf_prob > cut_off_threshold).astype(int)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Document the model\n",
+        "\n",
+        "To document the model with the ValidMind Library, you'll need to:\n",
+        "1. Preprocess the raw dataset\n",
+        "2. Initialize some training and test datasets\n",
+        "3. Initialize a ValidMind model object for use with testing\n",
+        "4. Run the full suite of tests"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset`: The dataset that you want to provide as input to tests.\n",
+        "- `input_id`: A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- `target_column`: A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
+        "\n",
+        "With all datasets ready, you can now initialize the raw, preprocessed, feature-engineered, training, and test datasets (`df`, `preprocess_df`, `fe_df`, `train_df`, and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_preprocess_dataset = vm.init_dataset(\n",
+        "    dataset=preprocess_df,\n",
+        "    input_id=\"preprocess_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_fe_dataset = vm.init_dataset(\n",
+        "    dataset=fe_df,\n",
+        "    input_id=\"fe_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    input_id=\"test_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind models\n",
+        "\n",
+        "You'll also need to initialize ValidMind model objects (`vm_model`) that can be passed to other functions for analysis and tests on the data for our models.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_xgb_model = vm.init_model(\n",
+        "    xgb_model,\n",
+        "    input_id=\"xgb_model\",\n",
+        ")\n",
+        "\n",
+        "vm_rf_model = vm.init_model(\n",
+        "    rf_model,\n",
+        "    input_id=\"rf_model\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_3__'></a>\n",
+        "\n",
+        "### Assign prediction values and probabilities to the datasets\n",
+        "\n",
+        "With our models now trained, we'll move on to assigning both the predictive probabilities coming directly from each model's predictions, and the binary predictions after applying the cutoff threshold described in the previous steps.\n",
+        "- These tasks are achieved through the use of the `assign_predictions()` method associated with the VM `dataset` object.\n",
+        "- This method links the model's class prediction values and probabilities to our VM train and test datasets."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# XGBoost\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_xgb_model,\n",
+        "    prediction_values=train_xgb_binary_predictions,\n",
+        "    prediction_probabilities=train_xgb_prob,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_xgb_model,\n",
+        "    prediction_values=test_xgb_binary_predictions,\n",
+        "    prediction_probabilities=test_xgb_prob,\n",
+        ")\n",
+        "\n",
+        "# Random Forest\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_rf_model,\n",
+        "    prediction_values=train_rf_binary_predictions,\n",
+        "    prediction_probabilities=train_rf_prob,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_rf_model,\n",
+        "    prediction_values=test_rf_binary_predictions,\n",
+        "    prediction_probabilities=test_rf_prob,\n",
+        ")\n"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_4__'></a>\n",
+        "\n",
+        "### Compute credit risk scores\n",
+        "\n",
+        "In this phase, we translate model predictions into actionable scores using probability estimates generated by our trained model."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_xgb_scores = lending_club.compute_scores(train_xgb_prob)\n",
+        "test_xgb_scores = lending_club.compute_scores(test_xgb_prob)\n",
+        "\n",
+        "# Assign scores to the datasets\n",
+        "vm_train_ds.add_extra_column(\"xgb_scores\", train_xgb_scores)\n",
+        "vm_test_ds.add_extra_column(\"xgb_scores\", test_xgb_scores)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_5__'></a>\n",
+        "\n",
+        "### Adding custom context to the LLM descriptions\n",
+        "\n",
+        "To add custom context to the LLM-generated test descriptions, set the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED` environment variable to `1` and provide the context text in the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT` environment variable. This is a global setting that will affect all tests."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import os\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\"\n",
+        "\n",
+        "context = \"\"\"\n",
+        "FORMAT FOR THE LLM DESCRIPTIONS: \n",
+        "    **<Test Name>** is designed to <begin with a concise overview of what the test does and its primary purpose, \n",
+        "    extracted from the test description>.\n",
+        "\n",
+        "    The test operates by <write a paragraph about the test mechanism, explaining how it works and what it measures. \n",
+        "    Include any relevant formulas or methodologies mentioned in the test description.>\n",
+        "\n",
+        "    The primary advantages of this test include <write a paragraph about the test's strengths and capabilities, \n",
+        "    highlighting what makes it particularly useful for specific scenarios.>\n",
+        "\n",
+        "    Users should be aware that <write a paragraph about the test's limitations and potential risks. \n",
+        "    Include both technical limitations and interpretation challenges. \n",
+        "    If the test description includes specific signs of high risk, incorporate these here.>\n",
+        "\n",
+        "    **Key Insights:**\n",
+        "\n",
+        "    The test results reveal:\n",
+        "\n",
+        "    - **<insight title>**: <comprehensive description of one aspect of the results>\n",
+        "    - **<insight title>**: <comprehensive description of another aspect>\n",
+        "    ...\n",
+        "\n",
+        "    Based on these results, <conclude with a brief paragraph that ties together the test results with the test's \n",
+        "    purpose and provides any final recommendations or considerations.>\n",
+        "\n",
+        "ADDITIONAL INSTRUCTIONS:\n",
+        "    Present insights in order from general to specific, with each insight as a single bullet point with bold title.\n",
+        "\n",
+        "    For each metric in the test results, include in the test overview:\n",
+        "    - The metric's purpose and what it measures\n",
+        "    - Its mathematical formula\n",
+        "    - The range of possible values\n",
+        "    - What constitutes good/bad performance\n",
+        "    - How to interpret different values\n",
+        "\n",
+        "    Each insight should progressively cover:\n",
+        "    1. Overall scope and distribution\n",
+        "    2. Complete breakdown of all elements with specific values\n",
+        "    3. Natural groupings and patterns\n",
+        "    4. Comparative analysis between datasets/categories\n",
+        "    5. Stability and variations\n",
+        "    6. Notable relationships or dependencies\n",
+        "\n",
+        "    Remember:\n",
+        "    - Keep all insights at the same level (no sub-bullets or nested structures)\n",
+        "    - Make each insight complete and self-contained\n",
+        "    - Include specific numerical values and ranges\n",
+        "    - Cover all elements in the results comprehensively\n",
+        "    - Maintain clear, concise language\n",
+        "    - Use only \"- **Title**: Description\" format for insights\n",
+        "    - Progress naturally from general to specific observations\n",
+        "\n",
+        "\"\"\".strip()\n",
+        "\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT\"] = context"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_6__'></a>\n",
+        "\n",
+        "### Raw data"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.DatasetDescription:raw_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.DescriptiveStatistics:raw_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset,\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.MissingValues:raw_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percentage_threshold\": 1\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.ClassImbalance:raw_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percent_threshold\": 10\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.Duplicates:raw_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percentage_threshold\": 1\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.HighCardinality:raw_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"num_threshold\": 100,\n",
+        "        \"percent_threshold\": 0.1,\n",
+        "        \"threshold_type\": \"percent\"\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.Skewness:raw_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"max_threshold\": 1\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.UniqueRows:raw_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percent_threshold\": 1\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.TooManyZeroValues:raw_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"max_percent_threshold\": 0.03\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.IQROutliersTable:raw_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_raw_dataset,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"threshold\": 5\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_7__'></a>\n",
+        "\n",
+        "### Pre-processed data"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.DescriptiveStatistics:preprocessed_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_preprocess_dataset,\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.TabularDescriptionTables:preprocessed_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_preprocess_dataset\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.MissingValues:preprocessed_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_preprocess_dataset,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_threshold\": 1\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.TabularNumericalHistograms:preprocessed_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_preprocess_dataset\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.TabularCategoricalBarPlots:preprocessed_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_preprocess_dataset\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.TargetRateBarPlots:preprocessed_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_preprocess_dataset\n",
+        "    },\n",
+        "    params={\n",
+        "        \"default_column\": lending_club.target_column,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_8__'></a>\n",
+        "\n",
+        "### Development data"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.DescriptiveStatistics:development_data\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.TabularDescriptionTables:development_data\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.ClassImbalance:development_data\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percent_threshold\": 10\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.UniqueRows:development_data\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percent_threshold\": 1\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.TabularNumericalHistograms:development_data\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_9__'></a>\n",
+        "\n",
+        "### Feature selection"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.MutualInformation:development_data\",\n",
+        "    input_grid  ={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_threshold\": 0.01,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.PearsonCorrelationMatrix:development_data\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.HighPearsonCorrelation:development_data\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"max_threshold\": 0.3,\n",
+        "        \"top_n_correlations\": 10\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.WOEBinTable\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_preprocess_dataset]\n",
+        "    },\n",
+        "    params={\n",
+        "        \"breaks_adj\": lending_club.breaks_adj,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.WOEBinPlots\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_preprocess_dataset]\n",
+        "    },\n",
+        "    params={\n",
+        "        \"breaks_adj\": lending_club.breaks_adj,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_10__'></a>\n",
+        "\n",
+        "### Model training"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.DatasetSplit\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.ModelMetadata\",\n",
+        "    input_grid={\n",
+        "        \"model\": [vm_xgb_model, vm_rf_model],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.ModelParameters\",\n",
+        "    input_grid={\n",
+        "        \"model\": [vm_xgb_model, vm_rf_model],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_11__'></a>\n",
+        "\n",
+        "### Model selection"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.statsmodels.GINITable\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model, vm_rf_model],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model, vm_rf_model],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.TrainingTestDegradation:XGBoost\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"max_threshold\": 0.1\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.TrainingTestDegradation:RandomForest\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": vm_rf_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"max_threshold\": 0.1\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.HyperParametersTuning\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_xgb_model,\n",
+        "        \"dataset\": vm_train_ds,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"param_grid\": {'n_estimators': [50, 100]},\n",
+        "        \"scoring\": ['roc_auc', 'recall'],\n",
+        "        \"fit_params\": {'eval_set': [(x_test, y_test)], 'verbose': False},\n",
+        "        \"thresholds\": [0.3, 0.5],\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_12__'></a>\n",
+        "\n",
+        "### Class discrimination"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumROCAUCScore\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_threshold\": 0.5\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.statsmodels.PredictionProbabilitiesHistogram\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.statsmodels.CumulativePredictionProbabilities\",\n",
+        "    input_grid={\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.PopulationStabilityIndex\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"num_bins\": 10,\n",
+        "        \"mode\": \"fixed\"\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_13__'></a>\n",
+        "\n",
+        "### Classification accuracy"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.ClassifierThresholdOptimization\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_train_ds,\n",
+        "        \"model\": vm_xgb_model\n",
+        "    },\n",
+        "    params={\n",
+        "        \"target_recall\": 0.8 # Find a threshold that achieves a recall of 80%\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.CalibrationCurve\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_threshold\": 0.7\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_threshold\": 0.5\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.PrecisionRecallCurve\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model]\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_14__'></a>\n",
+        "\n",
+        "### Model diagnosis"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.WeakspotsDiagnosis\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.OverfitDiagnosis\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_xgb_model,\n",
+        "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"cut_off_threshold\": 0.04\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.RobustnessDiagnosis\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"scaling_factor_std_dev_list\": [\n",
+        "            0.1,\n",
+        "            0.2,\n",
+        "            0.3,\n",
+        "            0.4,\n",
+        "            0.5\n",
+        "        ],\n",
+        "        \"performance_decay_threshold\": 0.05\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_15__'></a>\n",
+        "\n",
+        "### Model explainability"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.PermutationFeatureImportance\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model]\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.FeaturesAUC\",\n",
+        "    input_grid={\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.SHAPGlobalImportance\",\n",
+        "    input_grid={\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"kernel_explainer_samples\": 10,\n",
+        "        \"tree_or_linear_explainer_samples\": 200,\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_16__'></a>\n",
+        "\n",
+        "### Scoring evaluation"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.statsmodels.ScorecardHistogram\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds, vm_test_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"score_column\": \"xgb_scores\",\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.ScoreBandDefaultRates\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds],\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "    },\n",
+        "    params = {\n",
+        "        \"score_column\": \"xgb_scores\",\n",
+        "        \"score_bands\": [500, 540, 570]\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.ScoreProbabilityAlignment\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_train_ds],\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"score_column\": \"xgb_scores\",\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Custom tests\n",
+        "\n",
+        "Custom tests extend the functionality of ValidMind, allowing you to document any model or use case with added flexibility.\n",
+        "\n",
+        "ValidMind provides a comprehensive set of tests out-of-the-box to evaluate and document your models and datasets. We recognize there will be cases where the default tests do not support a model or dataset, or specific documentation is needed. In these cases, you can create and use your own custom code to accomplish what you need. To streamline custom code integration, we support the creation of custom test functions."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### In-line custom tests\n",
+        "\n",
+        "The `@vm.test` decorator creates a wrapper around the function that allows it to be run by the ValidMind Library. It also registers the test so it can be found by the ID `my_custom_tests.ScoreToOdds`. The function `score_to_odds_analysis` takes three arguments: `dataset`, `score_column`, and `score_bands`. The `dataset` argument is a `VMDataset`, and the other two are parameters that can be passed in."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import numpy as np\n",
+        "import pandas as pd\n",
+        "import plotly.graph_objects as go\n",
+        "\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.ScoreToOdds\")\n",
+        "def score_to_odds_analysis(dataset, score_column='score', score_bands=[410, 440, 470]):\n",
+        "    \"\"\"\n",
+        "    Analyzes the relationship between score bands and odds (good:bad ratio).\n",
+        "    Good odds = (1 - default_rate) / default_rate\n",
+        "    \n",
+        "    Higher scores should correspond to higher odds of being good.\n",
+        "    \"\"\"\n",
+        "    df = dataset.df\n",
+        "    \n",
+        "    # Create score bands\n",
+        "    df['score_band'] = pd.cut(\n",
+        "        df[score_column],\n",
+        "        bins=[-np.inf] + score_bands + [np.inf],\n",
+        "        labels=[f'<{score_bands[0]}'] + \n",
+        "               [f'{score_bands[i]}-{score_bands[i+1]}' for i in range(len(score_bands)-1)] +\n",
+        "               [f'>{score_bands[-1]}']\n",
+        "    )\n",
+        "    \n",
+        "    # Calculate metrics per band\n",
+        "    results = df.groupby('score_band').agg({\n",
+        "        dataset.target_column: ['mean', 'count']\n",
+        "    })\n",
+        "    \n",
+        "    results.columns = ['Default Rate', 'Total']\n",
+        "    results['Good Count'] = results['Total'] - (results['Default Rate'] * results['Total'])\n",
+        "    results['Bad Count'] = results['Default Rate'] * results['Total']\n",
+        "    results['Odds'] = results['Good Count'] / results['Bad Count']\n",
+        "    \n",
+        "    # Create visualization\n",
+        "    fig = go.Figure()\n",
+        "    \n",
+        "    # Add odds bars\n",
+        "    fig.add_trace(go.Bar(\n",
+        "        name='Odds (Good:Bad)',\n",
+        "        x=results.index,\n",
+        "        y=results['Odds'],\n",
+        "        marker_color='blue'\n",
+        "    ))\n",
+        "    \n",
+        "    fig.update_layout(\n",
+        "        title='Score-to-Odds Analysis',\n",
+        "        yaxis=dict(title='Odds Ratio (Good:Bad)'),\n",
+        "        showlegend=False\n",
+        "    )\n",
+        "    \n",
+        "    return fig"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"my_custom_tests.ScoreToOdds\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"score_column\": \"xgb_scores\",\n",
+        "        \"score_bands\": [500, 540, 570],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Local test provider\n",
+        "\n",
+        "The ValidMind Library offers the ability to extend the built-in library of tests with custom tests. A test \"Provider\" is a Python class that gets registered with the ValidMind Library and loads tests based on a test ID, for example `my_test_provider.my_test_id`. The built-in suite of tests that ValidMind offers is technically its own test provider. You can use the built-in test provider offered by ValidMind (`validmind.tests.test_providers.LocalTestProvider`), or you can create your own. More than likely, you'll want to use the `LocalTestProvider` to add a directory of custom tests, but you have the flexibility to load tests from any source."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.tests import LocalTestProvider\n",
+        "\n",
+        "# Define the folder where your tests are located\n",
+        "tests_folder = \"custom_tests\"\n",
+        "\n",
+        "# initialize the test provider with the tests folder we created earlier\n",
+        "my_test_provider = LocalTestProvider(tests_folder)\n",
+        "\n",
+        "vm.tests.register_test_provider(\n",
+        "    namespace=\"my_test_provider\",\n",
+        "    test_provider=my_test_provider,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now that we have our test provider set up, we can run any test that's located in our tests folder by using the `run_test()` method. This function is your entry point to running single tests in the ValidMind Library. It takes a test ID and runs the test associated with that ID. For our custom tests, the test ID will be the `namespace` specified when registering the provider, followed by the path to the test file relative to the tests folder. For example, the Confusion Matrix test we created earlier will have the test ID `my_test_provider.ConfusionMatrix`. You could organize the tests in subfolders, say `classification` and `regression`, and the test ID for the Confusion Matrix test would then be `my_test_provider.classification.ConfusionMatrix`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"my_test_provider.ScoreBandDiscriminationMetrics\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"score_column\": \"xgb_scores\",\n",
+        "        \"score_bands\": [500, 540, 570],\n",
+        "    }\n",
+        ").log(section_id=\"interpretability_insights\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "3. Expand the following sections and take a look around:\n",
+        "\n",
+        "   - **2. Data Preparation**\n",
+        "   - **3. Model Development**\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation (hint: some of the tests in **2.3. Feature Selection and Engineering** look like they need some attention), view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc7_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-245d3f2bfcad480aa6baa2bde87c76e6"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "validmind-eEL8LtKG-py3.10",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/use_cases/credit_risk/document_excel_application_scorecard.ipynb b/site/notebooks/use_cases/credit_risk/document_excel_application_scorecard.ipynb
index be351497c2..fa8e86113a 100644
--- a/site/notebooks/use_cases/credit_risk/document_excel_application_scorecard.ipynb
+++ b/site/notebooks/use_cases/credit_risk/document_excel_application_scorecard.ipynb
@@ -1,1007 +1,1022 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Document an Excel-based application scorecard model\n",
-    "\n",
-    "Build and document an Excel-based application scorecard model with the ValidMind Library. Learn how to load an Excel-based model, prepare your datasets and model for testing, run tests and log those test results to the ValidMind Platform.\n",
-    "\n",
-    "An *application scorecard model* is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant such as credit history, income, employment status, and other relevant financial data.\n",
-    "\n",
-    " - This score assists lenders in making informed decisions about whether to approve or reject loan applications, as well as in determining the terms of the loan, including interest rates and credit limits.\n",
-    " - Effective validation of application scorecard models ensures that lenders can manage risk efficiently while maintaining a fast and transparent loan application process for applicants."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_4__)    \n",
-    "- [Loading the sample datasets](#toc3__)    \n",
-    "  - [Load the raw dataset](#toc3_1__)    \n",
-    "  - [Load the preprocessed dataset](#toc3_2__)    \n",
-    "  - [Load the training and test datasets](#toc3_3__)    \n",
-    "- [Initialize the ValidMind datasets](#toc4__)    \n",
-    "- [Initializing a model object](#toc5__)    \n",
-    "  - [Link predictions](#toc5_1__)    \n",
-    "- [Running tests](#toc6__)    \n",
-    "  - [Enable custom context for test descriptions](#toc6_1__)    \n",
-    "  - [Define tests to run](#toc6_2__)    \n",
-    "  - [Run defined tests](#toc6_3__)    \n",
-    "- [Next steps](#toc7__)    \n",
-    "  - [Work with your model documentation](#toc7_1__)    \n",
-    "    - [Add individual test results to documentation](#toc7_1_1__)    \n",
-    "  - [Discover more learning resources](#toc7_2__)    \n",
-    "- [Upgrade ValidMind](#toc8__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "If you haven't already seen our [Get started with the ValidMind Library](https://docs.validmind.ai/developer/get-started-validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models, find code samples, or read our developer reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "- **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "- **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "- **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "- **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: The [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2); border-radius: 5px;\">\n",
-    "  <span style=\"color: #083E44;\"><b>Recommended Python versions</b></span><br />\n",
-    "  Python 3.8 ≤ x ≤ 3.11\n",
-    "</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Then, let's import the necessary libraries and set up your Python environment for data analysis:\n",
-    "\n",
-    "- Install **OpenPyPL** (openpyxl) which will allow us to read and write `.xlsx` files.\n",
-    "- Import `pandas`, a Python library for data manipulation and analytics, as an alias.\n",
-    "- Enable `matplotlib`, a plotting library used for visualizing data. Ensures that any plots you generate will render inline in our notebook output rather than opening in a separate window."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install openpyxl\n",
-    "\n",
-    "import pandas as pd\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Loading the sample datasets\n",
-    "\n",
-    "Let's import our sample dataset in the form of an Excel workbook ([CreditRiskData.xlsx](CreditRiskData.xlsx)) with five sheets indexed 0 to 3, each representing a different stage of data preparation:\n",
-    "\n",
-    "0. **Raw Data** – The original unprocessed dataset.\n",
-    "1. **Preprocessed Data** – A cleaned and prepared version of the raw data.\n",
-    "2. **Train Data** – A training subset used to fit your model.\n",
-    "3. **Test Data** – A testing subset used to evaluate model performance."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Load the raw dataset\n",
-    "\n",
-    "We'll start by loading the **Raw Data** sheet (index `0`) into a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "df = pd.read_excel('CreditRiskData.xlsx', sheet_name=0,engine='openpyxl')\n",
-    "\n",
-    "df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Load the preprocessed dataset\n",
-    "\n",
-    "Next, load the **Preprocessed Data** sheet (index `1`), containing cleaned inputs ready for scoring:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "preprocess_df = pd.read_excel('CreditRiskData.xlsx', sheet_name=1,engine='openpyxl')\n",
-    "preprocess_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3__'></a>\n",
-    "\n",
-    "### Load the training and test datasets\n",
-    "\n",
-    "Finally, load the split training (**Train Data**, index `2`) and testing (**Test Data**, index `3`) sets:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_df = pd.read_excel('CreditRiskData.xlsx', sheet_name=2,engine='openpyxl')\n",
-    "test_df = pd.read_excel('CreditRiskData.xlsx', sheet_name=3,engine='openpyxl')"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests with your loaded datasets, you must first initialize a ValidMind `Dataset` object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
-    "\n",
-    "For this example, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`dataset`:** The input DataFrame to test.\n",
-    "- **`input_id`:** A unique identifier for tracking test inputs.\n",
-    "- **`target_column`:** Required for tests that compare predictions to actual outcomes; specify the name of the column with the true values."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the raw dataset\n",
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column='loan_status',\n",
-    ")\n",
-    "\n",
-    "# Initialize the preprocessed dataset\n",
-    "vm_preprocess_dataset = vm.init_dataset(\n",
-    "    dataset=preprocess_df,\n",
-    "    input_id=\"preprocess_dataset\",\n",
-    "    target_column='loan_status',\n",
-    ")\n",
-    "\n",
-    "# Initialize the training dataset\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column='loan_status',\n",
-    ")\n",
-    "\n",
-    "# Initialize the testing dataset\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    input_id=\"test_dataset\",\n",
-    "    target_column='loan_status',\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Initializing a model object\n",
-    "\n",
-    "In this Excel-based use case, predictions are precomputed and included in the Excel file. While there's no model logic to run, a ValidMind model object (`vm_model`) is still required for passing to other functions for analysis and tests on the data.\n",
-    "\n",
-    "Simply define a placeholder model using [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Prediction logic placeholder\n",
-    "def dummy(X, **kwargs):\n",
-    "    return None\n",
-    "\n",
-    "xgb_model = vm.init_model(\n",
-    "        input_id=\"xgb_model\",\n",
-    "        predict_fn=dummy\n",
-    "    )"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Link predictions\n",
-    "\n",
-    "Once the model has been registered, you can assign model predictions to the training and testing datasets.\n",
-    "\n",
-    "Use the [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object to link the prediction values and probabilities from the relevant columns on our Excel spreadsheet to the training and testing datasets:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(model=xgb_model, prediction_column=\"xgb_model_prediction\",probability_column='xgb_model_probabilities')\n",
-    "vm_test_ds.assign_predictions(model=xgb_model, prediction_column=\"xgb_model_prediction\",probability_column='xgb_model_probabilities')"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Running tests\n",
-    "\n",
-    "This is where it all comes together — we'll use our previously initialized datasets as inputs to run tests, then log the results to the ValidMind Platform.\n",
-    "\n",
-    "We'll run some tests that are defined out-of-the-box by the template we previewed earlier in this notebook, as well as some additional tests for more evidence. For the example in this section, we've selected and defined the tests for you.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about navigating ValidMind tests?</b></span>\n",
-    "<br></br>\n",
-    "Refer to our notebook outlining the utilities available for viewing and understanding available ValidMind tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Enable custom context for test descriptions\n",
-    "\n",
-    "When you run ValidMind tests, test descriptions are automatically generated with LLM using the test results, the test name, and the static test definitions provided in the test’s docstring. While this metadata offers valuable high-level overviews of tests, insights produced by the LLM-based descriptions may not always align with your specific use cases or incorporate organizational policy requirements.\n",
-    "\n",
-    "Before we run our tests, we'll include some custom use case context to improve the clarity, structure, and interpretability of the test descriptions returned. By default, custom context for LLM-generated descriptions is disabled, meaning that the output will not include any additional context. To enable custom use case context, set the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED` environment variable to `1`.\n",
-    "\n",
-    "This is a global setting that will affect all tests for your linked model:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import os\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\"\n",
-    "\n",
-    "context = \"\"\"\n",
-    "FORMAT FOR THE LLM DESCRIPTIONS: \n",
-    "    **<Test Name>** is designed to <begin with a concise overview of what the test does and its primary purpose, \n",
-    "    extracted from the test description>.\n",
-    "\n",
-    "    The test operates by <write a paragraph about the test mechanism, explaining how it works and what it measures. \n",
-    "    Include any relevant formulas or methodologies mentioned in the test description.>\n",
-    "\n",
-    "    The primary advantages of this test include <write a paragraph about the test's strengths and capabilities, \n",
-    "    highlighting what makes it particularly useful for specific scenarios.>\n",
-    "\n",
-    "    Users should be aware that <write a paragraph about the test's limitations and potential risks. \n",
-    "    Include both technical limitations and interpretation challenges. \n",
-    "    If the test description includes specific signs of high risk, incorporate these here.>\n",
-    "\n",
-    "    **Key Insights:**\n",
-    "\n",
-    "    The test results reveal:\n",
-    "\n",
-    "    - **<insight title>**: <comprehensive description of one aspect of the results>\n",
-    "    - **<insight title>**: <comprehensive description of another aspect>\n",
-    "    ...\n",
-    "\n",
-    "    Based on these results, <conclude with a brief paragraph that ties together the test results with the test's \n",
-    "    purpose and provides any final recommendations or considerations.>\n",
-    "\n",
-    "ADDITIONAL INSTRUCTIONS:\n",
-    "    Present insights in order from general to specific, with each insight as a single bullet point with bold title.\n",
-    "\n",
-    "    For each metric in the test results, include in the test overview:\n",
-    "    - The metric's purpose and what it measures\n",
-    "    - Its mathematical formula\n",
-    "    - The range of possible values\n",
-    "    - What constitutes good/bad performance\n",
-    "    - How to interpret different values\n",
-    "\n",
-    "    Each insight should progressively cover:\n",
-    "    1. Overall scope and distribution\n",
-    "    2. Complete breakdown of all elements with specific values\n",
-    "    3. Natural groupings and patterns\n",
-    "    4. Comparative analysis between datasets/categories\n",
-    "    5. Stability and variations\n",
-    "    6. Notable relationships or dependencies\n",
-    "\n",
-    "    Remember:\n",
-    "    - Keep all insights at the same level (no sub-bullets or nested structures)\n",
-    "    - Make each insight complete and self-contained\n",
-    "    - Include specific numerical values and ranges\n",
-    "    - Cover all elements in the results comprehensively\n",
-    "    - Maintain clear, concise language\n",
-    "    - Use only \"- **Title**: Description\" format for insights\n",
-    "    - Progress naturally from general to specific observations\n",
-    "\n",
-    "\"\"\".strip()\n",
-    "\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT\"] = context"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Define tests to run\n",
-    "\n",
-    "First, we'll specify all the tests we'd like to independently run in a dictionary called `test_config`, including information about the `params` and `inputs` that each test requires.\n",
-    "\n",
-    "-  Note here that `inputs` and `input_grid` expect the `input_id` of the dataset or model as the value rather than the variable name we specified**.\n",
-    "- When running individual tests, you can use a custom `result_id` to tag the individual result with a unique identifier by appending this `result_id` to the `test_id` with a `:` separator. (Example: `:raw_data` for tests run with our raw dataset.)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test_config = {\n",
-    "\n",
-    "    # Data validation tests run with raw dataset\n",
-    "    'validmind.data_validation.DatasetDescription:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.DescriptiveStatistics:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.MissingValues:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percentage_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.ClassImbalance:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percent_threshold': 10}\n",
-    "    },\n",
-    "    'validmind.data_validation.Duplicates:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.HighCardinality:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {\n",
-    "            'num_threshold': 100,\n",
-    "            'percent_threshold': 0.1,\n",
-    "            'threshold_type': 'percent'\n",
-    "        }\n",
-    "    },\n",
-    "    'validmind.data_validation.Skewness:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'max_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.UniqueRows:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percent_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TooManyZeroValues:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'max_percent_threshold': 0.03}\n",
-    "    },\n",
-    "    'validmind.data_validation.IQROutliersTable:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'threshold': 5}\n",
-    "    },\n",
-    "\n",
-    "    # Data validation tests run with preprocessed dataset\n",
-    "    'validmind.data_validation.DescriptiveStatistics:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularDescriptionTables:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.MissingValues:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'},\n",
-    "        'params': {'min_percentage_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularNumericalHistograms:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularCategoricalBarPlots:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TargetRateBarPlots:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'},\n",
-    "        'params': {'default_column': 'loan_status'}\n",
-    "    },\n",
-    "\n",
-    "    'validmind.data_validation.WOEBinTable': {\n",
-    "        'input_grid': {'dataset': ['preprocess_dataset']},\n",
-    "        'params': {\n",
-    "            'breaks_adj': {\n",
-    "                'loan_amnt': [5000, 10000, 15000, 20000, 25000],\n",
-    "                'int_rate': [10, 15, 20],\n",
-    "                'annual_inc': [50000, 100000, 150000]\n",
-    "            }\n",
-    "        }\n",
-    "    },\n",
-    "    'validmind.data_validation.WOEBinPlots': {\n",
-    "        'input_grid': {'dataset': ['preprocess_dataset']},\n",
-    "        'params': {\n",
-    "            'breaks_adj': {\n",
-    "                'loan_amnt': [5000, 10000, 15000, 20000, 25000],\n",
-    "                'int_rate': [10, 15, 20],\n",
-    "                'annual_inc': [50000, 100000, 150000]\n",
-    "            }\n",
-    "        }\n",
-    "    },\n",
-    "\n",
-    "    # Data validation tests run with training & testing datasets\n",
-    "    'validmind.data_validation.DescriptiveStatistics:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularDescriptionTables:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
-    "    },\n",
-    "    'validmind.data_validation.ClassImbalance:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
-    "        'params': {'min_percent_threshold': 10}\n",
-    "    },\n",
-    "    'validmind.data_validation.UniqueRows:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
-    "        'params': {'min_percent_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularNumericalHistograms:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
-    "    },\n",
-    "    'validmind.data_validation.MutualInformation:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
-    "        'params': {'min_threshold': 0.01}\n",
-    "    },\n",
-    "    'validmind.data_validation.PearsonCorrelationMatrix:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
-    "    },\n",
-    "    'validmind.data_validation.HighPearsonCorrelation:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
-    "        'params': {'max_threshold': 0.3, 'top_n_correlations': 10}\n",
-    "    },\n",
-    "    'validmind.data_validation.ScoreBandDefaultRates:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset'], 'model': ['xgb_model']},\n",
-    "        'params': {'score_column': 'xgb_scores', 'score_bands': [504, 537, 570]}\n",
-    "    },\n",
-    "    'validmind.data_validation.DatasetSplit:development_data': {\n",
-    "        'inputs': {'datasets': ['train_dataset', 'test_dataset']}\n",
-    "    },\n",
-    "\n",
-    "    # Model validation tests\n",
-    "    'validmind.model_validation.statsmodels.GINITable': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ClassifierPerformance': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.TrainingTestDegradation:XGBoost': {\n",
-    "        'inputs': {\n",
-    "            'datasets': ['train_dataset', 'test_dataset'],\n",
-    "            'model': 'xgb_model'\n",
-    "        },\n",
-    "        'params': {'max_threshold': 0.1}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ROCCurve': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.MinimumROCAUCScore': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']},\n",
-    "        'params': {'min_threshold': 0.5}\n",
-    "    },\n",
-    "    'validmind.model_validation.statsmodels.PredictionProbabilitiesHistogram': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.statsmodels.CumulativePredictionProbabilities': {\n",
-    "        'input_grid': {'model': ['xgb_model'], 'dataset': ['train_dataset', 'test_dataset']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.PopulationStabilityIndex': {\n",
-    "        'inputs': {\n",
-    "            'datasets': ['train_dataset', 'test_dataset'],\n",
-    "            'model': 'xgb_model'\n",
-    "        },\n",
-    "        'params': {'num_bins': 10, 'mode': 'fixed'}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ConfusionMatrix': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.MinimumAccuracy': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']},\n",
-    "        'params': {'min_threshold': 0.7}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.MinimumF1Score': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']},\n",
-    "        'params': {'min_threshold': 0.5}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.PrecisionRecallCurve': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.CalibrationCurve': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ClassifierThresholdOptimization': {\n",
-    "        'inputs': {'dataset': 'train_dataset', 'model': 'xgb_model'},\n",
-    "        'params': {'target_recall': 0.8}\n",
-    "    },\n",
-    "    'validmind.model_validation.statsmodels.ScorecardHistogram': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
-    "        'params': {'score_column': 'xgb_scores'}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ScoreProbabilityAlignment': {\n",
-    "        'input_grid': {'dataset': ['train_dataset'], 'model': ['xgb_model']},\n",
-    "        'params': {'score_column': 'xgb_scores'}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.WeakspotsDiagnosis': {\n",
-    "        'inputs': {'datasets': ['train_dataset', 'test_dataset'], 'model': 'xgb_model'}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.OverfitDiagnosis': {\n",
-    "        'inputs': {'model': 'xgb_model', 'datasets': ['train_dataset', 'test_dataset']},\n",
-    "        'params': {'cut_off_threshold': 0.04}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.RobustnessDiagnosis': {\n",
-    "        'inputs': {'datasets': ['train_dataset', 'test_dataset'], 'model': 'xgb_model'},\n",
-    "        'params': {\n",
-    "            'scaling_factor_std_dev_list': [0.1, 0.2, 0.3, 0.4, 0.5],\n",
-    "            'performance_decay_threshold': 0.05\n",
-    "        }\n",
-    "    },\n",
-    "    'validmind.model_validation.FeaturesAUC': {\n",
-    "        'input_grid': {'model': ['xgb_model'], 'dataset': ['train_dataset', 'test_dataset']}\n",
-    "    }\n",
-    "}"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3__'></a>\n",
-    "\n",
-    "### Run defined tests\n",
-    "\n",
-    "Then, we'll define a utility wrapper around [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module in a function called `run_doc_tests`.\n",
-    "\n",
-    "- Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform.\n",
-    "- Our function requires information about the inputs to use on every test — which is why we specified these inputs above in `test_config`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def run_doc_tests(test_config):\n",
-    "    for test_name, test_cfg in test_config.items():\n",
-    "        print(test_name)\n",
-    "        try:\n",
-    "            # Collect available keyword arguments\n",
-    "            kwargs = {\n",
-    "                key: test_cfg[key]\n",
-    "                for key in (\"params\", \"input_grid\", \"inputs\")\n",
-    "                if key in test_cfg\n",
-    "            }\n",
-    "            kwargs[\"show\"] = False\n",
-    "\n",
-    "            # Execute the test and log the results\n",
-    "            vm.tests.run_test(test_name, **kwargs).log()\n",
-    "\n",
-    "        except Exception as e:\n",
-    "            print(f\"Error running test {test_name}: {e}\")\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Finally, we can pass the input configuration to `run_doc_tests` and run the full suite of tests!\n",
-    "\n",
-    "The variable `full_suite` then holds the result of these tests:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = run_doc_tests(test_config)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the outputs returned indicating that certain test-driven blocks don't currently exist in your model's documentation for this particular test ID. </b></span>\n",
-    "<br></br>\n",
-    "That's expected, as when we run individual tests not defined by the documentation template out-of-the-box, the results logged need to be manually added to your documentation within the ValidMind Platform.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way, use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc7_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "   What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready.\n",
-    "\n",
-    "3. Expand the following section to review tests automatically inserted into your documentation template: **2.3. Feature Selection and Engineering**\n",
-    "\n",
-    "<a id='toc7_1_1__'></a>\n",
-    "\n",
-    "#### Add individual test results to documentation\n",
-    "\n",
-    "Let's also add our additional test results into the documentation. These were results sent by individual tests not defined out-of-the-box by our template. For example ([Need more help?](https://docs.validmind.ai/developer/model-documentation/work-with-test-results.html)):\n",
-    "\n",
-    "1. Locate the Data Preparation section of your documentation and click on **2.2. Correlations and Interactions** to expand that section.\n",
-    "\n",
-    "4. Hover under the Pearson Correlation Matrix content block until a horizontal dashed line with a **+** button appears, indicating that you can insert a new block.\n",
-    "\n",
-    "    <img src= \"../../tutorials/model_development/add-content-block.gif\" alt=\"Screenshot showing insert block button in model documentation\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
-    "    <br><br>\n",
-    "\n",
-    "5. Click **+** and then select **Test-Driven Block** under FROM LIBRARY:\n",
-    "\n",
-    "    - Click on **VM Library** under TEST-DRIVEN in the left sidebar.\n",
-    "    - In the search bar, type in `HighPearsonCorrelation`.\n",
-    "    - Select `HighPearsonCorrelation:development_data` as the test.\n",
-    "\n",
-    "6. Finally, click **Insert 1 Test Result to Document** to add the test result to the documentation.\n",
-    "\n",
-    "    Confirm that the individual results for the high correlation test has been correctly inserted into section **2.3. Correlations and Interactions** of the documentation.\n",
-    "\n",
-    "<a id='toc7_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-d5682d445de64cada526101fd53872e2",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 4
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Document an Excel-based application scorecard model\n",
+        "\n",
+        "Build and document an Excel-based application scorecard model with the ValidMind Library. Learn how to load an Excel-based model, prepare your datasets and model for testing, run tests and log those test results to the ValidMind Platform.\n",
+        "\n",
+        "An *application scorecard model* is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant such as credit history, income, employment status, and other relevant financial data.\n",
+        "\n",
+        " - This score assists lenders in making informed decisions about whether to approve or reject loan applications, as well as in determining the terms of the loan, including interest rates and credit limits.\n",
+        " - Effective validation of application scorecard models ensures that lenders can manage risk efficiently while maintaining a fast and transparent loan application process for applicants."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_4__)    \n",
+        "- [Loading the sample datasets](#toc3__)    \n",
+        "  - [Load the raw dataset](#toc3_1__)    \n",
+        "  - [Load the preprocessed dataset](#toc3_2__)    \n",
+        "  - [Load the training and test datasets](#toc3_3__)    \n",
+        "- [Initialize the ValidMind datasets](#toc4__)    \n",
+        "- [Initialize the ValidMind model](#toc5__)    \n",
+        "  - [Link predictions](#toc5_1__)    \n",
+        "- [Running tests](#toc6__)    \n",
+        "  - [Enable custom context for test descriptions](#toc6_1__)    \n",
+        "  - [Define tests to run](#toc6_2__)    \n",
+        "  - [Run defined tests](#toc6_3__)    \n",
+        "- [Next steps](#toc7__)    \n",
+        "  - [Work with your documentation](#toc7_1__)    \n",
+        "    - [Add individual test results to documentation](#toc7_1_1__)    \n",
+        "  - [Discover more learning resources](#toc7_2__)    \n",
+        "- [Upgrade ValidMind](#toc8__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language.\n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2); border-radius: 5px;\">\n",
+        "  <span style=\"color: #083E44;\"><b>Recommended Python versions</b></span><br />\n",
+        "  Python 3.8 ≤ x ≤ 3.11\n",
+        "</div>\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Credit Risk Scorecard`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Then, let's import the necessary libraries and set up your Python environment for data analysis:\n",
+        "\n",
+        "- Install **OpenPyXL** (openpyxl), which will allow us to read and write `.xlsx` files.\n",
+        "- Import `pandas`, a Python library for data manipulation and analytics, under the alias `pd`.\n",
+        "- Enable `matplotlib`, a plotting library used for visualizing data. This ensures that any plots you generate will render inline in our notebook output rather than opening in a separate window."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install openpyxl\n",
+        "\n",
+        "import pandas as pd\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Loading the sample datasets\n",
+        "\n",
+        "Let's import our sample dataset in the form of an Excel workbook ([CreditRiskData.xlsx](CreditRiskData.xlsx)) with four sheets indexed 0 to 3, each representing a different stage of data preparation:\n",
+        "\n",
+        "0. **Raw Data** – The original unprocessed dataset.\n",
+        "1. **Preprocessed Data** – A cleaned and prepared version of the raw data.\n",
+        "2. **Train Data** – A training subset used to fit your model.\n",
+        "3. **Test Data** – A testing subset used to evaluate model performance."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Load the raw dataset\n",
+        "\n",
+        "We'll start by loading the **Raw Data** sheet (index `0`) into a [Pandas DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "df = pd.read_excel('CreditRiskData.xlsx', sheet_name=0,engine='openpyxl')\n",
+        "\n",
+        "df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Load the preprocessed dataset\n",
+        "\n",
+        "Next, load the **Preprocessed Data** sheet (index `1`), containing cleaned inputs ready for scoring:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "preprocess_df = pd.read_excel('CreditRiskData.xlsx', sheet_name=1,engine='openpyxl')\n",
+        "preprocess_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3__'></a>\n",
+        "\n",
+        "### Load the training and test datasets\n",
+        "\n",
+        "Finally, load the split training (**Train Data**, index `2`) and testing (**Test Data**, index `3`) sets:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_df = pd.read_excel('CreditRiskData.xlsx', sheet_name=2,engine='openpyxl')\n",
+        "test_df = pd.read_excel('CreditRiskData.xlsx', sheet_name=3,engine='openpyxl')"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests with your loaded datasets, you must first initialize a ValidMind `Dataset` object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
+        "\n",
+        "For this example, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`dataset`:** The input DataFrame to test.\n",
+        "- **`input_id`:** A unique identifier for tracking test inputs.\n",
+        "- **`target_column`:** Required for tests that compare predictions to actual outcomes; specify the name of the column with the true values."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Initialize the raw dataset\n",
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column='loan_status',\n",
+        ")\n",
+        "\n",
+        "# Initialize the preprocessed dataset\n",
+        "vm_preprocess_dataset = vm.init_dataset(\n",
+        "    dataset=preprocess_df,\n",
+        "    input_id=\"preprocess_dataset\",\n",
+        "    target_column='loan_status',\n",
+        ")\n",
+        "\n",
+        "# Initialize the training dataset\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column='loan_status',\n",
+        ")\n",
+        "\n",
+        "# Initialize the testing dataset\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    input_id=\"test_dataset\",\n",
+        "    target_column='loan_status',\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Initialize the ValidMind model\n",
+        "\n",
+        "In this Excel-based use case, predictions are precomputed and included in the Excel file. While there's no model logic to run, a ValidMind model object (`vm_model`) is still required for passing to other functions for analysis and tests on the data.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Prediction logic placeholder\n",
+        "def dummy(X, **kwargs):\n",
+        "    return None\n",
+        "\n",
+        "xgb_model = vm.init_model(\n",
+        "        input_id=\"xgb_model\",\n",
+        "        predict_fn=dummy\n",
+        "    )"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Link predictions\n",
+        "\n",
+        "Once the model has been registered, you can assign model predictions to the training and testing datasets.\n",
+        "\n",
+        "Use the [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#assign_predictions) from the `Dataset` object to link the prediction values and probabilities from the relevant columns on our Excel spreadsheet to the training and testing datasets:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(model=xgb_model, prediction_column=\"xgb_model_prediction\",probability_column='xgb_model_probabilities')\n",
+        "vm_test_ds.assign_predictions(model=xgb_model, prediction_column=\"xgb_model_prediction\",probability_column='xgb_model_probabilities')"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Running tests\n",
+        "\n",
+        "This is where it all comes together — we'll use our previously initialized datasets as inputs to run tests, then log the results to the ValidMind Platform.\n",
+        "\n",
+        "We'll run some tests that are defined out-of-the-box by the template we previewed earlier in this notebook, as well as some additional tests for more evidence. For the example in this section, we've selected and defined the tests for you.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about navigating ValidMind tests?</b></span>\n",
+        "<br></br>\n",
+        "Refer to our notebook outlining the utilities available for viewing and understanding available ValidMind tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Enable custom context for test descriptions\n",
+        "\n",
+        "When you run ValidMind tests, test descriptions are automatically generated by an LLM using the test results, the test name, and the static test definitions provided in the test’s docstring. While this metadata offers valuable high-level overviews of tests, insights produced by the LLM-based descriptions may not always align with your specific use cases or incorporate organizational policy requirements.\n",
+        "\n",
+        "Before we run our tests, we'll include some custom use case context to improve the clarity, structure, and interpretability of the test descriptions returned. By default, custom context for LLM-generated descriptions is disabled, meaning that the output will not include any additional context. To enable custom use case context, set the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED` environment variable to `1`.\n",
+        "\n",
+        "This is a global setting that will affect all tests for your linked model:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import os\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\"\n",
+        "\n",
+        "context = \"\"\"\n",
+        "FORMAT FOR THE LLM DESCRIPTIONS: \n",
+        "    **<Test Name>** is designed to <begin with a concise overview of what the test does and its primary purpose, \n",
+        "    extracted from the test description>.\n",
+        "\n",
+        "    The test operates by <write a paragraph about the test mechanism, explaining how it works and what it measures. \n",
+        "    Include any relevant formulas or methodologies mentioned in the test description.>\n",
+        "\n",
+        "    The primary advantages of this test include <write a paragraph about the test's strengths and capabilities, \n",
+        "    highlighting what makes it particularly useful for specific scenarios.>\n",
+        "\n",
+        "    Users should be aware that <write a paragraph about the test's limitations and potential risks. \n",
+        "    Include both technical limitations and interpretation challenges. \n",
+        "    If the test description includes specific signs of high risk, incorporate these here.>\n",
+        "\n",
+        "    **Key Insights:**\n",
+        "\n",
+        "    The test results reveal:\n",
+        "\n",
+        "    - **<insight title>**: <comprehensive description of one aspect of the results>\n",
+        "    - **<insight title>**: <comprehensive description of another aspect>\n",
+        "    ...\n",
+        "\n",
+        "    Based on these results, <conclude with a brief paragraph that ties together the test results with the test's \n",
+        "    purpose and provides any final recommendations or considerations.>\n",
+        "\n",
+        "ADDITIONAL INSTRUCTIONS:\n",
+        "    Present insights in order from general to specific, with each insight as a single bullet point with bold title.\n",
+        "\n",
+        "    For each metric in the test results, include in the test overview:\n",
+        "    - The metric's purpose and what it measures\n",
+        "    - Its mathematical formula\n",
+        "    - The range of possible values\n",
+        "    - What constitutes good/bad performance\n",
+        "    - How to interpret different values\n",
+        "\n",
+        "    Each insight should progressively cover:\n",
+        "    1. Overall scope and distribution\n",
+        "    2. Complete breakdown of all elements with specific values\n",
+        "    3. Natural groupings and patterns\n",
+        "    4. Comparative analysis between datasets/categories\n",
+        "    5. Stability and variations\n",
+        "    6. Notable relationships or dependencies\n",
+        "\n",
+        "    Remember:\n",
+        "    - Keep all insights at the same level (no sub-bullets or nested structures)\n",
+        "    - Make each insight complete and self-contained\n",
+        "    - Include specific numerical values and ranges\n",
+        "    - Cover all elements in the results comprehensively\n",
+        "    - Maintain clear, concise language\n",
+        "    - Use only \"- **Title**: Description\" format for insights\n",
+        "    - Progress naturally from general to specific observations\n",
+        "\n",
+        "\"\"\".strip()\n",
+        "\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT\"] = context"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Define tests to run\n",
+        "\n",
+        "First, we'll specify all the tests we'd like to independently run in a dictionary called `test_config`, including information about the `params` and `inputs` that each test requires.\n",
+        "\n",
+        "- **Note here that `inputs` and `input_grid` expect the `input_id` of the dataset or model as the value rather than the variable name we specified.**\n",
+        "- When running individual tests, you can use a custom `result_id` to tag the individual result with a unique identifier by appending this `result_id` to the `test_id` with a `:` separator. (Example: `:raw_data` for tests run with our raw dataset.)"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test_config = {\n",
+        "\n",
+        "    # Data validation tests run with raw dataset\n",
+        "    'validmind.data_validation.DatasetDescription:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.DescriptiveStatistics:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.MissingValues:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percentage_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.ClassImbalance:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percent_threshold': 10}\n",
+        "    },\n",
+        "    'validmind.data_validation.Duplicates:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.HighCardinality:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {\n",
+        "            'num_threshold': 100,\n",
+        "            'percent_threshold': 0.1,\n",
+        "            'threshold_type': 'percent'\n",
+        "        }\n",
+        "    },\n",
+        "    'validmind.data_validation.Skewness:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'max_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.UniqueRows:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percent_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TooManyZeroValues:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'max_percent_threshold': 0.03}\n",
+        "    },\n",
+        "    'validmind.data_validation.IQROutliersTable:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'threshold': 5}\n",
+        "    },\n",
+        "\n",
+        "    # Data validation tests run with preprocessed dataset\n",
+        "    'validmind.data_validation.DescriptiveStatistics:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularDescriptionTables:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.MissingValues:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'},\n",
+        "        'params': {'min_percentage_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularNumericalHistograms:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularCategoricalBarPlots:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TargetRateBarPlots:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'},\n",
+        "        'params': {'default_column': 'loan_status'}\n",
+        "    },\n",
+        "\n",
+        "    'validmind.data_validation.WOEBinTable': {\n",
+        "        'input_grid': {'dataset': ['preprocess_dataset']},\n",
+        "        'params': {\n",
+        "            'breaks_adj': {\n",
+        "                'loan_amnt': [5000, 10000, 15000, 20000, 25000],\n",
+        "                'int_rate': [10, 15, 20],\n",
+        "                'annual_inc': [50000, 100000, 150000]\n",
+        "            }\n",
+        "        }\n",
+        "    },\n",
+        "    'validmind.data_validation.WOEBinPlots': {\n",
+        "        'input_grid': {'dataset': ['preprocess_dataset']},\n",
+        "        'params': {\n",
+        "            'breaks_adj': {\n",
+        "                'loan_amnt': [5000, 10000, 15000, 20000, 25000],\n",
+        "                'int_rate': [10, 15, 20],\n",
+        "                'annual_inc': [50000, 100000, 150000]\n",
+        "            }\n",
+        "        }\n",
+        "    },\n",
+        "\n",
+        "    # Data validation tests run with training & testing datasets\n",
+        "    'validmind.data_validation.DescriptiveStatistics:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularDescriptionTables:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
+        "    },\n",
+        "    'validmind.data_validation.ClassImbalance:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
+        "        'params': {'min_percent_threshold': 10}\n",
+        "    },\n",
+        "    'validmind.data_validation.UniqueRows:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
+        "        'params': {'min_percent_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularNumericalHistograms:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
+        "    },\n",
+        "    'validmind.data_validation.MutualInformation:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
+        "        'params': {'min_threshold': 0.01}\n",
+        "    },\n",
+        "    'validmind.data_validation.PearsonCorrelationMatrix:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
+        "    },\n",
+        "    'validmind.data_validation.HighPearsonCorrelation:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
+        "        'params': {'max_threshold': 0.3, 'top_n_correlations': 10}\n",
+        "    },\n",
+        "    'validmind.data_validation.ScoreBandDefaultRates:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset'], 'model': ['xgb_model']},\n",
+        "        'params': {'score_column': 'xgb_scores', 'score_bands': [504, 537, 570]}\n",
+        "    },\n",
+        "    'validmind.data_validation.DatasetSplit:development_data': {\n",
+        "        'inputs': {'datasets': ['train_dataset', 'test_dataset']}\n",
+        "    },\n",
+        "\n",
+        "    # Model validation tests\n",
+        "    'validmind.model_validation.statsmodels.GINITable': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ClassifierPerformance': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.TrainingTestDegradation:XGBoost': {\n",
+        "        'inputs': {\n",
+        "            'datasets': ['train_dataset', 'test_dataset'],\n",
+        "            'model': 'xgb_model'\n",
+        "        },\n",
+        "        'params': {'max_threshold': 0.1}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ROCCurve': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.MinimumROCAUCScore': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']},\n",
+        "        'params': {'min_threshold': 0.5}\n",
+        "    },\n",
+        "    'validmind.model_validation.statsmodels.PredictionProbabilitiesHistogram': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.statsmodels.CumulativePredictionProbabilities': {\n",
+        "        'input_grid': {'model': ['xgb_model'], 'dataset': ['train_dataset', 'test_dataset']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.PopulationStabilityIndex': {\n",
+        "        'inputs': {\n",
+        "            'datasets': ['train_dataset', 'test_dataset'],\n",
+        "            'model': 'xgb_model'\n",
+        "        },\n",
+        "        'params': {'num_bins': 10, 'mode': 'fixed'}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ConfusionMatrix': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.MinimumAccuracy': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']},\n",
+        "        'params': {'min_threshold': 0.7}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.MinimumF1Score': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']},\n",
+        "        'params': {'min_threshold': 0.5}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.PrecisionRecallCurve': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.CalibrationCurve': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ClassifierThresholdOptimization': {\n",
+        "        'inputs': {'dataset': 'train_dataset', 'model': 'xgb_model'},\n",
+        "        'params': {'target_recall': 0.8}\n",
+        "    },\n",
+        "    'validmind.model_validation.statsmodels.ScorecardHistogram': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
+        "        'params': {'score_column': 'xgb_scores'}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ScoreProbabilityAlignment': {\n",
+        "        'input_grid': {'dataset': ['train_dataset'], 'model': ['xgb_model']},\n",
+        "        'params': {'score_column': 'xgb_scores'}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.WeakspotsDiagnosis': {\n",
+        "        'inputs': {'datasets': ['train_dataset', 'test_dataset'], 'model': 'xgb_model'}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.OverfitDiagnosis': {\n",
+        "        'inputs': {'model': 'xgb_model', 'datasets': ['train_dataset', 'test_dataset']},\n",
+        "        'params': {'cut_off_threshold': 0.04}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.RobustnessDiagnosis': {\n",
+        "        'inputs': {'datasets': ['train_dataset', 'test_dataset'], 'model': 'xgb_model'},\n",
+        "        'params': {\n",
+        "            'scaling_factor_std_dev_list': [0.1, 0.2, 0.3, 0.4, 0.5],\n",
+        "            'performance_decay_threshold': 0.05\n",
+        "        }\n",
+        "    },\n",
+        "    'validmind.model_validation.FeaturesAUC': {\n",
+        "        'input_grid': {'model': ['xgb_model'], 'dataset': ['train_dataset', 'test_dataset']}\n",
+        "    }\n",
+        "}"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_3__'></a>\n",
+        "\n",
+        "### Run defined tests\n",
+        "\n",
+        "Then, we'll define a utility wrapper around [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module in a function called `run_doc_tests`.\n",
+        "\n",
+        "- Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform.\n",
+        "- Our function requires information about the inputs to use on every test — which is why we specified these inputs above in `test_config`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def run_doc_tests(test_config):\n",
+        "    for test_name, test_cfg in test_config.items():\n",
+        "        print(test_name)\n",
+        "        try:\n",
+        "            # Collect available keyword arguments\n",
+        "            kwargs = {\n",
+        "                key: test_cfg[key]\n",
+        "                for key in (\"params\", \"input_grid\", \"inputs\")\n",
+        "                if key in test_cfg\n",
+        "            }\n",
+        "            kwargs[\"show\"] = False\n",
+        "\n",
+        "            # Execute the test and log the results\n",
+        "            vm.tests.run_test(test_name, **kwargs).log()\n",
+        "\n",
+        "        except Exception as e:\n",
+        "            print(f\"Error running test {test_name}: {e}\")\n"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Finally, we can pass the input configuration to `run_doc_tests` and run the full suite of tests!\n",
+        "\n",
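+        "Each test result is logged to the ValidMind Platform as it runs. Note that `run_doc_tests` has no `return` statement, so the variable `full_suite` is `None` rather than a collection of results:"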
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "full_suite = run_doc_tests(test_config)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the outputs returned indicating that certain test-driven blocks don't currently exist in your documentation for this particular test ID. </b></span>\n",
+        "<br></br>\n",
+        "That's expected, as when we run individual tests not defined by the documentation template out-of-the-box, the results logged need to be manually added to your documentation within the ValidMind Platform.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way: use the ValidMind Platform to work with your documentation.\n",
+        "\n",
+        "<a id='toc7_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "   What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready.\n",
+        "\n",
+        "3. Expand the following section to review tests automatically inserted into your documentation template: **2.3. Feature Selection and Engineering**\n",
+        "\n",
+        "<a id='toc7_1_1__'></a>\n",
+        "\n",
+        "#### Add individual test results to documentation\n",
+        "\n",
+        "Let's also add our additional test results into the documentation. These were results sent by individual tests not defined out-of-the-box by our template. For example (**Learn more:** [Work with test results](https://docs.validmind.ai/guide/documentation/work-with-test-results.html)):\n",
+        "\n",
+        "1. Locate the Data Preparation section of your documentation and click on **2.2. Correlations and Interactions** to expand that section.\n",
+        "\n",
+        "2. Hover under the Pearson Correlation Matrix content block until a horizontal dashed line with a **+** button appears, indicating that you can insert a new block.\n",
+        "\n",
+        "    <img src= \"../../tutorials/development/add-content-block.gif\" alt=\"Screenshot showing insert block button in model documentation\" style=\"border: 2px solid #083E44; border-radius: 8px; border-right-width: 2px; border-bottom-width: 3px;\">\n",
+        "    <br><br>\n",
+        "\n",
+        "3. Click **+** and then select **Test-Driven Block** under FROM LIBRARY:\n",
+        "\n",
+        "    - Click on **VM Library** under TEST-DRIVEN in the left sidebar.\n",
+        "    - In the search bar, type in `HighPearsonCorrelation`.\n",
+        "    - Select `HighPearsonCorrelation:development_data` as the test.\n",
+        "\n",
+        "4. Finally, click **Insert 1 Test Result to Document** to add the test result to the documentation.\n",
+        "\n",
+        "    Confirm that the individual results for the high correlation test have been correctly inserted into section **2.2. Correlations and Interactions** of the documentation.\n",
+        "\n",
+        "<a id='toc7_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-9a4dd2ee254f496292698e9be3d8f799"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 4
 }
diff --git a/site/notebooks/use_cases/model_validation/validate_application_scorecard.ipynb b/site/notebooks/use_cases/model_validation/validate_application_scorecard.ipynb
deleted file mode 100644
index 7857d42e0a..0000000000
--- a/site/notebooks/use_cases/model_validation/validate_application_scorecard.ipynb
+++ /dev/null
@@ -1,1874 +0,0 @@
-{
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Validate an application scorecard model\n",
-    "\n",
-    "Learn how to independently assess an application scorecard model developed using the ValidMind Library as a validator. You'll evaluate the development of the model by conducting thorough testing and analysis, including the use of challenger models to benchmark performance.\n",
-    "\n",
-    "An *application scorecard model* is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant such as credit history, income, employment status, and other relevant financial data.\n",
-    "\n",
-    " - This score assists lenders in making informed decisions about whether to approve or reject loan applications, as well as in determining the terms of the loan, including interest rates and credit limits.\n",
-    " - Effective validation of application scorecard models ensures that lenders can manage risk efficiently while maintaining a fast and transparent loan application process for applicants.\n",
-    "\n",
-    "This interactive notebook provides a step-by-step guide for:\n",
-    "\n",
-    "- Verifying the data quality steps performed by the model development team\n",
-    "- Independently replicating the champion model's results and conducting additional tests to assess performance, stability, and robustness\n",
-    "- Setting up test inputs and challenger models for comparative analysis\n",
-    "- Running validation tests, analyzing results, and logging artifacts (findings) to ValidMind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Register a sample model](#toc2_1__)    \n",
-    "    - [Assign validator credentials](#toc2_1_1__)    \n",
-    "    - [Apply validation report template](#toc2_1_2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_2__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_3__)    \n",
-    "    - [Get your code snippet](#toc2_3_1__)    \n",
-    "  - [Importing the champion model](#toc2_4__)    \n",
-    "  - [Load the sample dataset](#toc2_5__)    \n",
-    "    - [Preprocess the dataset](#toc2_5_1__)    \n",
-    "    - [Apply feature engineering to the dataset](#toc2_5_2__)    \n",
-    "  - [Split the feature engineered dataset](#toc2_6__)    \n",
-    "- [Developing potential challenger models](#toc3__)    \n",
-    "  - [Train potential challenger models](#toc3_1__)    \n",
-    "    - [Random forest classification model](#toc3_1_1__)    \n",
-    "    - [Logistic regression model](#toc3_1_2__)    \n",
-    "  - [Extract predicted probabilities](#toc3_2__)    \n",
-    "    - [Compute binary predictions](#toc3_2_1__)    \n",
-    "- [Initializing the ValidMind objects](#toc4__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc4_1__)    \n",
-    "  - [Initialize the model objects](#toc4_2__)    \n",
-    "  - [Assign predictions](#toc4_3__)    \n",
-    "  - [Compute credit risk scores](#toc4_4__)    \n",
-    "- [Running data quality tests](#toc5__)    \n",
-    "  - [Identify relevant data quality tests](#toc5_1__)    \n",
-    "  - [Run and log an individual data quality test](#toc5_2__)    \n",
-    "  - [Log multiple data quality tests](#toc5_3__)    \n",
-    "  - [Run data quality comparison tests](#toc5_4__)    \n",
-    "- [Running performance tests](#toc6__)    \n",
-    "  - [Identify relevant performance tests](#toc6_1__)    \n",
-    "  - [Run and log an individual performance test](#toc6_2__)    \n",
-    "  - [Log multiple performance tests](#toc6_3__)    \n",
-    "  - [Evaluate performance of the champion model](#toc6_4__)    \n",
-    "  - [Evaluate performance of challenger models](#toc6_5__)    \n",
-    "    - [Enable custom context for test descriptions](#toc6_5_1__)    \n",
-    "    - [Run performance comparison tests](#toc6_5_2__)    \n",
-    "- [Adjust a ValidMind test](#toc7__)    \n",
-    "- [Run diagnostic tests](#toc8__)    \n",
-    "- [Run feature importance tests](#toc9__)    \n",
-    "- [Implement a custom test](#toc10__)    \n",
-    "- [Verify test runs](#toc11__)    \n",
-    "- [Next steps](#toc12__)    \n",
-    "  - [Work with your validation report](#toc12_1__)    \n",
-    "  - [Discover more learning resources](#toc12_2__)    \n",
-    "- [Upgrade ValidMind](#toc13__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate comparison and other validation tests, and then use the ValidMind Platform to submit compliance assessments of champion models via comprehensive validation reports. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model developers."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Validation report**: A comprehensive and structured assessment of a model’s development and performance, focusing on verifying its integrity, appropriateness, and alignment with its intended use. It includes analyses of model assumptions, data quality, performance metrics, outcomes of testing procedures, and risk considerations. The validation report supports transparency, regulatory compliance, and informed decision-making by documenting the validator’s independent review and conclusions.\n",
-    "\n",
-    "**Validation report template**: Serves as a standardized framework for conducting and documenting model validation activities. It outlines the required sections, recommended analyses, and expected validation tests, ensuring consistency and completeness across validation reports. The template helps guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Register a sample model\n",
-    "\n",
-    "In a usual model lifecycle, a champion model will have been independently registered in your model inventory and submitted to you for validation by your model development team as part of the effective challenge process. (**Learn more:** [Submit for approval](https://docs.validmind.ai/guide/model-documentation/submit-for-approval.html))\n",
-    "\n",
-    "For this notebook, we'll have you register a dummy model in the ValidMind Platform inventory and assign yourself as the validator to familiarize you with the ValidMind interface and circumvent the need for an existing model:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down — don’t worry, we’ll adjust these permissions next for validation.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1_1__'></a>\n",
-    "\n",
-    "#### Assign validator credentials\n",
-    "\n",
-    "In order to log tests as a validator instead of as a developer, on the model details page that appears after you've successfully registered your sample model:\n",
-    "\n",
-    "1. Remove yourself as a model owner: \n",
-    "\n",
-    "    - Click on the **OWNERS** tile.\n",
-    "    - Click the **x** next to your name to remove yourself from that model's role.\n",
-    "    - Click **Save** to apply your changes to that role.\n",
-    "\n",
-    "2. Remove yourself as a developer: \n",
-    "\n",
-    "    - Click on the **DEVELOPERS** tile.\n",
-    "    - Click the **x** next to your name to remove yourself from that model's role.\n",
-    "    - Click **Save** to apply your changes to that role.\n",
-    "\n",
-    "3. Add yourself as a validator: \n",
-    "\n",
-    "    - Click on the **VALIDATORS** tile.\n",
-    "    - Select your name from the drop-down menu.\n",
-    "    - Click **Save** to apply your changes to that role."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1_2__'></a>\n",
-    "\n",
-    "#### Apply validation report template\n",
-    "\n",
-    "Next, let's select a validation report template. A template predefines sections for your report and provides a general outline to follow, making the validation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Validation**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Generic Validation Report`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
-    "<br></br>\n",
-    "Python 3.8 <= x <= 3.14</div>\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3_1__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"validation-report\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Importing the champion model\n",
-    "\n",
-    "With the ValidMind Library set up and ready to go, let's go ahead and import the champion model submitted by the model development team in the format of a `.pkl` file: **[xgb_model_champion.pkl](xgb_model_champion.pkl)**"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost as xgb\n",
-    "\n",
-    "#Load the saved model\n",
-    "xgb_model = xgb.XGBClassifier()\n",
-    "xgb_model.load_model(\"xgb_model_champion.pkl\")\n",
-    "xgb_model"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Ensure that we have to appropriate order in feature names from Champion model and dataset\n",
-    "cols_when_model_builds = xgb_model.get_booster().feature_names"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_5__'></a>\n",
-    "\n",
-    "### Load the sample dataset\n",
-    "\n",
-    "Let's next import the public [Lending Club](https://www.kaggle.com/datasets/devanshi23/loan-data-2007-2014/data) dataset from Kaggle, which was used to develop the dummy champion model.\n",
-    "\n",
-    "- We'll use this dataset to review steps that should have been conducted during the initial development and documentation of the model to ensure that the model was built correctly.\n",
-    "- By independently performing steps such as preprocessing and feature engineering, we can confirm whether the model was built using appropriate and properly processed data.\n",
-    "\n",
-    "To be able to use the dataset, you'll need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.credit_risk import lending_club\n",
-    "\n",
-    "df = lending_club.load_data(source=\"offline\")\n",
-    "df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_5_1__'></a>\n",
-    "\n",
-    "#### Preprocess the dataset\n",
-    "\n",
-    "We'll first quickly preprocess the dataset for data quality testing purposes using `lending_club.preprocess`. This function performs the following operations:\n",
-    "\n",
-    "- Filters the dataset to include only loans for debt consolidation or credit card purposes\n",
-    "- Removes loans classified under the riskier grades \"F\" and \"G\"\n",
-    "- Excludes uncommon home ownership types and standardizes employment length and loan terms into numerical formats\n",
-    "- Discards unnecessary fields and any entries with missing information to maintain a clean and robust dataset for modeling"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "preprocess_df = lending_club.preprocess(df)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_5_2__'></a>\n",
-    "\n",
-    "#### Apply feature engineering to the dataset\n",
-    "\n",
-    "Feature engineering improves the dataset's structure to better match what our model expects, and ensures that the model performs optimally by leveraging additional insights from raw data.\n",
-    "\n",
-    "We'll apply the following transformations using the `ending_club.feature_engineering()` function to optimize the dataset for predictive modeling in our application scorecard:\n",
-    "\n",
-    "- **WoE encoding**: Converts both numerical and categorical features into Weight of Evidence (WoE) values. WoE is a statistical measure used in scorecard modeling that quantifies the relationship between a predictor variable and the binary target variable. It calculates the ratio of the distribution of good outcomes to the distribution of bad outcomes for each category or bin of a feature. This transformation helps to ensure that the features are predictive and consistent in their contribution to the model.\n",
-    "- **Integration of WoE bins**: Ensures that the WoE transformed values are integrated throughout the dataset, replacing the original feature values while excluding the target variable from this transformation. This transformation is used to maintain a consistent scale and impact of each variable within the model, which helps make the predictions more stable and accurate."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "fe_df = lending_club.feature_engineering(preprocess_df)\n",
-    "fe_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_6__'></a>\n",
-    "\n",
-    "### Split the feature engineered dataset\n",
-    "\n",
-    "With our dummy model imported and our independently preprocessed and feature engineered dataset ready to go, let's now **spilt our dataset into train and test** to start the validation testing process.\n",
-    "\n",
-    "Splitting our dataset into training and testing is essential for proper validation testing, as this helps assess how well the model generalizes to unseen data:\n",
-    "\n",
-    "- We begin by dividing our data, which is based on Weight of Evidence (WoE) features, into training and testing sets (`train_df`, `test_df`).\n",
-    "- With `lending_club.split`, we employ a simple random split, randomly allocating data points to each set to ensure a mix of examples in both."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Split the data\n",
-    "train_df, test_df = lending_club.split(fe_df, test_size=0.2)\n",
-    "\n",
-    "x_train = train_df.drop(lending_club.target_column, axis=1)\n",
-    "y_train = train_df[lending_club.target_column]\n",
-    "\n",
-    "x_test = test_df.drop(lending_club.target_column, axis=1)\n",
-    "y_test = test_df[lending_club.target_column]\n",
-    "\n",
-    "# Now let's apply the order of features from the champion model construction\n",
-    "x_train = x_train[cols_when_model_builds]\n",
-    "x_test = x_test[cols_when_model_builds]"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "cols_use = ['annual_inc_woe',\n",
-    " 'verification_status_woe',\n",
-    " 'emp_length_woe',\n",
-    " 'installment_woe',\n",
-    " 'term_woe',\n",
-    " 'home_ownership_woe',\n",
-    " 'purpose_woe',\n",
-    " 'open_acc_woe',\n",
-    " 'total_acc_woe',\n",
-    " 'int_rate_woe',\n",
-    " 'sub_grade_woe',\n",
-    " 'grade_woe','loan_status']\n",
-    "\n",
-    "\n",
-    "train_df = train_df[cols_use]\n",
-    "test_df = test_df[cols_use]\n",
-    "test_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Developing potential challenger models"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Train potential challenger models\n",
-    "\n",
-    "We're curious how alternate models compare to our champion model, so let's train two challenger models as basis for our testing.\n",
-    "\n",
-    "Our selected options below offer decreased complexity in terms of implementation — such as lessened manual preprocessing — which can reduce the amount of risk for implementation. However, model risk is not calculated in isolation from a single factor, but rather in consideration with trade-offs in predictive performance, ease of interpretability, and overall alignment with business objectives."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_1__'></a>\n",
-    "\n",
-    "#### Random forest classification model\n",
-    "\n",
-    "A *random forest classification model* is an ensemble machine learning algorithm that uses multiple decision trees to classify data. In ensemble learning, multiple models are combined to improve prediction accuracy and robustness.\n",
-    "\n",
-    "Random forest classification models generally have higher accuracy because they capture complex, non-linear relationships, but as a result they lack transparency in their predictions."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the Random Forest Classification model\n",
-    "from sklearn.ensemble import RandomForestClassifier\n",
-    "\n",
-    "# Create the model instance with 50 decision trees\n",
-    "rf_model = RandomForestClassifier(\n",
-    "    n_estimators=50,\n",
-    "    random_state=42,\n",
-    ")\n",
-    "\n",
-    "# Train the model\n",
-    "rf_model.fit(x_train, y_train)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1_2__'></a>\n",
-    "\n",
-    "#### Logistic regression model\n",
-    "\n",
-    "A *logistic regression model* is a statistical machine learning algorithm that uses a linear equation (straight-line relationship between variables) and the logistic function (or sigmoid function, which maps any real-valued number to a range between `0` and `1`) to classify data. In statistical modeling, a single equation is used to estimate the probability of an outcome based on input features.\n",
-    "\n",
-    "Logistic regression models are simple and interpretable because they provide clear probability estimates and feature coefficients (numerical value that represents the influence of a particular input feature on the model's prediction), but they may struggle with capturing complex, non-linear relationships in the data."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Import the Logistic Regression model\n",
-    "from sklearn.linear_model import LogisticRegression\n",
-    "\n",
-    "# Logistic Regression grid params\n",
-    "log_reg_params = {\n",
-    "    \"penalty\": [\"l1\", \"l2\"],\n",
-    "    \"C\": [0.001, 0.01, 0.1, 1, 10, 100, 1000],\n",
-    "    \"solver\": [\"liblinear\"],\n",
-    "}\n",
-    "\n",
-    "# Grid search for Logistic Regression\n",
-    "from sklearn.model_selection import GridSearchCV\n",
-    "\n",
-    "grid_log_reg = GridSearchCV(LogisticRegression(), log_reg_params)\n",
-    "grid_log_reg.fit(x_train, y_train)\n",
-    "\n",
-    "# Logistic Regression best estimator\n",
-    "log_reg = grid_log_reg.best_estimator_\n",
-    "log_reg"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Extract predicted probabilities\n",
-    "\n",
-    "With our challenger models trained, let's extract the predicted probabilities from our three models:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Champion — Application scorecard model\n",
-    "train_xgb_prob = xgb_model.predict_proba(x_train)[:, 1]\n",
-    "test_xgb_prob = xgb_model.predict_proba(x_test)[:, 1]\n",
-    "\n",
-    "# Challenger — Random forest classification model\n",
-    "train_rf_prob = rf_model.predict_proba(x_train)[:, 1]\n",
-    "test_rf_prob = rf_model.predict_proba(x_test)[:, 1]\n",
-    "\n",
-    "# Challenger — Logistic regression model\n",
-    "train_log_prob = log_reg.predict_proba(x_train)[:, 1]\n",
-    "test_log_prob = log_reg.predict_proba(x_test)[:, 1]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2_1__'></a>\n",
-    "\n",
-    "#### Compute binary predictions\n",
-    "\n",
-    "Next, we'll convert the probability predictions from our three models into binary predictions, based on a threshold of `0.3`:\n",
-    "\n",
-    "- If the probability is greater than `0.3`, the prediction becomes `1` (positive).\n",
-    "- Otherwise, it becomes `0` (negative)."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "cut_off_threshold = 0.3\n",
-    "\n",
-    "# Champion — Application scorecard model\n",
-    "train_xgb_binary_predictions = (train_xgb_prob > cut_off_threshold).astype(int)\n",
-    "test_xgb_binary_predictions = (test_xgb_prob > cut_off_threshold).astype(int)\n",
-    "\n",
-    "# Challenger — Random forest classification model\n",
-    "train_rf_binary_predictions = (train_rf_prob > cut_off_threshold).astype(int)\n",
-    "test_rf_binary_predictions = (test_rf_prob > cut_off_threshold).astype(int)\n",
-    "\n",
-    "# Challenger — Logistic regression model\n",
-    "train_log_binary_predictions = (train_log_prob > cut_off_threshold).astype(int)\n",
-    "test_log_binary_predictions = (test_log_prob > cut_off_threshold).astype(int)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Initializing the ValidMind objects"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you'll need to connect your data with a ValidMind `Dataset` object. **This step is always necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
-    "\n",
-    "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
-    "\n",
-    "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
-    "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the raw dataset\n",
-    "vm_raw_dataset = vm.init_dataset(\n",
-    "    dataset=df,\n",
-    "    input_id=\"raw_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "# Initialize the preprocessed dataset\n",
-    "vm_preprocess_dataset = vm.init_dataset(\n",
-    "    dataset=preprocess_df,\n",
-    "    input_id=\"preprocess_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "# Initialize the feature engineered dataset\n",
-    "vm_fe_dataset = vm.init_dataset(\n",
-    "    dataset=fe_df,\n",
-    "    input_id=\"fe_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "# Initialize the training dataset\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "# Initialize the test dataset\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    input_id=\"test_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "After initialization, you can pass the ValidMind `Dataset` objects `vm_raw_dataset`, `vm_preprocess_dataset`, `vm_fe_dataset`, `vm_train_ds`, and `vm_test_ds` into any ValidMind tests."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Initialize the model objects\n",
-    "\n",
-    "You'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our three models.\n",
-    "\n",
-    "You simply initialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Initialize the champion application scorecard model\n",
-    "vm_xgb_model = vm.init_model(\n",
-    "    xgb_model,\n",
-    "    input_id=\"xgb_model_developer_champion\",\n",
-    ")\n",
-    "\n",
-    "# Initialize the challenger random forest classification model\n",
-    "vm_rf_model = vm.init_model(\n",
-    "    rf_model,\n",
-    "    input_id=\"rf_model\",\n",
-    ")\n",
-    "\n",
-    "# Initialize the challenger logistic regression model\n",
-    "vm_log_model = vm.init_model(\n",
-    "    log_reg,\n",
-    "    input_id=\"log_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3__'></a>\n",
-    "\n",
-    "### Assign predictions\n",
-    "\n",
-    "With our models registered, we'll move on to assigning both the predictive probabilities coming directly from each model's predictions, and the binary prediction after applying the cutoff threshold described in the Compute binary predictions step above.\n",
-    "\n",
-    "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#VMDataset.assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
-    "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Champion — Application scorecard model\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_xgb_model,\n",
-    "    prediction_values=train_xgb_binary_predictions,\n",
-    "    prediction_probabilities=train_xgb_prob,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_xgb_model,\n",
-    "    prediction_values=test_xgb_binary_predictions,\n",
-    "    prediction_probabilities=test_xgb_prob,\n",
-    ")\n",
-    "\n",
-    "# Challenger — Random forest classification model\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_rf_model,\n",
-    "    prediction_values=train_rf_binary_predictions,\n",
-    "    prediction_probabilities=train_rf_prob,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_rf_model,\n",
-    "    prediction_values=test_rf_binary_predictions,\n",
-    "    prediction_probabilities=test_rf_prob,\n",
-    ")\n",
-    "\n",
-    "\n",
-    "# Challenger — Logistic regression model\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_log_model,\n",
-    "    prediction_values=train_log_binary_predictions,\n",
-    "    prediction_probabilities=train_log_prob,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_log_model,\n",
-    "    prediction_values=test_log_binary_predictions,\n",
-    "    prediction_probabilities=test_log_prob,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4__'></a>\n",
-    "\n",
-    "### Compute credit risk scores\n",
-    "\n",
-    "Finally, we'll translate model predictions into actionable scores using probability estimates generated by our trained model:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Compute the scores\n",
-    "train_xgb_scores = lending_club.compute_scores(train_xgb_prob)\n",
-    "test_xgb_scores = lending_club.compute_scores(test_xgb_prob)\n",
-    "train_rf_scores = lending_club.compute_scores(train_rf_prob)\n",
-    "test_rf_scores = lending_club.compute_scores(test_rf_prob)\n",
-    "train_log_scores = lending_club.compute_scores(train_log_prob)\n",
-    "test_log_scores = lending_club.compute_scores(test_log_prob)\n",
-    "\n",
-    "# Assign scores to the datasets\n",
-    "vm_train_ds.add_extra_column(\"xgb_scores\", train_xgb_scores)\n",
-    "vm_test_ds.add_extra_column(\"xgb_scores\", test_xgb_scores)\n",
-    "vm_train_ds.add_extra_column(\"rf_scores\", train_rf_scores)\n",
-    "vm_test_ds.add_extra_column(\"rf_scores\", test_rf_scores)\n",
-    "vm_train_ds.add_extra_column(\"log_scores\", train_log_scores)\n",
-    "vm_test_ds.add_extra_column(\"log_scores\", test_log_scores)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Running data quality tests\n",
-    "\n",
-    "With everything ready to go, let's explore some of ValidMind's available tests. Using ValidMind’s repository of tests streamlines your validation testing, and helps you ensure that your models are being validated appropriately."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Identify relevant data quality tests\n",
-    "\n",
-    "We want to narrow down the tests we want to run from the selection provided by ValidMind, so we'll use the [`vm.tests.list_tasks_and_tags()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks_and_tags) to list which `tags` are associated with each `task` type:\n",
-    "\n",
-    "- **`tasks`** represent the kind of modeling task associated with a test. Here we'll focus on `classification` tasks.\n",
-    "- **`tags`** are free-form descriptions providing more details about the test, for example, what category the test falls into. Here we'll focus on the `data_quality` tag."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tasks_and_tags()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Then we'll call [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to list all the data quality tests for classification:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(\n",
-    "    tags=[\"data_quality\"], task=\"classification\"\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about navigating ValidMind tests?</b></span>\n",
-    "<br></br>\n",
-    "Refer to our notebook outlining the utilities available for viewing and understanding available ValidMind tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Run and log an individual data quality test\n",
-    "\n",
-    "Next, we'll use our previously initialized preprocessed dataset (`vm_preprocess_dataset`) as input to run an individual test, then log the result to the ValidMind Platform.\n",
-    "\n",
-    "- You run validation tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module.\n",
-    "- Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform.\n",
-    "\n",
-    "Here, we'll use the [`HighPearsonCorrelation` test](https://docs.validmind.ai/tests/data_validation/HighPearsonCorrelation.html) as an example:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_preprocess_dataset\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your model's documentation for some test IDs. </b></span>\n",
-    "<br></br>\n",
-    "That's expected: when we run validation tests, the logged results need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform. You'll continue to see this message throughout this notebook as we run and log more tests.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_3__'></a>\n",
-    "\n",
-    "### Log multiple data quality tests\n",
-    "\n",
-    "Now that we understand how to run a test with ValidMind, we want to run all the tests that were returned for our `classification` tasks focusing on `data_quality`.\n",
-    "\n",
-    "We'll store the identified tests in `dq` in preparation for batch running these tests and logging their results to the ValidMind Platform:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "dq = vm.tests.list_tests(tags=[\"data_quality\"], task=\"classification\",pretty=False)\n",
-    "dq"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "With our data quality tests stored, let's run our first batch of tests using the same preprocessed dataset (`vm_preprocess_dataset`) and log their results."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for test in dq:\n",
-    "    vm.tests.run_test(\n",
-    "        test,\n",
-    "        inputs={\n",
-    "            \"dataset\": vm_preprocess_dataset\n",
-    "        }\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5_4__'></a>\n",
-    "\n",
-    "### Run data quality comparison tests\n",
-    "\n",
-    "Next, let's reuse the tests in `dq` to perform comparison tests between the raw (`vm_raw_dataset`) and preprocessed (`vm_preprocess_dataset`) dataset, again logging the results to the ValidMind Platform:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for test in dq:\n",
-    "    vm.tests.run_test(\n",
-    "        test,\n",
-    "        input_grid={\n",
-    "            \"dataset\": [vm_raw_dataset,vm_preprocess_dataset]\n",
-    "        }\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Running performance tests\n",
-    "\n",
-    "We'll also run some performance tests, beginning with independent testing of our champion application scorecard model, then moving on to our potential challenger models."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Identify relevant performance tests\n",
-    "\n",
-    "This time, use `vm.tests.list_tests()` to identify all the model performance tests for classification:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "\n",
-    "vm.tests.list_tests(tags=[\"model_performance\"], task=\"classification\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Run and log an individual performance test\n",
-    "\n",
-    "Before we run our batch of performance tests, we'll use our previously initialized testing dataset (`vm_test_ds`) as input to run an individual test, then log the result to the ValidMind Platform.\n",
-    "\n",
-    "When running individual tests, you can use a custom `result_id` to tag the individual result with a unique identifier by appending this `result_id` to the `test_id` with a `:` separator. We'll append an identifier for our champion model here (`xgboost_champion`):\n",
-    "\n",
-    "Here, we'll use the [`ClassifierPerformance` test](https://docs.validmind.ai/tests/model_validation/sklearn/ClassifierPerformance.html) as an example:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.model_validation.sklearn.ClassifierPerformance:xgboost_champion\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_ds, \"model\" : vm_xgb_model\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_3__'></a>\n",
-    "\n",
-    "### Log multiple performance tests\n",
-    "\n",
-    "We only want to run a few other tests that were returned for our `classification` tasks focusing on `model_performance`, so we'll isolate the specific tests we want to batch run in `mpt`:\n",
-    "\n",
-    "- `ClassifierPerformance`\n",
-    "- [`ConfusionMatrix`](https://docs.validmind.ai/tests/model_validation/sklearn/ConfusionMatrix.html)\n",
-    "- [`MinimumAccuracy`](https://docs.validmind.ai/tests/model_validation/sklearn/MinimumAccuracy.html)\n",
-    "- [`MinimumF1Score`](https://docs.validmind.ai/tests/model_validation/sklearn/MinimumF1Score.html)\n",
-    "- [`ROCCurve`](https://docs.validmind.ai/tests/model_validation/sklearn/ROCCurve.html)\n",
-    "\n",
-    "Note the custom `result_id`s appended to the `test_id`s for our champion model (`xgboost_champion`):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "mpt = [\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:xgboost_champion\",\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix:xgboost_champion\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy:xgboost_champion\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score:xgboost_champion\",\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve:xgboost_champion\"\n",
-    "]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_4__'></a>\n",
-    "\n",
-    "### Evaluate performance of the champion model\n",
-    "\n",
-    "Now, let's run and log our batch of model performance tests using our testing dataset (`vm_test_ds`) for our champion model:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for test in mpt:\n",
-    "    vm.tests.run_test(\n",
-    "        test,\n",
-    "        inputs={\n",
-    "            \"dataset\": vm_test_ds, \"model\" : vm_xgb_model\n",
-    "        },\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_5__'></a>\n",
-    "\n",
-    "### Evaluate performance of challenger models\n",
-    "\n",
-    "We've now conducted tests similar to those run by the model development team for our champion model, with the aim of verifying their test results.\n",
-    "\n",
-    "Next, let's see how our challenger models compare. We'll use the same batch of tests here as we did in `mpt`, but append a different `result_id` to indicate that these results should be associated with our challenger models:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "mpt_chall = [\n",
-    "    \"validmind.model_validation.sklearn.ClassifierPerformance:xgboost_champion_vs_challengers\",\n",
-    "    \"validmind.model_validation.sklearn.ConfusionMatrix:xgboost_champion_vs_challengers\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumAccuracy:xgboost_champion_vs_challengers\",\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score:xgboost_champion_vs_challengers\",\n",
-    "    \"validmind.model_validation.sklearn.ROCCurve:xgboost_champion_vs_challengers\"\n",
-    "]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_5_1__'></a>\n",
-    "\n",
-    "#### Enable custom context for test descriptions"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "When you run ValidMind tests, test descriptions are automatically generated with an LLM using the test results, the test name, and the static test definitions provided in the test’s docstring. While this metadata offers valuable high-level overviews of tests, insights produced by the LLM-based descriptions may not always align with your specific use cases or incorporate organizational policy requirements.\n",
-    "\n",
-    "Before we run our next batch of tests, we'll include some custom use case context to focus on comparison testing going forward, improving the relevancy, insight, and format of the test descriptions returned. By default, custom context for LLM-generated descriptions is disabled, meaning that the output will not include any additional context. To enable custom use case context, set the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED` environment variable to `1`.\n",
-    "\n",
-    "This is a global setting that will affect all tests for your linked model:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import os\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\""
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Enabling use case context allows you to pass in additional context to the LLM-generated text descriptions within `context`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import os\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\"\n",
-    "\n",
-    "context = \"\"\"\n",
-    "FORMAT FOR THE LLM DESCRIPTIONS: \n",
-    "    **<Test Name>** is designed to <begin with a concise overview of what the test does and its primary purpose, \n",
-    "    extracted from the test description>.\n",
-    "\n",
-    "    The test operates by <write a paragraph about the test mechanism, explaining how it works and what it measures. \n",
-    "    Include any relevant formulas or methodologies mentioned in the test description.>\n",
-    "\n",
-    "    The primary advantages of this test include <write a paragraph about the test's strengths and capabilities, \n",
-    "    highlighting what makes it particularly useful for specific scenarios.>\n",
-    "\n",
-    "    Users should be aware that <write a paragraph about the test's limitations and potential risks. \n",
-    "    Include both technical limitations and interpretation challenges. \n",
-    "    If the test description includes specific signs of high risk, incorporate these here.>\n",
-    "\n",
-    "    **Key Insights:**\n",
-    "\n",
-    "    The test results reveal:\n",
-    "\n",
-    "    - **<insight title>**: <comprehensive description of one aspect of the results>\n",
-    "    - **<insight title>**: <comprehensive description of another aspect>\n",
-    "    ...\n",
-    "\n",
-    "    Based on these results, <conclude with a brief paragraph that ties together the test results with the test's \n",
-    "    purpose and provides any final recommendations or considerations.>\n",
-    "\n",
-    "ADDITIONAL INSTRUCTIONS:\n",
-    "\n",
-    "    The champion model as the basis for comparison is called \"xgb_model_developer_champion\" and emphasis should be on the following:\n",
-    "    - The metrics for the champion model compared against the challenger models\n",
-    "    - Which model potentially outperforms the champion model based on the metrics, this should be highlighted and emphasized\n",
-    "\n",
-    "\n",
-    "    For each metric in the test results, include in the test overview:\n",
-    "    - The metric's purpose and what it measures\n",
-    "    - Its mathematical formula\n",
-    "    - The range of possible values\n",
-    "    - What constitutes good/bad performance\n",
-    "    - How to interpret different values\n",
-    "\n",
-    "    Each insight should progressively cover:\n",
-    "    1. Overall scope and distribution\n",
-    "    2. Complete breakdown of all elements with specific values\n",
-    "    3. Natural groupings and patterns\n",
-    "    4. Comparative analysis between datasets/categories\n",
-    "    5. Stability and variations\n",
-    "    6. Notable relationships or dependencies\n",
-    "\n",
-    "    Remember:\n",
-    "    - Champion model (xgb_model_developer_champion) is the selection and challenger models are used to challenge the selection\n",
-    "    - Keep all insights at the same level (no sub-bullets or nested structures)\n",
-    "    - Make each insight complete and self-contained\n",
-    "    - Include specific numerical values and ranges\n",
-    "    - Cover all elements in the results comprehensively\n",
-    "    - Maintain clear, concise language\n",
-    "    - Use only \"- **Title**: Description\" format for insights\n",
-    "    - Progress naturally from general to specific observations\n",
-    "\n",
-    "\"\"\".strip()\n",
-    "\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT\"] = context"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about setting custom context for LLM-generated test descriptions?</b></span>\n",
-    "<br></br>\n",
-    "Refer to our extended walkthrough notebook: <a href=\"https://docs.validmind.ai/notebooks/how_to/add_context_to_llm_descriptions.html\" style=\"color: #DE257E;\"><b>Add context to LLM-generated test descriptions\n",
-    "</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6_5_2__'></a>\n",
-    "\n",
-    "#### Run performance comparison tests\n",
-    "\n",
-    "With the use case context set, we'll run each test in `mpt_chall` once for each model with the same `vm_test_ds` dataset to compare them:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for test in mpt_chall:\n",
-    "    vm.tests.run_test(\n",
-    "        test,\n",
-    "        input_grid={\n",
-    "            \"dataset\": [vm_test_ds], \"model\" : [vm_xgb_model,vm_log_model,vm_rf_model]\n",
-    "        }\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Based on the performance metrics, we can conclude that the random forest classification model is not a viable candidate for our use case and can be disregarded in our tests going forward.</b></span>\n",
-    "<br></br>\n",
-    "In the next section, we'll dive a bit deeper into some tests comparing our champion application scorecard model and our remaining challenger logistic regression model, including tests that will allow us to customize parameters and thresholds for performance standards.</div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Adjust a ValidMind test\n",
-    "\n",
-    "Let's dig deeper into the `MinimumF1Score` test we ran previously in Running performance tests to ensure that the models maintain a minimum acceptable balance between *precision* and *recall*. Precision refers to how many of the positive predictions made by the model were actually correct, and recall refers to how many of the actual positive cases the model correctly identified.\n",
-    "\n",
-    "Use `run_test()` with our testing dataset (`vm_test_ds`) to run the test in isolation again for our two remaining models, without logging the result, so that we have a baseline output to compare with a subsequent iteration:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score:xgboost_champion_vs_challengers\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model, vm_log_model]\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "As `MinimumF1Score` allows us to customize parameters and thresholds for performance standards, let's adjust the threshold to see if it improves metrics:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.MinimumF1Score:AdjThreshold\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_test_ds],\n",
-    "        \"model\": [vm_xgb_model, vm_log_model],\n",
-    "        \"params\": {\"min_threshold\": 0.35}\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc8__'></a>\n",
-    "\n",
-    "## Run diagnostic tests\n",
-    "\n",
-    "Next, we want to inspect the robustness and stability testing comparison between our champion and challenger model.\n",
-    "\n",
-    "Use `list_tests()` to list all available diagnosis tests applicable to classification tasks:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.list_tests(tags=[\"model_diagnosis\"], task=\"classification\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let's see if models suffer from any *overfit* potentials and also where there are potential sub-segments of issues with the [`OverfitDiagnosis` test](https://docs.validmind.ai/tests/model_validation/sklearn/OverfitDiagnosis.html). \n",
-    "\n",
-    "Overfitting occurs when a model learns the training data too well, capturing not only the true pattern but noise and random fluctuations resulting in excellent performance on the training dataset but poor generalization to new, unseen data."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.model_validation.sklearn.OverfitDiagnosis:Champion_vs_LogRegression\",\n",
-    "    input_grid={\n",
-    "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
-    "        \"model\" : [vm_xgb_model,vm_log_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let's also conduct *robustness* and *stability* testing of the two models with the [`RobustnessDiagnosis` test](https://docs.validmind.ai/tests/model_validation/sklearn/RobustnessDiagnosis.html).\n",
-    "\n",
-    "Robustness refers to a model's ability to maintain consistent performance, and stability refers to a model's ability to produce consistent outputs over time across different data subsets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    test_id=\"validmind.model_validation.sklearn.RobustnessDiagnosis:Champion_vs_LogRegression\",\n",
-    "    input_grid={\n",
-    "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
-    "        \"model\" : [vm_xgb_model,vm_log_model]\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc9__'></a>\n",
-    "\n",
-    "## Run feature importance tests\n",
-    "\n",
-    "We also want to verify the relative influence of different input features on our models' predictions, as well as inspect the differences between our champion and challenger model to see if a certain model offers more understandable or logical importance scores for features.\n",
-    "\n",
-    "Use `list_tests()` to identify all the feature importance tests for classification:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Store the feature importance tests\n",
-    "FI = vm.tests.list_tests(tags=[\"feature_importance\"], task=\"classification\",pretty=False)\n",
-    "FI"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Run and log our feature importance tests for both models for the testing dataset\n",
-    "for test in FI:\n",
-    "    vm.tests.run_test(\n",
-    "        \"\".join((test,':Champion_vs_LogisticRegression')),\n",
-    "        input_grid={\n",
-    "            \"dataset\": [vm_test_ds], \"model\" : [vm_xgb_model,vm_log_model]\n",
-    "        },\n",
-    "    ).log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc10__'></a>\n",
-    "\n",
-    "## Implement a custom test\n",
-    "\n",
-    "Let's finish up testing by implementing a custom *inline test* that outputs a FICO score-type score. An inline test refers to a test written and executed within the same environment as the code being tested — in this case, right in this Jupyter Notebook —  without requiring a separate test file or framework.\n",
-    "\n",
-    "The [`@vm.test` wrapper](https://docs.validmind.ai/validmind/validmind.html#test) allows you to create a reusable test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import numpy as np\n",
-    "import pandas as pd\n",
-    "import plotly.graph_objects as go\n",
-    "\n",
-    "@vm.test(\"my_custom_tests.ScoreToOdds\")\n",
-    "def score_to_odds_analysis(dataset, score_column='score', score_bands=[410, 440, 470]):\n",
-    "    \"\"\"\n",
-    "    Analyzes the relationship between score bands and odds (good:bad ratio).\n",
-    "    Good odds = (1 - default_rate) / default_rate\n",
-    "    \n",
-    "    Higher scores should correspond to higher odds of being good.\n",
-    "\n",
-    "    If there are multiple scores provided through score_column, this means that there are two different models and the scores reflect each model\n",
-    "\n",
-    "    If there are more scores provided in the score_column then focus the assessment on the differences between the two scores and indicate through evidence which one is preferred.\n",
-    "    \"\"\"\n",
-    "    df = dataset.df\n",
-    "    \n",
-    "    # Create score bands\n",
-    "    df['score_band'] = pd.cut(\n",
-    "        df[score_column],\n",
-    "        bins=[-np.inf] + score_bands + [np.inf],\n",
-    "        labels=[f'<{score_bands[0]}'] + \n",
-    "               [f'{score_bands[i]}-{score_bands[i+1]}' for i in range(len(score_bands)-1)] +\n",
-    "               [f'>{score_bands[-1]}']\n",
-    "    )\n",
-    "    \n",
-    "    # Calculate metrics per band\n",
-    "    results = df.groupby('score_band').agg({\n",
-    "        dataset.target_column: ['mean', 'count']\n",
-    "    })\n",
-    "    \n",
-    "    results.columns = ['Default Rate', 'Total']\n",
-    "    results['Good Count'] = results['Total'] - (results['Default Rate'] * results['Total'])\n",
-    "    results['Bad Count'] = results['Default Rate'] * results['Total']\n",
-    "    results['Odds'] = results['Good Count'] / results['Bad Count']\n",
-    "    \n",
-    "    # Create visualization\n",
-    "    fig = go.Figure()\n",
-    "    \n",
-    "    # Add odds bars\n",
-    "    fig.add_trace(go.Bar(\n",
-    "        name='Odds (Good:Bad)',\n",
-    "        x=results.index,\n",
-    "        y=results['Odds'],\n",
-    "        marker_color='blue'\n",
-    "    ))\n",
-    "    \n",
-    "    fig.update_layout(\n",
-    "        title='Score-to-Odds Analysis',\n",
-    "        yaxis=dict(title='Odds Ratio (Good:Bad)'),\n",
-    "        showlegend=False\n",
-    "    )\n",
-    "    \n",
-    "    return fig"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "With the custom test available, run and log the test for our champion and challenger models with our testing dataset (`vm_test_ds`):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = vm.tests.run_test(\n",
-    "    \"my_custom_tests.ScoreToOdds:Champion_vs_Challenger\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "    },\n",
-    "    param_grid={\n",
-    "        \"score_column\": [\"xgb_scores\",\"log_scores\"],\n",
-    "        \"score_bands\": [[500, 540, 570]],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about custom tests?</b></span>\n",
-    "<br></br>\n",
-    "Refer to our in-depth introduction to custom tests: <a href=\"../../how_to/tests/custom_tests/implement_custom_tests.ipynb\" style=\"color: #DE257E;\"><b>Implement custom tests</b></a></div>"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc11__'></a>\n",
-    "\n",
-    "## Verify test runs\n",
-    "\n",
-    "Our final task is to verify that all the tests provided by the model development team were run and reported accurately. Note the appended `result_ids` to delineate which dataset we ran the test with for the relevant tests.\n",
-    "\n",
-    "Here, we'll specify all the tests we'd like to independently rerun in a dictionary called `test_config`. **Note here that `inputs` and `input_grid` expect the `input_id` of the dataset or model as the value rather than the variable name we specified**:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test_config = {\n",
-    "    # Run with the raw dataset\n",
-    "    'validmind.data_validation.DatasetDescription:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.DescriptiveStatistics:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.MissingValues:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percentage_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.ClassImbalance:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percent_threshold': 10}\n",
-    "    },\n",
-    "    'validmind.data_validation.Duplicates:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.HighCardinality:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {\n",
-    "            'num_threshold': 100,\n",
-    "            'percent_threshold': 0.1,\n",
-    "            'threshold_type': 'percent'\n",
-    "        }\n",
-    "    },\n",
-    "    'validmind.data_validation.Skewness:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'max_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.UniqueRows:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'min_percent_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TooManyZeroValues:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'max_percent_threshold': 0.03}\n",
-    "    },\n",
-    "    'validmind.data_validation.IQROutliersTable:raw_data': {\n",
-    "        'inputs': {'dataset': 'raw_dataset'},\n",
-    "        'params': {'threshold': 5}\n",
-    "    },\n",
-    "    # Run with the preprocessed dataset\n",
-    "    'validmind.data_validation.DescriptiveStatistics:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularDescriptionTables:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.MissingValues:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'},\n",
-    "        'params': {'min_percentage_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularNumericalHistograms:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularCategoricalBarPlots:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'}\n",
-    "    },\n",
-    "    'validmind.data_validation.TargetRateBarPlots:preprocessed_data': {\n",
-    "        'inputs': {'dataset': 'preprocess_dataset'},\n",
-    "        'params': {'default_column': 'loan_status'}\n",
-    "    },\n",
-    "    # Run with the training and test datasets\n",
-    "    'validmind.data_validation.DescriptiveStatistics:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularDescriptionTables:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
-    "    },\n",
-    "    'validmind.data_validation.ClassImbalance:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
-    "        'params': {'min_percent_threshold': 10}\n",
-    "    },\n",
-    "    'validmind.data_validation.UniqueRows:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
-    "        'params': {'min_percent_threshold': 1}\n",
-    "    },\n",
-    "    'validmind.data_validation.TabularNumericalHistograms:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
-    "    },\n",
-    "    'validmind.data_validation.MutualInformation:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
-    "        'params': {'min_threshold': 0.01}\n",
-    "    },\n",
-    "    'validmind.data_validation.PearsonCorrelationMatrix:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
-    "    },\n",
-    "    'validmind.data_validation.HighPearsonCorrelation:development_data': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
-    "        'params': {'max_threshold': 0.3, 'top_n_correlations': 10}\n",
-    "    },\n",
-    "    'validmind.model_validation.ModelMetadata': {\n",
-    "        'input_grid': {'model': ['xgb_model_developer_champion', 'rf_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ModelParameters': {\n",
-    "        'input_grid': {'model': ['xgb_model_developer_champion', 'rf_model']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.ROCCurve': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model_developer_champion']}\n",
-    "    },\n",
-    "    'validmind.model_validation.sklearn.MinimumROCAUCScore': {\n",
-    "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model_developer_champion']},\n",
-    "        'params': {'min_threshold': 0.5}\n",
-    "    }\n",
-    "}"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Then batch run and log our tests in `test_config`:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for t in test_config:\n",
-    "    print(t)\n",
-    "    try:\n",
-    "        # Check if test has input_grid\n",
-    "        if 'input_grid' in test_config[t]:\n",
-    "            # For tests with input_grid, pass the input_grid configuration\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
-    "        else:\n",
-    "            # Original logic for regular inputs\n",
-    "            if 'params' in test_config[t]:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
-    "            else:\n",
-    "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
-    "    except Exception as e:\n",
-    "        print(f\"Error running test {t}: {str(e)}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc12__'></a>\n",
-    "\n",
-    "## Next steps"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc12_1__'></a>\n",
-    "\n",
-    "### Work with your validation report\n",
-    "\n",
-    "Now that you've logged all your test results and verified the work done by the model development team, head to the ValidMind Platform to wrap up your validation report:\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
-    "\n",
-    "Include your logged test results as evidence, create risk assessment notes, add artifacts, and assess compliance, then submit your report for review when it's ready. **Learn more:** [Preparing validation reports](https://docs.validmind.ai/guide/model-validation/preparing-validation-reports.html)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc12_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc13__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-bb563dd58ddf40f49499ddf7f72b21a1",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "name": "python",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
-}
diff --git a/site/notebooks/use_cases/nlp_and_llm/foundation_models_integration_demo.ipynb b/site/notebooks/use_cases/nlp_and_llm/foundation_models_integration_demo.ipynb
index a9a82857df..583c0a1ea5 100644
--- a/site/notebooks/use_cases/nlp_and_llm/foundation_models_integration_demo.ipynb
+++ b/site/notebooks/use_cases/nlp_and_llm/foundation_models_integration_demo.ipynb
@@ -56,7 +56,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind's suite of tools enables organizations to identify, document, and manage model risks for all types of models, including AI/ML models, LLMs, and statistical models. As a model developer, you use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation initiatives. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+    "\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "If this is your first time trying out ValidMind, we recommend going through the following resources first:\n",
     "\n",
@@ -74,7 +76,7 @@
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
     "\n",
     "This notebook requires an OpenAI API secret key to run. If you don't have one, visit [API keys](https://platform.openai.com/account/api-keys) on OpenAI's site to create a new key for yourself. Note that API usage charges may apply.\n",
     "\n",
@@ -127,17 +129,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
+    "\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (**Learn more:** [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -148,10 +152,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `LLM-based Text Classification`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -165,11 +171,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -413,7 +421,7 @@
     "\n",
     "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way: view the prompt validation test results as part of your model documentation in the ValidMind Platform:\n",
     "\n",
-    "1. In the ValidMind Platform, click **Development** under Documents for the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html))\n",
+    "1. In the ValidMind Platform, click **Development** under Documents for the model you registered earlier. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
     "\n",
     "2. Expand **2. Data Preparation** or **3. Model Development** to review all test results.\n",
     "\n",
diff --git a/site/notebooks/use_cases/nlp_and_llm/foundation_models_summarization_demo.ipynb b/site/notebooks/use_cases/nlp_and_llm/foundation_models_summarization_demo.ipynb
index e4c7e067b7..759b0d733f 100644
--- a/site/notebooks/use_cases/nlp_and_llm/foundation_models_summarization_demo.ipynb
+++ b/site/notebooks/use_cases/nlp_and_llm/foundation_models_summarization_demo.ipynb
@@ -8,7 +8,7 @@
     "\n",
     "Document a large language model (LLM) using the ValidMind Library. The use case is a summarization of financial news based on a dataset containing just over 300k unique news articles as written by journalists at CNN and the Daily Mail. \n",
     "\n",
-    "This interactive notebook shows you how to set up the ValidMind Library, initialize the library, and load the dataset, followed by running the model validation tests provided by the ValidMind Library to quickly generate documentation about the data and model."
+    "This interactive notebook shows you how to set up the ValidMind Library, initialize the library, and load the dataset, followed by running the validation tests provided by the ValidMind Library to quickly generate documentation about the data and model."
    ]
   },
   {
@@ -54,7 +54,7 @@
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
     "\n",
     "This notebook requires an OpenAI API secret key to run. If you don't have one, visit [API keys](https://platform.openai.com/account/api-keys) on OpenAI's site to create a new key for yourself. Note that API usage charges may apply.\n",
     "\n",
@@ -69,7 +69,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind's suite of tools enables organizations to identify, document, and manage model risks for all types of models, including AI/ML models, LLMs, and statistical models. As a model developer, you use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+    "\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "If this is your first time trying out ValidMind, we recommend going through the following resources first:\n",
     "\n",
@@ -123,17 +125,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
+    "\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -144,10 +148,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development-type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `LLM-based Text Summarization`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -161,11 +167,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -457,7 +465,7 @@
     "\n",
     "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way: view the prompt validation test results as part of your model documentation in the ValidMind Platform:\n",
     "\n",
-    "1. In the ValidMind Platform, click **Development** under Documents for the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html)\n",
+    "1. In the ValidMind Platform, click **Development** under Documents for the model you registered earlier. (Learn more: [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
     "\n",
     "2. Expand **2. Data Preparation** or **3. Model Development** to review all test results.\n",
     "\n",
diff --git a/site/notebooks/use_cases/nlp_and_llm/hugging_face_integration_demo.ipynb b/site/notebooks/use_cases/nlp_and_llm/hugging_face_integration_demo.ipynb
index a83eeed947..ceefd99f7d 100644
--- a/site/notebooks/use_cases/nlp_and_llm/hugging_face_integration_demo.ipynb
+++ b/site/notebooks/use_cases/nlp_and_llm/hugging_face_integration_demo.ipynb
@@ -55,7 +55,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind's suite of tools enables organizations to identify, document, and manage model risks for all types of models, including AI/ML models, LLMs, and statistical models. As a model developer, you use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation initiatives. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+    "\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "If this is your first time trying out ValidMind, we recommend going through the following resources first:\n",
     "\n",
@@ -73,7 +75,7 @@
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
     "\n",
     "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
    ]
@@ -124,17 +126,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
+    "\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -145,10 +149,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development-type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `NLP-based Text Classification`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -162,11 +168,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -392,7 +400,7 @@
     "\n",
     "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way: view the prompt validation test results as part of your model documentation in the ValidMind Platform:\n",
     "\n",
-    "1. In the ValidMind Platform, click **Development** under Documents for the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html)\n",
+    "1. In the ValidMind Platform, click **Development** under Documents for the model you registered earlier. (Learn more: [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
     "\n",
     "2. Expand **2. Data Preparation** or **3. Model Development** to review all test results.\n",
     "\n",
diff --git a/site/notebooks/use_cases/nlp_and_llm/hugging_face_summarization_demo.ipynb b/site/notebooks/use_cases/nlp_and_llm/hugging_face_summarization_demo.ipynb
index 290bf7c545..5db308064b 100644
--- a/site/notebooks/use_cases/nlp_and_llm/hugging_face_summarization_demo.ipynb
+++ b/site/notebooks/use_cases/nlp_and_llm/hugging_face_summarization_demo.ipynb
@@ -8,7 +8,7 @@
     "\n",
     "Document a natural language processing (NLP) model using ValidMind to summarize financial news, based on a dataset of just over 300,000 unique news articles written by journalists at CNN and the Daily Mail.\n",
     "\n",
-    "This interactive notebook shows you how to set up the ValidMind Library, initialize the library, and load the dataset, followed by running the model validation tests provided by the ValidMind Library to quickly generate documentation about the data and model."
+    "This interactive notebook shows you how to set up the ValidMind Library, initialize the library, and load the dataset, followed by running the validation tests provided by the ValidMind Library to quickly generate documentation about the data and model."
    ]
   },
   {
@@ -52,7 +52,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind's suite of tools enables organizations to identify, document, and manage model risks for all types of models, including AI/ML models, LLMs, and statistical models. As a model developer, you use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+    "\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "If this is your first time trying out ValidMind, we recommend going through the following resources first:\n",
     "\n",
@@ -70,7 +72,7 @@
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
     "\n",
     "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
    ]
@@ -121,17 +123,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
+    "\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -142,10 +146,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development-type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `NLP-based Text Classification`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -159,11 +165,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -413,7 +421,7 @@
     "\n",
     "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way: view the prompt validation test results as part of your model documentation in the ValidMind Platform:\n",
     "\n",
-    "1. In the ValidMind Platform, click **Development** under Documents for the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html)\n",
+    "1. In the ValidMind Platform, click **Development** under Documents for the model you registered earlier. (Learn more: [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
     "\n",
     "2. Expand **2. Data Preparation** or **3. Model Development** to review all test results.\n",
     "\n",
diff --git a/site/notebooks/use_cases/nlp_and_llm/llm_summarization_demo.ipynb b/site/notebooks/use_cases/nlp_and_llm/llm_summarization_demo.ipynb
index a79afa7792..14f7b1ee2c 100644
--- a/site/notebooks/use_cases/nlp_and_llm/llm_summarization_demo.ipynb
+++ b/site/notebooks/use_cases/nlp_and_llm/llm_summarization_demo.ipynb
@@ -86,7 +86,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind's suite of tools enables organizations to identify, document, and manage model risks for all types of models, including AI/ML models, LLMs, and statistical models. As a model developer, you use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+    "\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "If this is your first time trying out ValidMind, you can make use of the following resources alongside this notebook:\n",
     "\n",
@@ -104,7 +106,7 @@
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
     "\n",
     "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
    ]
@@ -155,17 +157,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
+    "\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -176,10 +180,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development-type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `LLM-based Text Summarization`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -193,11 +199,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -930,7 +938,7 @@
     "\n",
     "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way: view the prompt validation test results as part of your model documentation right in the ValidMind Platform:\n",
     "\n",
-    "1. In the ValidMind Platform, click **Development** under Documents for the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html)\n",
+    "1. In the ValidMind Platform, click **Development** under Documents for the model you registered earlier. (Learn more: [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
     "\n",
     "2. Expand **2. Data Preparation** or **3. Model Development** to review all test results.\n",
     "\n",
diff --git a/site/notebooks/use_cases/nlp_and_llm/prompt_validation_demo.ipynb b/site/notebooks/use_cases/nlp_and_llm/prompt_validation_demo.ipynb
index 16b5f7c42c..deeb8293e8 100644
--- a/site/notebooks/use_cases/nlp_and_llm/prompt_validation_demo.ipynb
+++ b/site/notebooks/use_cases/nlp_and_llm/prompt_validation_demo.ipynb
@@ -1,554 +1,566 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Prompt validation for large language models (LLMs)\n",
-    "\n",
-    "Run and document prompt validation tests for a large language model (LLM) specialized in sentiment analysis for financial news. \n",
-    "\n",
-    "This interactive notebook shows you how to set up the ValidMind Library, initialize the library, and use a specific prompt template for analyzing the sentiment of given sentences. Prompt validation covers the initialization of a test dataset and the creation of a foundational model using the ValidMind Library, followed by the execution of a test suite specifically designed for prompt validation. The notebook also includes example data to test the model's ability to correctly identify sentiment as positive, negative, or neutral."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_3__)    \n",
-    "- [Get ready to run the analysis](#toc3__)    \n",
-    "- [Get your sample dataset ready for analysis](#toc4__)    \n",
-    "- [Perform the prompt validation](#toc5__)    \n",
-    "- [Next steps](#toc6__)    \n",
-    "  - [Work with your model documentation](#toc6_1__)    \n",
-    "  - [Discover more learning resources](#toc6_2__)    \n",
-    "- [Upgrade ValidMind](#toc7__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `LLM-based Text Classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Get ready to run the analysis\n",
-    "\n",
-    "Import the ValidMind `FoundationModel` and `Prompt` classes needed for the sentiment analysis later on:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.models import FoundationModel, Prompt"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Check your access to the OpenAI API:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import os\n",
-    "\n",
-    "import dotenv\n",
-    "\n",
-    "dotenv.load_dotenv()\n",
-    "\n",
-    "if os.getenv(\"OPENAI_API_KEY\") is None:\n",
-    "    raise Exception(\"OPENAI_API_KEY not found\")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from openai import OpenAI\n",
-    "\n",
-    "model = OpenAI()\n",
-    "\n",
-    "\n",
-    "def call_model(prompt):\n",
-    "    return (\n",
-    "        model.chat.completions.create(\n",
-    "            model=\"gpt-3.5-turbo\",\n",
-    "            messages=[\n",
-    "                {\"role\": \"user\", \"content\": prompt},\n",
-    "            ],\n",
-    "        )\n",
-    "        .choices[0]\n",
-    "        .message.content\n",
-    "    )"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Set the prompt guidelines for the sentiment analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "prompt_template = \"\"\"\n",
-    "You are an AI with expertise in sentiment analysis, particularly in the context of financial news.\n",
-    "Your task is to analyze the sentiment of a specific sentence provided below.\n",
-    "Before proceeding, take a moment to understand the context and nuances of the financial terminology used in the sentence.\n",
-    "\n",
-    "Sentence to Analyze:\n",
-    "```\n",
-    "{Sentence}\n",
-    "```\n",
-    "\n",
-    "Please respond with the sentiment of the sentence denoted by one of either 'positive', 'negative', or 'neutral'.\n",
-    "Please respond only with the sentiment enum value. Do not include any other text in your response.\n",
-    "\n",
-    "Note: Ensure that your analysis is based on the content of the sentence and not on external information or assumptions.\n",
-    "\"\"\".strip()\n",
-    "\n",
-    "prompt_variables = [\"Sentence\"]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Get your sample dataset ready for analysis\n",
-    "\n",
-    "To perform the sentiment analysis for financial news we're going to load a local copy of this dataset: https://www.kaggle.com/datasets/ankurzing/sentiment-analysis-for-financial-news.\n",
-    "\n",
-    "This dataset contains two columns, `Sentiment` and `Sentence`. The sentiment can be `negative`, `neutral` or `positive`."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import pandas as pd\n",
-    "\n",
-    "df = pd.read_csv(\"./datasets/sentiments.csv\")\n",
-    "\n",
-    "df_test = df[:10].reset_index(drop=True)\n",
-    "df_test"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Perform the prompt validation\n",
-    "\n",
-    "First, use the ValidMind Library to initialize the dataset and model objects necessary for documentation. The ValidMind `predict_fn` function allows the model to be tested and evaluated in a standardized manner:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_test_ds = vm.init_dataset(\n",
-    "    dataset=df_test,\n",
-    "    input_id=\"test_dataset\",\n",
-    "    text_column=\"Sentence\",\n",
-    "    target_column=\"Sentiment\",\n",
-    ")\n",
-    "\n",
-    "vm_model = vm.init_model(\n",
-    "    model=FoundationModel(\n",
-    "        predict_fn=call_model,\n",
-    "        prompt=Prompt(\n",
-    "            template=prompt_template,\n",
-    "            variables=prompt_variables,\n",
-    "        ),\n",
-    "    ),\n",
-    "    input_id=\"gpt_35_model\",\n",
-    ")\n",
-    "\n",
-    "# Assign model predictions to the test dataset\n",
-    "vm_test_ds.assign_predictions(vm_model)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Next, use the ValidMind Library to run validation tests on the model. These tests evaluate various aspects of the prompts, including bias, clarity, conciseness, delimitation, negative instruction, and specificity.\n",
-    "\n",
-    "Each test is explained in detail, highlighting its purpose, test mechanism, and the importance of the specific aspect being evaluated. The tests are graded on a scale from 1 to 10, with a predetermined threshold, and the explanations for each test include a score, threshold, and a pass/fail determination."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test_suite_results = vm.run_test_suite(\n",
-    "    \"prompt_validation\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_test_ds,\n",
-    "        \"model\": vm_model,\n",
-    "    },\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Here, most of the tests pass but the test for _conciseness_ needs further attention, as it fails the threshold. This test is designed to evaluate the brevity and succinctness of prompts provided to a large language model (LLM).\n",
-    "\n",
-    "The test matters, because a concise prompt strikes a balance between offering clear instructions and eliminating redundant or unnecessary information, ensuring that the LLM receives relevant input without being overwhelmed."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc6_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Model Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. Click and expand the **Model Development** section.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc6_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc7__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-da0317263ddc4a119cb7b306ac1b39c1",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": ".venv",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.8.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Prompt validation for large language models (LLMs)\n",
+        "\n",
+        "Run and document prompt validation tests for a large language model (LLM) specialized in sentiment analysis for financial news. \n",
+        "\n",
+        "This interactive notebook shows you how to set up the ValidMind Library, initialize the library, and use a specific prompt template for analyzing the sentiment of given sentences. Prompt validation covers the initialization of a test dataset and the creation of a foundational model using the ValidMind Library, followed by the execution of a test suite specifically designed for prompt validation. The notebook also includes example data to test the model's ability to correctly identify sentiment as positive, negative, or neutral."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_3__)    \n",
+        "- [Get ready to run the analysis](#toc3__)    \n",
+        "- [Get your sample dataset ready for analysis](#toc4__)    \n",
+        "- [Perform the prompt validation](#toc5__)    \n",
+        "- [Next steps](#toc6__)    \n",
+        "  - [Work with your model documentation](#toc6_1__)    \n",
+        "  - [Discover more learning resources](#toc6_2__)    \n",
+        "- [Upgrade ValidMind](#toc7__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook, but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records (such as models) and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, documentation templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `LLM-based Text Classification`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Get ready to run the analysis\n",
+        "\n",
+        "Import the ValidMind `FoundationModel` and `Prompt` classes needed for the sentiment analysis later on:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.models import FoundationModel, Prompt"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Check your access to the OpenAI API:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import os\n",
+        "\n",
+        "import dotenv\n",
+        "\n",
+        "dotenv.load_dotenv()\n",
+        "\n",
+        "if os.getenv(\"OPENAI_API_KEY\") is None:\n",
+        "    raise Exception(\"OPENAI_API_KEY not found\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from openai import OpenAI\n",
+        "\n",
+        "model = OpenAI()\n",
+        "\n",
+        "\n",
+        "def call_model(prompt):\n",
+        "    return (\n",
+        "        model.chat.completions.create(\n",
+        "            model=\"gpt-3.5-turbo\",\n",
+        "            messages=[\n",
+        "                {\"role\": \"user\", \"content\": prompt},\n",
+        "            ],\n",
+        "        )\n",
+        "        .choices[0]\n",
+        "        .message.content\n",
+        "    )"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Set the prompt guidelines for the sentiment analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "prompt_template = \"\"\"\n",
+        "You are an AI with expertise in sentiment analysis, particularly in the context of financial news.\n",
+        "Your task is to analyze the sentiment of a specific sentence provided below.\n",
+        "Before proceeding, take a moment to understand the context and nuances of the financial terminology used in the sentence.\n",
+        "\n",
+        "Sentence to Analyze:\n",
+        "```\n",
+        "{Sentence}\n",
+        "```\n",
+        "\n",
+        "Please respond with the sentiment of the sentence denoted by one of either 'positive', 'negative', or 'neutral'.\n",
+        "Please respond only with the sentiment enum value. Do not include any other text in your response.\n",
+        "\n",
+        "Note: Ensure that your analysis is based on the content of the sentence and not on external information or assumptions.\n",
+        "\"\"\".strip()\n",
+        "\n",
+        "prompt_variables = [\"Sentence\"]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Get your sample dataset ready for analysis\n",
+        "\n",
+        "To perform the sentiment analysis for financial news, we're going to load a local copy of this dataset: https://www.kaggle.com/datasets/ankurzing/sentiment-analysis-for-financial-news.\n",
+        "\n",
+        "This dataset contains two columns, `Sentiment` and `Sentence`. The sentiment can be `negative`, `neutral` or `positive`."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import pandas as pd\n",
+        "\n",
+        "df = pd.read_csv(\"./datasets/sentiments.csv\")\n",
+        "\n",
+        "df_test = df[:10].reset_index(drop=True)\n",
+        "df_test"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Perform the prompt validation\n",
+        "\n",
+        "First, use the ValidMind Library to initialize the dataset and model objects necessary for documentation. The `predict_fn` argument passed to the ValidMind `FoundationModel` class allows the model to be tested and evaluated in a standardized manner:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=df_test,\n",
+        "    input_id=\"test_dataset\",\n",
+        "    text_column=\"Sentence\",\n",
+        "    target_column=\"Sentiment\",\n",
+        ")\n",
+        "\n",
+        "vm_model = vm.init_model(\n",
+        "    model=FoundationModel(\n",
+        "        predict_fn=call_model,\n",
+        "        prompt=Prompt(\n",
+        "            template=prompt_template,\n",
+        "            variables=prompt_variables,\n",
+        "        ),\n",
+        "    ),\n",
+        "    input_id=\"gpt_35_model\",\n",
+        ")\n",
+        "\n",
+        "# Assign model predictions to the test dataset\n",
+        "vm_test_ds.assign_predictions(vm_model)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Next, use the ValidMind Library to run validation tests on the model. These tests evaluate various aspects of the prompts, including bias, clarity, conciseness, delimitation, negative instruction, and specificity.\n",
+        "\n",
+        "Each test is explained in detail, highlighting its purpose, test mechanism, and the importance of the specific aspect being evaluated. The tests are graded on a scale from 1 to 10, with a predetermined threshold, and the explanations for each test include a score, threshold, and a pass/fail determination."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test_suite_results = vm.run_test_suite(\n",
+        "    \"prompt_validation\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "        \"model\": vm_model,\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Here, most of the tests pass but the test for _conciseness_ needs further attention, as it fails the threshold. This test is designed to evaluate the brevity and succinctness of prompts provided to a large language model (LLM).\n",
+        "\n",
+        "The test matters because a concise prompt strikes a balance between offering clear instructions and eliminating redundant or unnecessary information, ensuring that the LLM receives relevant input without being overwhelmed."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (**Learn more:** [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. Click and expand the **Model Development** section.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-da0317263ddc4a119cb7b306ac1b39c1"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": ".venv",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.8.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/use_cases/nlp_and_llm/rag_benchmark_demo.ipynb b/site/notebooks/use_cases/nlp_and_llm/rag_benchmark_demo.ipynb
index 3c036bc62f..a224f1721f 100644
--- a/site/notebooks/use_cases/nlp_and_llm/rag_benchmark_demo.ipynb
+++ b/site/notebooks/use_cases/nlp_and_llm/rag_benchmark_demo.ipynb
@@ -82,9 +82,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
     "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "<a id='toc1_1__'></a>\n",
     "\n",
@@ -98,11 +98,11 @@
     "\n",
     "### New to ValidMind?\n",
     "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
+    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
     "\n",
     "<a id='toc1_3__'></a>\n",
     "\n",
@@ -190,17 +190,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+    "\n",
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -211,10 +213,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `Gen AI RAG`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -242,11 +246,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
diff --git a/site/notebooks/use_cases/nlp_and_llm/rag_documentation_demo.ipynb b/site/notebooks/use_cases/nlp_and_llm/rag_documentation_demo.ipynb
index 744acddc91..7589bd17b7 100644
--- a/site/notebooks/use_cases/nlp_and_llm/rag_documentation_demo.ipynb
+++ b/site/notebooks/use_cases/nlp_and_llm/rag_documentation_demo.ipynb
@@ -81,9 +81,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
     "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "<a id='toc1_1__'></a>\n",
     "\n",
@@ -97,11 +97,11 @@
     "\n",
     "### New to ValidMind?\n",
     "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
+    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
     "\n",
     "<a id='toc1_3__'></a>\n",
     "\n",
@@ -165,16 +165,18 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+    "\n",
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -185,10 +187,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `Gen AI RAG`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -216,11 +220,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
diff --git a/site/notebooks/use_cases/ongoing_monitoring/application_scorecard_ongoing_monitoring.ipynb b/site/notebooks/use_cases/ongoing_monitoring/application_scorecard_ongoing_monitoring.ipynb
index df159619f9..847417cf02 100644
--- a/site/notebooks/use_cases/ongoing_monitoring/application_scorecard_ongoing_monitoring.ipynb
+++ b/site/notebooks/use_cases/ongoing_monitoring/application_scorecard_ongoing_monitoring.ipynb
@@ -1,1382 +1,1399 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Ongoing Monitoring for Application Scorecard\n",
-    "\n",
-    "In this notebook, you'll learn how to seamlessly monitor your production models using the ValidMind Platform.\n",
-    "\n",
-    "We'll walk you through the process of initializing the ValidMind Library, loading a sample dataset and model, and running a monitoring test suite to quickly generate documentation about your new data and model."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply monitoring report template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Preview the monitoring report template](#toc2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_4__)    \n",
-    "  - [Preview the monitoring template](#toc2_5__)    \n",
-    "- [Load the reference and monitoring datasets](#toc3__)    \n",
-    "- [Train the model](#toc4__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc4_1__)    \n",
-    "  - [Initialize a model object](#toc4_2__)    \n",
-    "  - [Assign prediction values and probabilities to the datasets](#toc4_3__)    \n",
-    "  - [Compute credit risk scores](#toc4_4__)    \n",
-    "  - [Adding custom context to the LLM descriptions](#toc4_5__)    \n",
-    "  - [Monitoring data description](#toc4_6__)    \n",
-    "  - [Target and feature drift](#toc4_7__)    \n",
-    "  - [Classification accuracy](#toc4_8__)    \n",
-    "  - [Class discrimination](#toc4_9__)    \n",
-    "  - [Scoring](#toc4_10__)    \n",
-    "  - [Model insights](#toc4_11__)    \n",
-    "  - [Diagnostic monitoring](#toc4_12__)    \n",
-    "  - [Robustness monitoring](#toc4_13__)    \n",
-    "  - [Performance history](#toc4_14__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation, validation, monitoring tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Model monitoring report**: A comprehensive and structured record of a production model, including key elements such as data sources, inputs, performance metrics, and periodic evaluations. This documentation ensures transparency and visibility of the model's performance in the production environment.\n",
-    "\n",
-    "**Monitoring report template**: Similar to documentation template, The monitoring report template functions as a test suite and lays out the structure of model monitoring, segmented into various sections and sub-sections. Monitoring report templates define the structure of your model monitoring report, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply monitoring report template\n",
-    "\n",
-    "Once you've registered your model, let's select a monitoring report template. A template predefines sections for your monitoring report and provides a general outline to follow, making the monitoring process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Monitoring**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Ongoing Monitoring for Classification Models`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Monitoring` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"monitoring\",\n",
-    "    monitoring = True,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Preview the monitoring report template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost as xgb\n",
-    "import numpy as np\n",
-    "\n",
-    "from datetime import datetime, timedelta\n",
-    "\n",
-    "from validmind.tests import run_test\n",
-    "from validmind.datasets.credit_risk import lending_club\n",
-    "from validmind.unit_metrics import list_metrics\n",
-    "from validmind.unit_metrics import describe_metric\n",
-    "from validmind.unit_metrics import run_metric\n",
-    "from validmind.api_client import log_metric\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_5__'></a>\n",
-    "\n",
-    "### Preview the monitoring template\n",
-    "\n",
-    "A template predefines sections for your model monitoring documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "You will upload documentation and test results into this template later on. For now, take a look at the structure that the template provides with the `vm.preview_template()` function from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the reference and monitoring datasets\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library. For demonstration purposes we'll use the training, test dataset splits as `reference` and `monitoring` datasets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "df = lending_club.load_data(source=\"offline\")\n",
-    "df.head()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "preprocess_df = lending_club.preprocess(df)\n",
-    "preprocess_df.head()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "fe_df = lending_club.feature_engineering(preprocess_df)\n",
-    "fe_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Train the model\n",
-    "\n",
-    "In this section, we focus on constructing and refining our predictive model. \n",
-    "- We begin by dividing our data, which is based on Weight of Evidence (WoE) features, into training and testing sets (`train_df`, `test_df`). \n",
-    "- With `lending_club.split`, we employ a simple random split, randomly allocating data points to each set to ensure a mix of examples in both."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Split the data\n",
-    "train_df, test_df = lending_club.split(fe_df, test_size=0.2)\n",
-    "\n",
-    "x_train = train_df.drop(lending_club.target_column, axis=1)\n",
-    "y_train = train_df[lending_club.target_column]\n",
-    "\n",
-    "x_test = test_df.drop(lending_club.target_column, axis=1)\n",
-    "y_test = test_df[lending_club.target_column]"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Define the XGBoost model\n",
-    "xgb_model = xgb.XGBClassifier(\n",
-    "    n_estimators=50, \n",
-    "    random_state=42, \n",
-    "    early_stopping_rounds=10\n",
-    ")\n",
-    "xgb_model.set_params(\n",
-    "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
-    ")\n",
-    "\n",
-    "# Fit the model\n",
-    "xgb_model.fit(\n",
-    "    x_train, \n",
-    "    y_train,\n",
-    "    eval_set=[(x_test, y_test)],\n",
-    "    verbose=False\n",
-    ")\n",
-    "\n",
-    "# Compute probabilities\n",
-    "train_xgb_prob = xgb_model.predict_proba(x_train)[:, 1]\n",
-    "test_xgb_prob = xgb_model.predict_proba(x_test)[:, 1]\n",
-    "\n",
-    "# Compute binary predictions\n",
-    "cut_off_threshold = 0.3\n",
-    "train_xgb_binary_predictions = (train_xgb_prob > cut_off_threshold).astype(int)\n",
-    "test_xgb_binary_predictions = (test_xgb_prob > cut_off_threshold).astype(int)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset` — The raw dataset that you want to provide as input to tests.\n",
-    "- `input_id` - A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- `target_column` — A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
-    "\n",
-    "With all datasets ready, you can now initialize training, reference(test) and monitor datasets (`reference_df` and `monitor_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_reference_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"reference_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_monitoring_ds = vm.init_dataset(\n",
-    "    dataset=test_df,\n",
-    "    input_id=\"monitoring_dataset\",\n",
-    "    target_column=lending_club.target_column,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Initialize a model object\n",
-    "\n",
-    "You will also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data. You simply intialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_xgb_model = vm.init_model(\n",
-    "    xgb_model,\n",
-    "    input_id=\"xgb_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3__'></a>\n",
-    "\n",
-    "### Assign prediction values and probabilities to the datasets\n",
-    "\n",
-    "With our model now trained, we'll move on to assigning both the predictive probabilities coming directly from the model's predictions, and the binary prediction after applying the cutoff threshold described in the previous steps. \n",
-    "- These tasks are achieved through the use of the `assign_predictions()` method associated with the VM `dataset` object.\n",
-    "- This method links the model's class prediction values and probabilities to our VM train and test datasets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_reference_ds.assign_predictions(\n",
-    "    model=vm_xgb_model,\n",
-    "    prediction_values=train_xgb_binary_predictions,\n",
-    "    prediction_probabilities=train_xgb_prob,\n",
-    ")\n",
-    "\n",
-    "vm_monitoring_ds.assign_predictions(\n",
-    "    model=vm_xgb_model,\n",
-    "    prediction_values=test_xgb_binary_predictions,\n",
-    "    prediction_probabilities=test_xgb_prob,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4__'></a>\n",
-    "\n",
-    "### Compute credit risk scores\n",
-    "\n",
-    "In this phase, we translate model predictions into actionable scores using probability estimates generated by our trained model."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "train_xgb_scores = lending_club.compute_scores(train_xgb_prob)\n",
-    "test_xgb_scores = lending_club.compute_scores(test_xgb_prob)\n",
-    "\n",
-    "# Assign scores to the datasets\n",
-    "vm_reference_ds.add_extra_column(\"xgb_scores\", train_xgb_scores)\n",
-    "vm_monitoring_ds.add_extra_column(\"xgb_scores\", test_xgb_scores)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_5__'></a>\n",
-    "\n",
-    "### Adding custom context to the LLM descriptions\n",
-    "\n",
-    "To enable the LLM descriptions context, you need to set the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED` environment variable to `1`. This will enable the LLM descriptions context, which will be used to provide additional context to the LLM descriptions. This is a global setting that will affect all tests."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import os\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\"\n",
-    "\n",
-    "context = \"\"\"\n",
-    "FORMAT FOR THE LLM DESCRIPTIONS: \n",
-    "    **<Test Name>** is designed to <begin with a concise overview of what the test does and its primary purpose, \n",
-    "    extracted from the test description>.\n",
-    "\n",
-    "    The test operates by <write a paragraph about the test mechanism, explaining how it works and what it measures. \n",
-    "    Include any relevant formulas or methodologies mentioned in the test description.>\n",
-    "\n",
-    "    The primary advantages of this test include <write a paragraph about the test's strengths and capabilities, \n",
-    "    highlighting what makes it particularly useful for specific scenarios.>\n",
-    "\n",
-    "    Users should be aware that <write a paragraph about the test's limitations and potential risks. \n",
-    "    Include both technical limitations and interpretation challenges. \n",
-    "    If the test description includes specific signs of high risk, incorporate these here.>\n",
-    "\n",
-    "    **Key Insights:**\n",
-    "\n",
-    "    The test results reveal:\n",
-    "\n",
-    "    - **<insight title>**: <comprehensive description of one aspect of the results>\n",
-    "    - **<insight title>**: <comprehensive description of another aspect>\n",
-    "    ...\n",
-    "\n",
-    "    Based on these results, <conclude with a brief paragraph that ties together the test results with the test's \n",
-    "    purpose and provides any final recommendations or considerations.>\n",
-    "\n",
-    "ADDITIONAL INSTRUCTIONS:\n",
-    "    Present insights in order from general to specific, with each insight as a single bullet point with bold title.\n",
-    "\n",
-    "    For each metric in the test results, include in the test overview:\n",
-    "    - The metric's purpose and what it measures\n",
-    "    - Its mathematical formula\n",
-    "    - The range of possible values\n",
-    "    - What constitutes good/bad performance\n",
-    "    - How to interpret different values\n",
-    "\n",
-    "    Each insight should progressively cover:\n",
-    "    1. Overall scope and distribution\n",
-    "    2. Complete breakdown of all elements with specific values\n",
-    "    3. Natural groupings and patterns\n",
-    "    4. Comparative analysis between datasets/categories\n",
-    "    5. Stability and variations\n",
-    "    6. Notable relationships or dependencies\n",
-    "\n",
-    "    Remember:\n",
-    "    - Keep all insights at the same level (no sub-bullets or nested structures)\n",
-    "    - Make each insight complete and self-contained\n",
-    "    - Include specific numerical values and ranges\n",
-    "    - Cover all elements in the results comprehensively\n",
-    "    - Maintain clear, concise language\n",
-    "    - Use only \"- **Title**: Description\" format for insights\n",
-    "    - Progress naturally from general to specific observations\n",
-    "\n",
-    "\"\"\".strip()\n",
-    "\n",
-    "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT\"] = context"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_6__'></a>\n",
-    "\n",
-    "### Monitoring data description\n",
-    "\n",
-    "The Monitoring Data Description tests aim to provide a comprehensive statistical analysis of the monitoring dataset's characteristics. These tests examine the basic statistical properties, identify any missing data patterns, assess data uniqueness, visualize numerical feature distributions, and evaluate feature relationships through correlation analysis.\n",
-    "\n",
-    "The primary objective is to establish a baseline understanding of the monitoring data's structure and quality, enabling the detection of any significant deviations from expected patterns that could impact model performance. Each test is designed to capture different aspects of the data, from univariate statistics to multivariate relationships, providing a foundation for ongoing data quality assessment in the production environment."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.DescriptiveStatistics:monitoring_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.MissingValues:monitoring_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percentage_threshold\": 1\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.UniqueRows:monitoring_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"min_percent_threshold\": 1\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.TabularNumericalHistograms:monitoring_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.PearsonCorrelationMatrix:monitoring_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.data_validation.HighPearsonCorrelation:monitoring_data\",\n",
-    "    inputs={\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"feature_columns\": vm_monitoring_ds.feature_columns,\n",
-    "        \"max_threshold\": 0.5,\n",
-    "        \"top_n_correlations\": 10\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.ClassImbalanceDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"drift_pct_threshold\": 1\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_7__'></a>\n",
-    "\n",
-    "### Target and feature drift\n",
-    "\n",
-    "Next, the goal is to investigate the distributional characteristics of predictions and features to determine if the underlying data has changed. These tests are crucial for assessing the expected accuracy of the model.\n",
-    "\n",
-    "1. **Target drift:** We compare the dataset used for testing (reference data) with the monitoring data. This helps to identify any shifts in the target variable distribution.\n",
-    "2. **Feature drift:** We compare the training dataset with the monitoring data. Since features were used to train the model, any drift in these features could indicate potential issues, as the underlying patterns that the model was trained on may have changed."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Next, we can examine the correlation between features and predictions. Significant changes in these correlations may trigger a deeper assessment."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.PopulationStabilityIndex\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.TargetPredictionDistributionPlot\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"drift_pct_threshold\": 5\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now we want see difference in correlation pairs between model prediction and features."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.PredictionCorrelation\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"drift_pct_threshold\": 5\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Finally for target drift, let's plot each prediction value and feature grid side by side."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.PredictionQuantilesAcrossFeatures\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Next, let's add run a test to investigate how or if the features have drifted. In this instance we want to compare the training data with prediction data."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.FeatureDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"psi_threshold\": 0.2,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_8__'></a>\n",
-    "\n",
-    "### Classification accuracy\n",
-    "\n",
-    "We now evaluate the model's predictive performance by comparing its behavior between reference and monitoring datasets. These tests analyze shifts in overall accuracy metrics, examine changes in the confusion matrix to identify specific classification pattern changes, and assess the model's probability calibration across different prediction thresholds. \n",
-    "\n",
-    "The primary objective is to detect any degradation in the model's classification performance that might indicate reliability issues in production. The tests provide both aggregate performance metrics and detailed breakdowns of prediction patterns, enabling the identification of specific areas where the model's accuracy might be deteriorating."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.ClassificationAccuracyDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"drift_pct_threshold\": 5,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.ConfusionMatrixDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"drift_pct_threshold\": 5,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.CalibrationCurveDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"n_bins\": 10,\n",
-    "        \"drift_pct_threshold\": 10,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_9__'></a>\n",
-    "\n",
-    "### Class discrimination\n",
-    "\n",
-    "The following tests assess the model's ability to effectively separate different classes in both reference and monitoring datasets. These tests analyze the model's discriminative power by examining the separation between class distributions, evaluating changes in the ROC curve characteristics, comparing probability distribution patterns, and assessing cumulative prediction trends. \n",
-    "\n",
-    "The primary objective is to identify any deterioration in the model's ability to distinguish between classes, which could indicate a decline in model effectiveness. The tests examine both the overall discriminative capability and the granular patterns in prediction distributions, providing insights into whether the model maintains its ability to effectively differentiate between classes in the production environment."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.ClassDiscriminationDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"drift_pct_threshold\": 5,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.ROCCurveDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.PredictionProbabilitiesHistogramDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"drift_pct_threshold\": 10,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.CumulativePredictionProbabilitiesDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_10__'></a>\n",
-    "\n",
-    "### Scoring\n",
-    "\n",
-    "Next we analyze the distribution and stability of credit scores across reference and monitoring datasets. These tests evaluate shifts in score distributions, examine changes in score band populations, and assess the relationship between scores and default rates. \n",
-    "\n",
-    "The primary objective is to identify any significant changes in how the model assigns credit scores, which could indicate drift in risk assessment capabilities. The tests examine both the overall score distribution patterns and the specific performance within defined score bands, providing insights into whether the model maintains consistent and reliable risk segmentation."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.ScorecardHistogramDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"score_column\": \"xgb_scores\",\n",
-    "        \"drift_pct_threshold\": 20,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.ongoing_monitoring.ScoreBandsDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"score_column\": \"xgb_scores\",\n",
-    "        \"score_bands\": [500, 540, 570],\n",
-    "        \"drift_pct_threshold\": 20,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_11__'></a>\n",
-    "\n",
-    "### Model insights"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.PermutationFeatureImportance\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": [vm_xgb_model]\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.FeaturesAUC\",\n",
-    "    input_grid={\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "        \"dataset\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.SHAPGlobalImportance\",\n",
-    "    input_grid={\n",
-    "        \"model\": [vm_xgb_model],\n",
-    "        \"dataset\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"kernel_explainer_samples\": 10,\n",
-    "        \"tree_or_linear_explainer_samples\": 200,\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_12__'></a>\n",
-    "\n",
-    "### Diagnostic monitoring"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.WeakspotsDiagnosis\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.OverfitDiagnosis\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_xgb_model,\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"cut_off_threshold\": 0.04\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_13__'></a>\n",
-    "\n",
-    "### Robustness monitoring"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "run_test(\n",
-    "    \"validmind.model_validation.sklearn.RobustnessDiagnosis\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
-    "        \"model\": vm_xgb_model,\n",
-    "    },\n",
-    "    params={\n",
-    "        \"scaling_factor_std_dev_list\": [\n",
-    "            0.1,\n",
-    "            0.2,\n",
-    "            0.3,\n",
-    "            0.4,\n",
-    "            0.5\n",
-    "        ],\n",
-    "        \"performance_decay_threshold\": 0.05\n",
-    "    }\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_14__'></a>\n",
-    "\n",
-    "### Performance history\n",
-    "\n",
-    "In this section we showcase how to track and visualize the temporal evolution of key model performance metrics, including AUC, F1 score, precision, recall, and accuracy. For demonstration purposes, the section simulates historical performance data by introducing a gradual downward trend and random noise to these metrics over a specified time period. These tests are useful for analyzing the stability and trends in model performance indicators, helping to identify potential degradation or unexpected fluctuations in model behavior over time. \n",
-    "\n",
-    "The main goal is to maintain a continuous record of model performance that can be used to detect gradual drift, sudden changes, or cyclical patterns in model effectiveness. This temporal monitoring approach provides early warning signals of potential issues and helps establish whether the model maintains consistent performance within acceptable boundaries throughout its deployment period."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "metrics = [metric for metric in list_metrics() if \"classification\" in metric]\n",
-    "\n",
-    "for metric_id in metrics:\n",
-    "    describe_metric(metric_id)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_metric(\n",
-    "    \"validmind.unit_metrics.classification.ROC_AUC\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_xgb_model,\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    },\n",
-    ")\n",
-    "auc = result.metric"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_metric(\n",
-    "    \"validmind.unit_metrics.classification.Accuracy\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_xgb_model,\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    },\n",
-    ")\n",
-    "accuracy = result.metric"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "result = run_metric(\n",
-    "    \"validmind.unit_metrics.classification.Recall\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_xgb_model,\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    },\n",
-    ")\n",
-    "recall = result.metric"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "f1 = run_metric(\n",
-    "    \"validmind.unit_metrics.classification.F1\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_xgb_model,\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    },\n",
-    ")\n",
-    "f1 = result.metric"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "precision = run_metric(\n",
-    "    \"validmind.unit_metrics.classification.Precision\",\n",
-    "    inputs={\n",
-    "        \"model\": vm_xgb_model,\n",
-    "        \"dataset\": vm_monitoring_ds,\n",
-    "    },\n",
-    ")\n",
-    "precision = result.metric"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "NUM_DAYS = 10\n",
-    "REFERENCE_DATE = datetime(2024, 1, 1)  # Fixed date: January 1st, 2024\n",
-    "base_date = REFERENCE_DATE - timedelta(days=NUM_DAYS)\n",
-    "\n",
-    "\n",
-    "# Initial values\n",
-    "performance_metrics = {\n",
-    "    \"AUC Score\": auc,\n",
-    "    \"F1 Score\": f1,\n",
-    "    \"Precision Score\": precision,\n",
-    "    \"Recall Score\": recall,\n",
-    "    \"Accuracy Score\": accuracy\n",
-    "}\n",
-    "\n",
-    "# Trend parameters\n",
-    "trend_factor = 0.98  # Slight downward trend (multiply by 0.98 each step)\n",
-    "noise_scale = 0.02   # Random fluctuation of ±2%\n",
-    "\n",
-    "\n",
-    "for i in range(NUM_DAYS):\n",
-    "    recorded_at = base_date + timedelta(days=i)\n",
-    "    print(f\"\\nrecorded_at: {recorded_at}\")\n",
-    "\n",
-    "    # Log each metric with trend and noise\n",
-    "    for metric_name, base_value in performance_metrics.items():\n",
-    "        # Apply trend and add random noise\n",
-    "        trend = base_value * (trend_factor ** i)\n",
-    "        noise = np.random.normal(0, noise_scale * base_value)\n",
-    "        value = max(0, min(1, trend + noise))  # Ensure value stays between 0 and 1\n",
-    "        \n",
-    "        log_metric(\n",
-    "            key=metric_name,\n",
-    "            value=value,\n",
-    "            recorded_at=recorded_at.isoformat()\n",
-    "        )\n",
-    "        \n",
-    "        print(f\"{metric_name:<15}: {value:.4f}\")\n"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-7d1a3b9bebaf43cdb331352abb7456af",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "validmind-eEL8LtKG-py3.10",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Ongoing Monitoring for Application Scorecard\n",
+        "\n",
+        "In this notebook, you'll learn how to seamlessly monitor your production models using the ValidMind Platform.\n",
+        "\n",
+        "We'll walk you through the process of initializing the ValidMind Library, loading a sample dataset and model, and running a monitoring test suite to quickly generate documentation about your new data and model."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply monitoring report template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Preview the monitoring report template](#toc2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_4__)    \n",
+        "  - [Preview the monitoring template](#toc2_5__)    \n",
+        "- [Load the reference and monitoring datasets](#toc3__)    \n",
+        "- [Train the model](#toc4__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc4_1__)    \n",
+        "  - [Initialize the ValidMind model](#toc4_2__)    \n",
+        "  - [Assign prediction values and probabilities to the datasets](#toc4_3__)    \n",
+        "  - [Compute credit risk scores](#toc4_4__)    \n",
+        "  - [Adding custom context to the LLM descriptions](#toc4_5__)    \n",
+        "  - [Monitoring data description](#toc4_6__)    \n",
+        "  - [Target and feature drift](#toc4_7__)    \n",
+        "  - [Classification accuracy](#toc4_8__)    \n",
+        "  - [Class discrimination](#toc4_9__)    \n",
+        "  - [Scoring](#toc4_10__)    \n",
+        "  - [Model insights](#toc4_11__)    \n",
+        "  - [Diagnostic monitoring](#toc4_12__)    \n",
+        "  - [Robustness monitoring](#toc4_13__)    \n",
+        "  - [Performance history](#toc4_14__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation, validation, and monitoring tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook, but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**ongoing monitoring report**: A comprehensive and structured periodic report assessing the record's performance and compliance over time, ensuring it remains valid under changing conditions. Monitoring includes key elements such as data sources, inputs, performance metrics, and periodic evaluations, ensuring transparency and visibility of the record's performance in the production environment.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**monitoring template, monitoring report template**: A default ValidMind document template that serves as a standardized framework for ongoing monitoring, including sections designated for test results, performance metrics, and drift analyses. By outlining required monitoring checks and expected routine tests, monitoring templates ensure consistency and completeness across monitoring reports and help guide owners through a systematic monitoring process while promoting early detection of performance degradation.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply monitoring report template\n",
+        "\n",
+        "Once you've registered your model, let's select a monitoring report template. A template predefines sections for your monitoring report and provides a general outline to follow, making the monitoring process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Monitoring**.\n",
+        "\n",
+        "    If you cannot locate your Monitoring document, make sure Monitoring-type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Ongoing Monitoring for Classification Models`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, select **Getting Started**, then select `Monitoring` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"monitoring\",\n",
+        "    monitoring = True,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Preview the monitoring report template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import xgboost as xgb\n",
+        "import numpy as np\n",
+        "\n",
+        "from datetime import datetime, timedelta\n",
+        "\n",
+        "from validmind.tests import run_test\n",
+        "from validmind.datasets.credit_risk import lending_club\n",
+        "from validmind.unit_metrics import list_metrics\n",
+        "from validmind.unit_metrics import describe_metric\n",
+        "from validmind.unit_metrics import run_metric\n",
+        "from validmind.api_client import log_metric\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_5__'></a>\n",
+        "\n",
+        "### Preview the monitoring template\n",
+        "\n",
+        "A template predefines sections for your monitoring documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "You will upload documentation and test results into this template later on. For now, take a look at the structure that the template provides with the `vm.preview_template()` function from the ValidMind library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the reference and monitoring datasets\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind library. For demonstration purposes, we'll use the training and test dataset splits as the `reference` and `monitoring` datasets, respectively."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "df = lending_club.load_data(source=\"offline\")\n",
+        "df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "preprocess_df = lending_club.preprocess(df)\n",
+        "preprocess_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "fe_df = lending_club.feature_engineering(preprocess_df)\n",
+        "fe_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Train the model\n",
+        "\n",
+        "In this section, we focus on constructing and refining our predictive model. \n",
+        "- We begin by dividing our data, which is based on Weight of Evidence (WoE) features, into training and testing sets (`train_df`, `test_df`). \n",
+        "- With `lending_club.split`, we employ a simple random split, randomly allocating data points to each set to ensure a mix of examples in both."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Split the data\n",
+        "train_df, test_df = lending_club.split(fe_df, test_size=0.2)\n",
+        "\n",
+        "x_train = train_df.drop(lending_club.target_column, axis=1)\n",
+        "y_train = train_df[lending_club.target_column]\n",
+        "\n",
+        "x_test = test_df.drop(lending_club.target_column, axis=1)\n",
+        "y_test = test_df[lending_club.target_column]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Define the XGBoost model\n",
+        "xgb_model = xgb.XGBClassifier(\n",
+        "    n_estimators=50, \n",
+        "    random_state=42, \n",
+        "    early_stopping_rounds=10\n",
+        ")\n",
+        "xgb_model.set_params(\n",
+        "    eval_metric=[\"error\", \"logloss\", \"auc\"],\n",
+        ")\n",
+        "\n",
+        "# Fit the model\n",
+        "xgb_model.fit(\n",
+        "    x_train, \n",
+        "    y_train,\n",
+        "    eval_set=[(x_test, y_test)],\n",
+        "    verbose=False\n",
+        ")\n",
+        "\n",
+        "# Compute probabilities\n",
+        "train_xgb_prob = xgb_model.predict_proba(x_train)[:, 1]\n",
+        "test_xgb_prob = xgb_model.predict_proba(x_test)[:, 1]\n",
+        "\n",
+        "# Compute binary predictions\n",
+        "cut_off_threshold = 0.3\n",
+        "train_xgb_binary_predictions = (train_xgb_prob > cut_off_threshold).astype(int)\n",
+        "test_xgb_binary_predictions = (test_xgb_prob > cut_off_threshold).astype(int)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset` — The raw dataset that you want to provide as input to tests.\n",
+        "- `input_id` — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- `target_column` — A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
+        "\n",
+        "With all datasets ready, you can now initialize the reference (training) and monitoring (test) datasets (`train_df` and `test_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_reference_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"reference_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_monitoring_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    input_id=\"monitoring_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind model\n",
+        "\n",
+        "You will also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_xgb_model = vm.init_model(\n",
+        "    xgb_model,\n",
+        "    input_id=\"xgb_model\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Assign prediction values and probabilities to the datasets\n",
+        "\n",
+        "With our model now trained, we'll move on to assigning both the predictive probabilities coming directly from the model's predictions, and the binary prediction after applying the cutoff threshold described in the previous steps. \n",
+        "- These tasks are achieved through the use of the `assign_predictions()` method associated with the VM `dataset` object.\n",
+        "- This method links the model's class prediction values and probabilities to our VM reference and monitoring datasets (`vm_reference_ds` and `vm_monitoring_ds`)."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_reference_ds.assign_predictions(\n",
+        "    model=vm_xgb_model,\n",
+        "    prediction_values=train_xgb_binary_predictions,\n",
+        "    prediction_probabilities=train_xgb_prob,\n",
+        ")\n",
+        "\n",
+        "vm_monitoring_ds.assign_predictions(\n",
+        "    model=vm_xgb_model,\n",
+        "    prediction_values=test_xgb_binary_predictions,\n",
+        "    prediction_probabilities=test_xgb_prob,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4__'></a>\n",
+        "\n",
+        "### Compute credit risk scores\n",
+        "\n",
+        "In this phase, we translate model predictions into actionable scores using probability estimates generated by our trained model."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "train_xgb_scores = lending_club.compute_scores(train_xgb_prob)\n",
+        "test_xgb_scores = lending_club.compute_scores(test_xgb_prob)\n",
+        "\n",
+        "# Assign scores to the datasets\n",
+        "vm_reference_ds.add_extra_column(\"xgb_scores\", train_xgb_scores)\n",
+        "vm_monitoring_ds.add_extra_column(\"xgb_scores\", test_xgb_scores)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_5__'></a>\n",
+        "\n",
+        "### Adding custom context to the LLM descriptions\n",
+        "\n",
+        "To add custom context to the LLM-generated test descriptions, set the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED` environment variable to `1`, then provide your context text in the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT` environment variable. This context is used to provide additional guidance to the LLM descriptions. This is a global setting that will affect all tests."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import os\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\"\n",
+        "\n",
+        "context = \"\"\"\n",
+        "FORMAT FOR THE LLM DESCRIPTIONS: \n",
+        "    **<Test Name>** is designed to <begin with a concise overview of what the test does and its primary purpose, \n",
+        "    extracted from the test description>.\n",
+        "\n",
+        "    The test operates by <write a paragraph about the test mechanism, explaining how it works and what it measures. \n",
+        "    Include any relevant formulas or methodologies mentioned in the test description.>\n",
+        "\n",
+        "    The primary advantages of this test include <write a paragraph about the test's strengths and capabilities, \n",
+        "    highlighting what makes it particularly useful for specific scenarios.>\n",
+        "\n",
+        "    Users should be aware that <write a paragraph about the test's limitations and potential risks. \n",
+        "    Include both technical limitations and interpretation challenges. \n",
+        "    If the test description includes specific signs of high risk, incorporate these here.>\n",
+        "\n",
+        "    **Key Insights:**\n",
+        "\n",
+        "    The test results reveal:\n",
+        "\n",
+        "    - **<insight title>**: <comprehensive description of one aspect of the results>\n",
+        "    - **<insight title>**: <comprehensive description of another aspect>\n",
+        "    ...\n",
+        "\n",
+        "    Based on these results, <conclude with a brief paragraph that ties together the test results with the test's \n",
+        "    purpose and provides any final recommendations or considerations.>\n",
+        "\n",
+        "ADDITIONAL INSTRUCTIONS:\n",
+        "    Present insights in order from general to specific, with each insight as a single bullet point with bold title.\n",
+        "\n",
+        "    For each metric in the test results, include in the test overview:\n",
+        "    - The metric's purpose and what it measures\n",
+        "    - Its mathematical formula\n",
+        "    - The range of possible values\n",
+        "    - What constitutes good/bad performance\n",
+        "    - How to interpret different values\n",
+        "\n",
+        "    Each insight should progressively cover:\n",
+        "    1. Overall scope and distribution\n",
+        "    2. Complete breakdown of all elements with specific values\n",
+        "    3. Natural groupings and patterns\n",
+        "    4. Comparative analysis between datasets/categories\n",
+        "    5. Stability and variations\n",
+        "    6. Notable relationships or dependencies\n",
+        "\n",
+        "    Remember:\n",
+        "    - Keep all insights at the same level (no sub-bullets or nested structures)\n",
+        "    - Make each insight complete and self-contained\n",
+        "    - Include specific numerical values and ranges\n",
+        "    - Cover all elements in the results comprehensively\n",
+        "    - Maintain clear, concise language\n",
+        "    - Use only \"- **Title**: Description\" format for insights\n",
+        "    - Progress naturally from general to specific observations\n",
+        "\n",
+        "\"\"\".strip()\n",
+        "\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT\"] = context"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_6__'></a>\n",
+        "\n",
+        "### Monitoring data description\n",
+        "\n",
+        "The Monitoring Data Description tests aim to provide a comprehensive statistical analysis of the monitoring dataset's characteristics. These tests examine the basic statistical properties, identify any missing data patterns, assess data uniqueness, visualize numerical feature distributions, and evaluate feature relationships through correlation analysis.\n",
+        "\n",
+        "The primary objective is to establish a baseline understanding of the monitoring data's structure and quality, enabling the detection of any significant deviations from expected patterns that could impact model performance. Each test is designed to capture different aspects of the data, from univariate statistics to multivariate relationships, providing a foundation for ongoing data quality assessment in the production environment."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.DescriptiveStatistics:monitoring_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.MissingValues:monitoring_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percentage_threshold\": 1\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.UniqueRows:monitoring_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"min_percent_threshold\": 1\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.TabularNumericalHistograms:monitoring_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.PearsonCorrelationMatrix:monitoring_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.data_validation.HighPearsonCorrelation:monitoring_data\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"feature_columns\": vm_monitoring_ds.feature_columns,\n",
+        "        \"max_threshold\": 0.5,\n",
+        "        \"top_n_correlations\": 10\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.ClassImbalanceDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"drift_pct_threshold\": 1\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_7__'></a>\n",
+        "\n",
+        "### Target and feature drift\n",
+        "\n",
+        "Next, the goal is to investigate the distributional characteristics of predictions and features to determine if the underlying data has changed. These tests are crucial for assessing the expected accuracy of the model.\n",
+        "\n",
+        "1. **Target drift:** We compare the dataset used for testing (reference data) with the monitoring data. This helps to identify any shifts in the target variable distribution.\n",
+        "2. **Feature drift:** We compare the training dataset with the monitoring data. Since features were used to train the model, any drift in these features could indicate potential issues, as the underlying patterns that the model was trained on may have changed."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Next, we can examine the correlation between features and predictions. Significant changes in these correlations may trigger a deeper assessment."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.PopulationStabilityIndex\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.TargetPredictionDistributionPlot\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"drift_pct_threshold\": 5\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now we want to see the difference in correlation pairs between model predictions and features."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.PredictionCorrelation\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"drift_pct_threshold\": 5\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Finally, for target drift, let's plot each prediction value and feature grid side by side."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.PredictionQuantilesAcrossFeatures\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Next, let's run a test to investigate whether, and how, the features have drifted. In this instance, we want to compare the training data with the monitoring data."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.FeatureDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"psi_threshold\": 0.2,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_8__'></a>\n",
+        "\n",
+        "### Classification accuracy\n",
+        "\n",
+        "We now evaluate the model's predictive performance by comparing its behavior between reference and monitoring datasets. These tests analyze shifts in overall accuracy metrics, examine changes in the confusion matrix to identify specific classification pattern changes, and assess the model's probability calibration across different prediction thresholds. \n",
+        "\n",
+        "The primary objective is to detect any degradation in the model's classification performance that might indicate reliability issues in production. The tests provide both aggregate performance metrics and detailed breakdowns of prediction patterns, enabling the identification of specific areas where the model's accuracy might be deteriorating."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.ClassificationAccuracyDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"drift_pct_threshold\": 5,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.ConfusionMatrixDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"drift_pct_threshold\": 5,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.CalibrationCurveDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"n_bins\": 10,\n",
+        "        \"drift_pct_threshold\": 10,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_9__'></a>\n",
+        "\n",
+        "### Class discrimination\n",
+        "\n",
+        "The following tests assess the model's ability to effectively separate different classes in both reference and monitoring datasets. These tests analyze the model's discriminative power by examining the separation between class distributions, evaluating changes in the ROC curve characteristics, comparing probability distribution patterns, and assessing cumulative prediction trends. \n",
+        "\n",
+        "The primary objective is to identify any deterioration in the model's ability to distinguish between classes, which could indicate a decline in model effectiveness. The tests examine both the overall discriminative capability and the granular patterns in prediction distributions, providing insights into whether the model maintains its ability to effectively differentiate between classes in the production environment."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.ClassDiscriminationDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"drift_pct_threshold\": 5,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.ROCCurveDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.PredictionProbabilitiesHistogramDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"drift_pct_threshold\": 10,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.CumulativePredictionProbabilitiesDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_10__'></a>\n",
+        "\n",
+        "### Scoring\n",
+        "\n",
+        "Next we analyze the distribution and stability of credit scores across reference and monitoring datasets. These tests evaluate shifts in score distributions, examine changes in score band populations, and assess the relationship between scores and default rates. \n",
+        "\n",
+        "The primary objective is to identify any significant changes in how the model assigns credit scores, which could indicate drift in risk assessment capabilities. The tests examine both the overall score distribution patterns and the specific performance within defined score bands, providing insights into whether the model maintains consistent and reliable risk segmentation."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.ScorecardHistogramDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"score_column\": \"xgb_scores\",\n",
+        "        \"drift_pct_threshold\": 20,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.ongoing_monitoring.ScoreBandsDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"score_column\": \"xgb_scores\",\n",
+        "        \"score_bands\": [500, 540, 570],\n",
+        "        \"drift_pct_threshold\": 20,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_11__'></a>\n",
+        "\n",
+        "### Model insights"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.PermutationFeatureImportance\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": [vm_xgb_model]\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.FeaturesAUC\",\n",
+        "    input_grid={\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "        \"dataset\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.SHAPGlobalImportance\",\n",
+        "    input_grid={\n",
+        "        \"model\": [vm_xgb_model],\n",
+        "        \"dataset\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"kernel_explainer_samples\": 10,\n",
+        "        \"tree_or_linear_explainer_samples\": 200,\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_12__'></a>\n",
+        "\n",
+        "### Diagnostic monitoring"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.WeakspotsDiagnosis\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.OverfitDiagnosis\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_xgb_model,\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"cut_off_threshold\": 0.04\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_13__'></a>\n",
+        "\n",
+        "### Robustness monitoring"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "run_test(\n",
+        "    \"validmind.model_validation.sklearn.RobustnessDiagnosis\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitoring_ds],\n",
+        "        \"model\": vm_xgb_model,\n",
+        "    },\n",
+        "    params={\n",
+        "        \"scaling_factor_std_dev_list\": [\n",
+        "            0.1,\n",
+        "            0.2,\n",
+        "            0.3,\n",
+        "            0.4,\n",
+        "            0.5\n",
+        "        ],\n",
+        "        \"performance_decay_threshold\": 0.05\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_14__'></a>\n",
+        "\n",
+        "### Performance history\n",
+        "\n",
+        "In this section we showcase how to track and visualize the temporal evolution of key model performance metrics, including AUC, F1 score, precision, recall, and accuracy. For demonstration purposes, the section simulates historical performance data by introducing a gradual downward trend and random noise to these metrics over a specified time period. These tests are useful for analyzing the stability and trends in model performance indicators, helping to identify potential degradation or unexpected fluctuations in model behavior over time. \n",
+        "\n",
+        "The main goal is to maintain a continuous record of model performance that can be used to detect gradual drift, sudden changes, or cyclical patterns in model effectiveness. This temporal monitoring approach provides early warning signals of potential issues and helps establish whether the model maintains consistent performance within acceptable boundaries throughout its deployment period."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "metrics = [metric for metric in list_metrics() if \"classification\" in metric]\n",
+        "\n",
+        "for metric_id in metrics:\n",
+        "    describe_metric(metric_id)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_metric(\n",
+        "    \"validmind.unit_metrics.classification.ROC_AUC\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_xgb_model,\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    },\n",
+        ")\n",
+        "auc = result.metric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_metric(\n",
+        "    \"validmind.unit_metrics.classification.Accuracy\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_xgb_model,\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    },\n",
+        ")\n",
+        "accuracy = result.metric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_metric(\n",
+        "    \"validmind.unit_metrics.classification.Recall\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_xgb_model,\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    },\n",
+        ")\n",
+        "recall = result.metric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_metric(\n",
+        "    \"validmind.unit_metrics.classification.F1\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_xgb_model,\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    },\n",
+        ")\n",
+        "f1 = result.metric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = run_metric(\n",
+        "    \"validmind.unit_metrics.classification.Precision\",\n",
+        "    inputs={\n",
+        "        \"model\": vm_xgb_model,\n",
+        "        \"dataset\": vm_monitoring_ds,\n",
+        "    },\n",
+        ")\n",
+        "precision = result.metric"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "NUM_DAYS = 10\n",
+        "REFERENCE_DATE = datetime(2024, 1, 1)  # Fixed date: January 1st, 2024\n",
+        "base_date = REFERENCE_DATE - timedelta(days=NUM_DAYS)\n",
+        "\n",
+        "\n",
+        "# Initial values\n",
+        "performance_metrics = {\n",
+        "    \"AUC Score\": auc,\n",
+        "    \"F1 Score\": f1,\n",
+        "    \"Precision Score\": precision,\n",
+        "    \"Recall Score\": recall,\n",
+        "    \"Accuracy Score\": accuracy\n",
+        "}\n",
+        "\n",
+        "# Trend parameters\n",
+        "trend_factor = 0.98  # Slight downward trend (multiply by 0.98 each step)\n",
+        "noise_scale = 0.02   # Gaussian noise with a standard deviation of 2% of the base value\n",
+        "\n",
+        "\n",
+        "for i in range(NUM_DAYS):\n",
+        "    recorded_at = base_date + timedelta(days=i)\n",
+        "    print(f\"\\nrecorded_at: {recorded_at}\")\n",
+        "\n",
+        "    # Log each metric with trend and noise\n",
+        "    for metric_name, base_value in performance_metrics.items():\n",
+        "        # Apply trend and add random noise\n",
+        "        trend = base_value * (trend_factor ** i)\n",
+        "        noise = np.random.normal(0, noise_scale * base_value)\n",
+        "        value = max(0, min(1, trend + noise))  # Ensure value stays between 0 and 1\n",
+        "        \n",
+        "        log_metric(\n",
+        "            key=metric_name,\n",
+        "            value=value,\n",
+        "            recorded_at=recorded_at.isoformat()\n",
+        "        )\n",
+        "        \n",
+        "        print(f\"{metric_name:<15}: {value:.4f}\")\n"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-a1aa6fcedbed410099c3b537625ad59b"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "validmind-eEL8LtKG-py3.10",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/use_cases/ongoing_monitoring/quickstart_customer_churn_ongoing_monitoring.ipynb b/site/notebooks/use_cases/ongoing_monitoring/quickstart_customer_churn_ongoing_monitoring.ipynb
index 765be36075..9be6aa92fe 100644
--- a/site/notebooks/use_cases/ongoing_monitoring/quickstart_customer_churn_ongoing_monitoring.ipynb
+++ b/site/notebooks/use_cases/ongoing_monitoring/quickstart_customer_churn_ongoing_monitoring.ipynb
@@ -1,897 +1,914 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Quickstart for ongoing monitoring of models with ValidMind\n",
-    "\n",
-    "Welcome! In this quickstart guide, you'll learn how to seamlessly monitor your production models using the ValidMind Platform.\n",
-    "\n",
-    "We'll walk you through the process of initializing the ValidMind Library, loading a sample dataset and model, and running a monitoring test suite to quickly generate documentation about your new data and model.\n",
-    "\n",
-    "This notebook utilizes the [Bank Customer Churn Prediction](https://www.kaggle.com/code/kmalit/bank-customer-churn-prediction/data) dataset from Kaggle to train a simple classification model for demonstration purposes."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply monitoring report template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_3__)    \n",
-    "  - [Preview the monitoring report template](#toc2_4__)    \n",
-    "- [Load the reference and monitoring datasets](#toc3__)    \n",
-    "  - [Load the production model](#toc3_1__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc3_2__)    \n",
-    "  - [Initialize a model object](#toc3_3__)    \n",
-    "  - [Assign predictions to the datasets](#toc3_4__)    \n",
-    "  - [Run the ongoing monitoring tests](#toc3_5__)    \n",
-    "  - [Conduct target and feature drift testing](#toc3_6__)    \n",
-    "    - [Feature drift tests](#toc3_6_1__)    \n",
-    "  - [Model performance monitoring tests](#toc3_7__)    \n",
-    "- [Next steps](#toc4__)    \n",
-    "  - [Work with your monitoring report](#toc4_1__)    \n",
-    "  - [Discover more learning resources](#toc4_2__)    \n",
-    "- [Upgrade ValidMind](#toc5__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation, validation, monitoring tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Model monitoring report**: A comprehensive and structured record of a production model, including key elements such as data sources, inputs, performance metrics, and periodic evaluations. This documentation ensures transparency and visibility of the model's performance in the production environment.\n",
-    "\n",
-    "**Monitoring report template**: Similar to documentation template, The monitoring report template functions as a test suite and lays out the structure of model monitoring, segmented into various sections and sub-sections. Monitoring report templates define the structure of your model monitoring report, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Custom tests**: Custom tests are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom test.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom test. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply monitoring report template\n",
-    "\n",
-    "Once you've registered your model, let's select a monitoring report template. A template predefines sections for your monitoring report and provides a general outline to follow, making the monitoring process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Monitoring**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Ongoing Monitoring for Classification Models`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Monitoring` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"monitoring\",\n",
-    "    monitoring = True,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost as xgb\n",
-    "import validmind as vm\n",
-    "import pandas as pd\n",
-    "import numpy as np\n",
-    "import seaborn as sns\n",
-    "import matplotlib.pyplot as plt\n",
-    "from validmind.tests import run_test\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Preview the monitoring report template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the reference and monitoring datasets\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library. For demonstration purposes we'll use the training, test and validation dataset splits as `training`, `reference` and `monitoring` datasets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.classification import customer_churn\n",
-    "\n",
-    "raw_df = customer_churn.load_data()\n",
-    "\n",
-    "train_df, reference_df, monitor_df = customer_churn.preprocess(raw_df)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_1__'></a>\n",
-    "\n",
-    "### Load the production model\n",
-    "\n",
-    "We will also load a pre-trained model for demonstration purposes. This is a simple XGBoost model trained on the Bank Customer Churn Prediction dataset."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "import xgboost as xgb\n",
-    "\n",
-    "# Load the saved model\n",
-    "model = xgb.XGBClassifier()\n",
-    "model.load_model(\"xgboost_model.model\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset` — The raw dataset that you want to provide as input to tests.\n",
-    "- `input_id` - A unique identifier that allows tracking what inputs are used when running each individual test.\n",
-    "- `target_column` — A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
-    "- `class_labels` — An optional value to map predicted classes to class labels.\n",
-    "\n",
-    "With all datasets ready, you can now initialize training, reference(test) and monitor datasets (`train_df`, `reference_df` and `monitor_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds = vm.init_dataset(\n",
-    "    dataset=train_df,\n",
-    "    input_id=\"train_df\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_reference_ds = vm.init_dataset(\n",
-    "    dataset=reference_df,\n",
-    "    input_id=\"reference_df\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    ")\n",
-    "\n",
-    "vm_monitor_ds = vm.init_dataset(\n",
-    "    dataset=monitor_df,\n",
-    "    input_id=\"monitor_dataset\",\n",
-    "    target_column=customer_churn.target_column,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_3__'></a>\n",
-    "\n",
-    "### Initialize a model object\n",
-    "\n",
-    "Additionally, you'll need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data. You simply intialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_model = vm.init_model(\n",
-    "    model,\n",
-    "    input_id=\"model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_4__'></a>\n",
-    "\n",
-    "### Assign predictions to the datasets\n",
-    "\n",
-    "We can now use the `assign_predictions()` method from the Dataset object to link existing predictions to any model. If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")\n",
-    "\n",
-    "vm_reference_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")\n",
-    "\n",
-    "vm_monitor_ds.assign_predictions(\n",
-    "    model=vm_model,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_5__'></a>\n",
-    "\n",
-    "### Run the ongoing monitoring tests\n",
-    "\n",
-    "Before we start the testing procedure, let's take a look at the expected tests that are pre-configured:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test_list = vm.get_test_suite().get_default_config()\n",
-    "for l in test_list:\n",
-    "    print(l)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let's run the first test in the list. Note that you can use `vm.tests.describe_test()` to get information about the inputs required for the test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.describe_test(\"validmind.model_validation.ModelMetadata\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "As you can see, the `ModelMetadata` only requires a model input. Let's run the test and log the results into the monitoring document with the `.log()` method:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test_result = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.ModelMetadata\",\n",
-    "    model=vm_model,\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Let's run the tests needed to determine data quality of the monitoring dataset:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "data_qual = vm.get_test_suite(\n",
-    "    section=\"prediction_data_description\"\n",
-    ").get_default_config()\n",
-    "\n",
-    "# Run all of the necessary data quality checks where the monitoring dataset is the basis\n",
-    "for l in data_qual:\n",
-    "    vm.tests.run_test(\n",
-    "        l,\n",
-    "        inputs={\"dataset\": vm_monitor_ds},\n",
-    "        show=False,\n",
-    "    ).log()\n",
-    "    print(\"Completed test: {0}\".format(l))"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "To view the results of the model metadata and data quality tests, select **Monitoring** under Documents in the left sidebar of the model in the ValidMind Platform and click on the following sections:\n",
-    "\n",
-    "- 1. Model Monitoring Overview > **1.2. Model Details**\n",
-    "- 2. Data Quality & Drift Assessment > **2.1. Prediction Data Description**"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Next, let's run *comparison tests*, which will allow comparing differences between the training dataset and monitoring datasets. To run a test in comparison mode, you only need to pass an `input_grid` parameter to the `run_test()` method instead of `inputs`.\n",
-    "\n",
-    "For more information about comparison tests, see this [notebook](../../how_to/tests/run_tests/2_run_comparison_tests.ipynb)."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "correlation_tests = [\n",
-    "    \"validmind.data_validation.PearsonCorrelationMatrix:train_vs_test\",\n",
-    "    \"validmind.data_validation.HighPearsonCorrelation:train_vs_test\",\n",
-    "]\n",
-    "\n",
-    "for test in correlation_tests:\n",
-    "    vm.tests.run_test(\n",
-    "        test,\n",
-    "        input_grid={\n",
-    "            \"dataset\": [vm_train_ds, vm_monitor_ds],\n",
-    "            \"model\": [vm_model],\n",
-    "        },\n",
-    "        show=False,\n",
-    "    ).log()\n",
-    "    print(\"Completed test {0}\".format(test))"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You can view these results in the ValidMind Platform in **Ongoing Monitoring** within Documents under the following section:\n",
-    "\n",
-    "- 2. Data Quality & Drift Assessment > **2.2. Prediction Data Correlations and Interactions**"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_6__'></a>\n",
-    "\n",
-    "### Conduct target and feature drift testing\n",
-    "\n",
-    "Next, the goal is to investigate the distributional characteristics of predictions and features to determine if the underlying data has changed. These tests are crucial for assessing the expected accuracy of the model.\n",
-    "\n",
-    "1. **Target drift:** We compare the dataset used for testing (reference data) with the monitoring data. This helps to identify any shifts in the target variable distribution.\n",
-    "2. **Feature drift:** We compare the training dataset with the monitoring data. Since features were used to train the model, any drift in these features could indicate potential issues, as the underlying patterns that the model was trained on may have changed."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "In the 2. Data Quality & Drift Assessment > **2.3 Target Drift** section we can confirm only there is only one pre-configured test:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for l in vm.get_test_suite(section=\"comparison_data_target\").get_default_config():\n",
-    "    print(l)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "As part of running the rest of the tests, we will directly log the results to a section when calling the `.log()` method."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "First, let's run the *Population Stability Index (PSI)* for predictions. In this case, we want to compare the test data with the monitoring data. (Note: For predictions, the training data is irrelevant.)"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.PopulationStabilityIndex\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitor_ds],\n",
-    "        \"model\": vm_model,\n",
-    "    },\n",
-    "    show=False,\n",
-    ").log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Next, we can examine the correlation between features and predictions. Significant changes in these correlations may trigger a deeper assessment."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.ongoing_monitoring.TargetPredictionDistributionPlot\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitor_ds],\n",
-    "        \"model\": vm_model,\n",
-    "    },\n",
-    "    show=False,\n",
-    ").log(section_id=\"comparison_data_target\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now we want see difference in correlation pairs between model prediction and features."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.ongoing_monitoring.PredictionCorrelation\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitor_ds],\n",
-    "        \"model\": vm_model,\n",
-    "    },\n",
-    "    show=False,\n",
-    ").log(section_id=\"comparison_data_target\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Finally for target drift, let's plot each prediction value and feature grid side by side."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.ongoing_monitoring.PredictionAcrossEachFeature\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitor_ds],\n",
-    "        \"model\": vm_model,\n",
-    "    },\n",
-    "    show=False,\n",
-    ").log(section_id=\"comparison_data_target\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_6_1__'></a>\n",
-    "\n",
-    "#### Feature drift tests\n",
-    "\n",
-    "Next, let's add run a test to investigate how or if the features have drifted. In this instance we want to compare the training data with prediction data. These results will be logged in the 2. Data Quality & Drift Assessment > **2.4. Feature Drift** section."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.tests.run_test(\n",
-    "    \"validmind.ongoing_monitoring.FeatureDrift\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [vm_reference_ds, vm_monitor_ds],\n",
-    "        \"model\": vm_model,\n",
-    "    },\n",
-    "    show=False,\n",
-    ").log(section_id=\"comparison_data_feature\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3_7__'></a>\n",
-    "\n",
-    "### Model performance monitoring tests\n",
-    "\n",
-    "Let's wrap up by monitoring the model's performance. Keep in mind that in some cases, it may not be possible to determine accuracy if the ground truth is unavailable. If this is the case, you can skip this test and instead focus on target and feature drift to inform the model owners.\n",
-    "\n",
-    "The pre-configured tests for model performance are:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "for l in vm.get_test_suite(section=\"model_performance_monitoring\").get_default_config():\n",
-    "    print(l)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "The code below will run the tests and log the results into the monitoring document for each of the tests. Note the use of `input_grid` again, which is required for comparison tests:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Use the reference dataset vs monitoring dataset - the true comparison of accuracy\n",
-    "for test in vm.get_test_suite(\n",
-    "    section=\"model_performance_monitoring\"\n",
-    ").get_default_config():\n",
-    "    if test == \"validmind.model_validation.statsmodels.GINITable\":\n",
-    "        vm.tests.run_test(\n",
-    "            \"validmind.model_validation.statsmodels.GINITable\",\n",
-    "            input_grid={\n",
-    "                \"dataset\": [vm_reference_ds, vm_monitor_ds],\n",
-    "                \"model\": [vm_model],\n",
-    "            },\n",
-    "            show=False,\n",
-    "        ).log()\n",
-    "    else:\n",
-    "        vm.tests.run_test(\n",
-    "            test,\n",
-    "            input_grid={\n",
-    "                \"dataset\": [vm_reference_ds, vm_monitor_ds],\n",
-    "                \"model\": [vm_model],\n",
-    "            },\n",
-    "            show=False,\n",
-    "        ).log()\n",
-    "    print(\"Completed test: {0}\".format(test))"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your monitoring report.\n",
-    "\n",
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Work with your monitoring report\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Monitoring** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your monitoring report in a more easily consumable version. From here, you can make qualitative edits to monitoring reports, view guidelines, review monitoring results, and submit your monitoring report for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/monitoring/ongoing-monitoring.html)\n",
-    "\n",
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-336984df36024986aa3efd6a4079956f",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "colab": {
-   "provenance": []
-  },
-  "gpuClass": "standard",
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 4
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Quickstart for ongoing monitoring of models with ValidMind\n",
+        "\n",
+        "Welcome! In this quickstart guide, you'll learn how to seamlessly monitor your production models using the ValidMind Platform.\n",
+        "\n",
+        "We'll walk you through the process of initializing the ValidMind Library, loading a sample dataset and model, and running a monitoring test suite to quickly generate documentation about your new data and model.\n",
+        "\n",
+        "This notebook utilizes the [Bank Customer Churn Prediction](https://www.kaggle.com/code/kmalit/bank-customer-churn-prediction/data) dataset from Kaggle to train a simple classification model for demonstration purposes."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply monitoring report template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_3__)    \n",
+        "  - [Preview the monitoring report template](#toc2_4__)    \n",
+        "- [Load the reference and monitoring datasets](#toc3__)    \n",
+        "  - [Load the production model](#toc3_1__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc3_2__)    \n",
+        "  - [Initialize the ValidMind model](#toc3_3__)    \n",
+        "  - [Assign predictions to the datasets](#toc3_4__)    \n",
+        "  - [Run the ongoing monitoring tests](#toc3_5__)    \n",
+        "  - [Conduct target and feature drift testing](#toc3_6__)    \n",
+        "    - [Feature drift tests](#toc3_6_1__)    \n",
+        "  - [Model performance monitoring tests](#toc3_7__)    \n",
+        "- [Next steps](#toc4__)    \n",
+        "  - [Work with your monitoring report](#toc4_1__)    \n",
+        "  - [Discover more learning resources](#toc4_2__)    \n",
+        "- [Upgrade ValidMind](#toc5__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation, validation, and monitoring tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook, but we recommend further familiarizing yourself with the language.\n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br><br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**ongoing monitoring report**: A comprehensive and structured periodic report assessing the record's performance and compliance over time, ensuring it remains valid under changing conditions. Monitoring includes key elements such as data sources, inputs, performance metrics, and periodic evaluations, ensuring transparency and visibility of the record's performance in the production environment.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**monitoring template, monitoring report template**: A default ValidMind document template that serves as a standardized framework for ongoing monitoring, including sections designated for test results, performance metrics, and drift analyses. By outlining required monitoring checks and expected routine tests, monitoring templates ensure consistency and completeness across monitoring reports and help guide owners through a systematic monitoring process while promoting early detection of performance degradation.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply monitoring report template\n",
+        "\n",
+        "Once you've registered your model, let's select a monitoring report template. A template predefines sections for your monitoring report and provides a general outline to follow, making the monitoring process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Monitoring**.\n",
+        "\n",
+        "    If you cannot locate your Monitoring document, make sure Monitoring type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Ongoing Monitoring for Classification Models`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, select **Getting Started**, then select `Monitoring` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"monitoring\",\n",
+        "    monitoring = True,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import xgboost as xgb\n",
+        "import validmind as vm\n",
+        "import pandas as pd\n",
+        "import numpy as np\n",
+        "import seaborn as sns\n",
+        "import matplotlib.pyplot as plt\n",
+        "from validmind.tests import run_test\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Preview the monitoring report template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the reference and monitoring datasets\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind Library. For demonstration purposes, we'll use the training, test, and validation dataset splits as the `training`, `reference`, and `monitoring` datasets, respectively."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.datasets.classification import customer_churn\n",
+        "\n",
+        "raw_df = customer_churn.load_data()\n",
+        "\n",
+        "train_df, reference_df, monitor_df = customer_churn.preprocess(raw_df)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Load the production model\n",
+        "\n",
+        "We will also load a pre-trained model for demonstration purposes. This is a simple XGBoost model trained on the Bank Customer Churn Prediction dataset."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import xgboost as xgb\n",
+        "\n",
+        "# Load the saved model\n",
+        "model = xgb.XGBClassifier()\n",
+        "model.load_model(\"xgboost_model.model\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset` — The raw dataset that you want to provide as input to tests.\n",
+        "- `input_id` — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- `target_column` — A required argument if tests require access to true values. This is the name of the target column in the dataset.\n",
+        "- `class_labels` — An optional value to map predicted classes to class labels.\n",
+        "\n",
+        "With all datasets ready, you can now initialize the training, reference (test), and monitoring datasets (`train_df`, `reference_df` and `monitor_df`) created earlier into their own dataset objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_df\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_reference_ds = vm.init_dataset(\n",
+        "    dataset=reference_df,\n",
+        "    input_id=\"reference_df\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        ")\n",
+        "\n",
+        "vm_monitor_ds = vm.init_dataset(\n",
+        "    dataset=monitor_df,\n",
+        "    input_id=\"monitor_dataset\",\n",
+        "    target_column=customer_churn.target_column,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_3__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind model\n",
+        "\n",
+        "You'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for our model.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_model = vm.init_model(\n",
+        "    model,\n",
+        "    input_id=\"model\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_4__'></a>\n",
+        "\n",
+        "### Assign predictions to the datasets\n",
+        "\n",
+        "We can now use the `assign_predictions()` method from the Dataset object to link existing predictions to any model. If no prediction values are passed, the method will compute predictions automatically:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")\n",
+        "\n",
+        "vm_reference_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")\n",
+        "\n",
+        "vm_monitor_ds.assign_predictions(\n",
+        "    model=vm_model,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_5__'></a>\n",
+        "\n",
+        "### Run the ongoing monitoring tests\n",
+        "\n",
+        "Before we start the testing procedure, let's take a look at the expected tests that are pre-configured:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test_list = vm.get_test_suite().get_default_config()\n",
+        "for l in test_list:\n",
+        "    print(l)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's run the first test in the list. Note that you can use `vm.tests.describe_test()` to get information about the inputs required for the test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.describe_test(\"validmind.model_validation.ModelMetadata\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "As you can see, the `ModelMetadata` test only requires a model input. Let's run the test and log the results into the monitoring document with the `.log()` method:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test_result = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.ModelMetadata\",\n",
+        "    model=vm_model,\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's run the tests needed to determine data quality of the monitoring dataset:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "data_qual = vm.get_test_suite(\n",
+        "    section=\"prediction_data_description\"\n",
+        ").get_default_config()\n",
+        "\n",
+        "# Run all of the necessary data quality checks where the monitoring dataset is the basis\n",
+        "for l in data_qual:\n",
+        "    vm.tests.run_test(\n",
+        "        l,\n",
+        "        inputs={\"dataset\": vm_monitor_ds},\n",
+        "        show=False,\n",
+        "    ).log()\n",
+        "    print(\"Completed test: {0}\".format(l))"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "To view the results of the model metadata and data quality tests, select **Monitoring** under Documents in the left sidebar of the model in the ValidMind Platform and click on the following sections:\n",
+        "\n",
+        "- 1. Model Monitoring Overview > **1.2. Model Details**\n",
+        "- 2. Data Quality & Drift Assessment > **2.1. Prediction Data Description**"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Next, let's run *comparison tests*, which will allow comparing differences between the training dataset and monitoring datasets. To run a test in comparison mode, you only need to pass an `input_grid` parameter to the `run_test()` method instead of `inputs`.\n",
+        "\n",
+        "For more information about comparison tests, see this [notebook](../../how_to/tests/run_tests/2-run_comparison_tests.ipynb)."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "correlation_tests = [\n",
+        "    \"validmind.data_validation.PearsonCorrelationMatrix:train_vs_test\",\n",
+        "    \"validmind.data_validation.HighPearsonCorrelation:train_vs_test\",\n",
+        "]\n",
+        "\n",
+        "for test in correlation_tests:\n",
+        "    vm.tests.run_test(\n",
+        "        test,\n",
+        "        input_grid={\n",
+        "            \"dataset\": [vm_train_ds, vm_monitor_ds],\n",
+        "            \"model\": [vm_model],\n",
+        "        },\n",
+        "        show=False,\n",
+        "    ).log()\n",
+        "    print(\"Completed test {0}\".format(test))"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You can view these results in the ValidMind Platform in **Ongoing Monitoring** within Documents under the following section:\n",
+        "\n",
+        "- 2. Data Quality & Drift Assessment > **2.2. Prediction Data Correlations and Interactions**"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_6__'></a>\n",
+        "\n",
+        "### Conduct target and feature drift testing\n",
+        "\n",
+        "Next, the goal is to investigate the distributional characteristics of predictions and features to determine if the underlying data has changed. These tests are crucial for assessing the expected accuracy of the model.\n",
+        "\n",
+        "1. **Target drift:** We compare the dataset used for testing (reference data) with the monitoring data. This helps to identify any shifts in the target variable distribution.\n",
+        "2. **Feature drift:** We compare the training dataset with the monitoring data. Since features were used to train the model, any drift in these features could indicate potential issues, as the underlying patterns that the model was trained on may have changed."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "In the 2. Data Quality & Drift Assessment > **2.3 Target Drift** section we can confirm there is only one pre-configured test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "for l in vm.get_test_suite(section=\"comparison_data_target\").get_default_config():\n",
+        "    print(l)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "As part of running the rest of the tests, we will directly log the results to a section when calling the `.log()` method."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "First, let's run the *Population Stability Index (PSI)* for predictions. In this case, we want to compare the test data with the monitoring data. (Note: For predictions, the training data is irrelevant.)"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.PopulationStabilityIndex\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitor_ds],\n",
+        "        \"model\": vm_model,\n",
+        "    },\n",
+        "    show=False,\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Next, we can examine the correlation between features and predictions. Significant changes in these correlations may trigger a deeper assessment."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.ongoing_monitoring.TargetPredictionDistributionPlot\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitor_ds],\n",
+        "        \"model\": vm_model,\n",
+        "    },\n",
+        "    show=False,\n",
+        ").log(section_id=\"comparison_data_target\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now we want to see the difference in correlation pairs between model predictions and features."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.ongoing_monitoring.PredictionCorrelation\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitor_ds],\n",
+        "        \"model\": vm_model,\n",
+        "    },\n",
+        "    show=False,\n",
+        ").log(section_id=\"comparison_data_target\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Finally for target drift, let's plot each prediction value and feature grid side by side."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.ongoing_monitoring.PredictionAcrossEachFeature\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitor_ds],\n",
+        "        \"model\": vm_model,\n",
+        "    },\n",
+        "    show=False,\n",
+        ").log(section_id=\"comparison_data_target\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_6_1__'></a>\n",
+        "\n",
+        "#### Feature drift tests\n",
+        "\n",
+        "Next, let's run a test to investigate how or if the features have drifted. In this instance we want to compare the training data with prediction data. These results will be logged in the 2. Data Quality & Drift Assessment > **2.4. Feature Drift** section."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.ongoing_monitoring.FeatureDrift\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [vm_reference_ds, vm_monitor_ds],\n",
+        "        \"model\": vm_model,\n",
+        "    },\n",
+        "    show=False,\n",
+        ").log(section_id=\"comparison_data_feature\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_7__'></a>\n",
+        "\n",
+        "### Model performance monitoring tests\n",
+        "\n",
+        "Let's wrap up by monitoring the model's performance. Keep in mind that in some cases, it may not be possible to determine accuracy if the ground truth is unavailable. If this is the case, you can skip this test and instead focus on target and feature drift to inform the model owners.\n",
+        "\n",
+        "The pre-configured tests for model performance are:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "for l in vm.get_test_suite(section=\"model_performance_monitoring\").get_default_config():\n",
+        "    print(l)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "The code below will run the tests and log the results into the monitoring document for each of the tests. Note the use of `input_grid` again, which is required for comparison tests:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Use the reference dataset vs monitoring dataset - the true comparison of accuracy\n",
+        "for test in vm.get_test_suite(\n",
+        "    section=\"model_performance_monitoring\"\n",
+        ").get_default_config():\n",
+        "    if test == \"validmind.model_validation.statsmodels.GINITable\":\n",
+        "        vm.tests.run_test(\n",
+        "            \"validmind.model_validation.statsmodels.GINITable\",\n",
+        "            input_grid={\n",
+        "                \"dataset\": [vm_reference_ds, vm_monitor_ds],\n",
+        "                \"model\": [vm_model],\n",
+        "            },\n",
+        "            show=False,\n",
+        "        ).log()\n",
+        "    else:\n",
+        "        vm.tests.run_test(\n",
+        "            test,\n",
+        "            input_grid={\n",
+        "                \"dataset\": [vm_reference_ds, vm_monitor_ds],\n",
+        "                \"model\": [vm_model],\n",
+        "            },\n",
+        "            show=False,\n",
+        "        ).log()\n",
+        "    print(\"Completed test: {0}\".format(test))"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your monitoring report.\n",
+        "\n",
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Work with your monitoring report\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Monitoring** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your monitoring report in a more easily consumable version. From here, you can make qualitative edits to monitoring reports, view guidelines, review monitoring results, and submit your monitoring report for approval when it's ready. (**Learn more:** [Ongoing monitoring](https://docs.validmind.ai/guide/monitoring/ongoing-monitoring.html))\n",
+        "\n",
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after running the upgrade package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-06926ffb7c9846eca24d1130049d6316"
+    }
+  ],
+  "metadata": {
+    "colab": {
+      "provenance": []
+    },
+    "gpuClass": "standard",
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 4
 }
diff --git a/site/notebooks/use_cases/regression/quickstart_regression_full_suite.ipynb b/site/notebooks/use_cases/regression/quickstart_regression_full_suite.ipynb
index 55a3854a1f..466da8019c 100644
--- a/site/notebooks/use_cases/regression/quickstart_regression_full_suite.ipynb
+++ b/site/notebooks/use_cases/regression/quickstart_regression_full_suite.ipynb
@@ -35,11 +35,11 @@
     "- [Document the model](#toc5__)    \n",
     "  - [Prepocess the raw dataset](#toc5_1__)    \n",
     "  - [Initialize the ValidMind datasets](#toc5_2__)    \n",
-    "  - [Initialize a model object](#toc5_3__)    \n",
+    "  - [Initialize the ValidMind models](#toc5_3__)    \n",
     "  - [Assign predictions to the datasets](#toc5_4__)    \n",
     "  - [Run the full suite of tests](#toc5_5__)    \n",
     "- [Next steps](#toc6__)    \n",
-    "  - [Work with your model documentation](#toc6_1__)    \n",
+    "  - [Work with your documentation](#toc6_1__)    \n",
     "  - [Discover more learning resources](#toc6_2__)    \n",
     "- [Upgrade ValidMind](#toc7__)    \n",
     "\n",
@@ -62,7 +62,9 @@
     "\n",
     "## About ValidMind\n",
     "\n",
-    "ValidMind's suite of tools enables organizations to identify, document, and manage model risks for all types of models, including AI/ML models, LLMs, and statistical models. As a model developer, you use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
+    "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+    "\n",
+    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
     "\n",
     "If this is your first time trying out ValidMind, you can make use of the following resources alongside this notebook:\n",
     "\n",
@@ -80,7 +82,7 @@
     "\n",
     "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
     "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+    "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
     "\n",
     "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
    ]
@@ -131,17 +133,19 @@
     "\n",
     "#### Register sample model\n",
     "\n",
-    "Let's first register a sample model for use with this notebook:\n",
+    "Let's first register a sample record (model) for use with this notebook:\n",
+    "\n",
+    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
     "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
+    "2. In the left sidebar, select **Inventory**.\n",
     "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
+    "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
     "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
+    "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
     "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
+    "5. Select your own name under the **RECORD OWNER** drop-down.\n",
     "\n",
-    "5. Click **Register Model** to add the model to your inventory."
+    "6. Click **Register Model** to add the model to your inventory."
    ]
   },
   {
@@ -152,10 +156,12 @@
     "\n",
     "#### Apply documentation template\n",
     "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
+    "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
     "\n",
     "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
     "\n",
+    "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+    "\n",
     "2. Under **TEMPLATE**, select `Binary classification`.\n",
     "\n",
     "3. Click **Use Template** to apply the template."
@@ -169,11 +175,13 @@
     "\n",
     "#### Get your code snippet\n",
     "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
+    "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
     "\n",
     "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+    "\n",
     "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+    "\n",
+    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
    ]
   },
   {
@@ -398,9 +406,14 @@
    "source": [
     "<a id='toc5_3__'></a>\n",
     "\n",
-    "### Initialize a model object\n",
+    "### Initialize the ValidMind models\n",
+    "\n",
+    "You'll also need to initialize ValidMind model objects (`vm_model`) that can be passed to other functions for analysis and tests on the data for our models.\n",
+    "\n",
+    "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+    "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
     "\n",
-    "Additionally, you need to initialize a ValidMind model objects (`vm_model` and `vm_model_1`) that can be passed to other functions for analysis and tests on the data. You simply intialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+    "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
    ]
   },
   {
@@ -494,13 +507,13 @@
     "\n",
     "## Next steps\n",
     "\n",
-    "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+    "You can look at the output produced by the ValidMind Library right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your documentation.\n",
     "\n",
     "<a id='toc6_1__'></a>\n",
     "\n",
-    "### Work with your model documentation\n",
+    "### Work with your documentation\n",
     "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
+    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
     "\n",
     "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
     "\n",
@@ -509,17 +522,17 @@
     "   - **2. Data Preparation**\n",
     "   - **3. Model Development**\n",
     "\n",
-    "What you can see now is a much more easily consumable version of the documentation, including the results of the tests you just performed, along with other parts of your model documentation that still need to be completed. There is a wealth of information that gets uploaded when you run the full test suite, so take a closer look around, especially at test results that might need attention (hint: some of the tests in **2.1 Data description** look like they need some attention). From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
+    "What you can see now is a much more easily consumable version of the documentation, including the results of the tests you just performed, along with other parts of your model documentation that still need to be completed. There is a wealth of information that gets uploaded when you run the full test suite, so take a closer look around, especially at test results that might need attention (hint: some of the tests in **2.1 Data description** look like they need some attention). From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
     "\n",
     "<a id='toc6_2__'></a>\n",
     "\n",
     "### Discover more learning resources\n",
     "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
+    "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
     "\n",
     "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
     "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
+    "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
     "\n",
     "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
    ]
@@ -566,7 +579,7 @@
   },
   {
    "cell_type": "markdown",
-   "id": "copyright-6eb89a7d0bbf4f2a8dd973330f359ed6",
+   "id": "copyright-8bce9bf3b74d4bb5a749dade71cae99d",
    "metadata": {},
    "source": [
     "<!-- VALIDMIND COPYRIGHT -->\n",
diff --git a/site/notebooks/use_cases/time_series/quickstart_time_series_full_suite.ipynb b/site/notebooks/use_cases/time_series/quickstart_time_series_full_suite.ipynb
index 6d712adde6..300dbfeb09 100644
--- a/site/notebooks/use_cases/time_series/quickstart_time_series_full_suite.ipynb
+++ b/site/notebooks/use_cases/time_series/quickstart_time_series_full_suite.ipynb
@@ -1,750 +1,765 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Document a time series forecasting model\n",
-    "\n",
-    "Use the [FRED](https://fred.stlouisfed.org/) sample dataset to train a simple time series model and document that model with the ValidMind Library.\n",
-    "\n",
-    "As part of the notebook, you will learn how to train a simple model while exploring how the documentation process works:\n",
-    "\n",
-    "- Initializing the ValidMind Library\n",
-    "- Loading a sample dataset provided by the library to train a simple time series model\n",
-    "- Running a ValidMind test suite to quickly generate documentation about the data and model"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_4__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "- [Document the model](#toc4__)    \n",
-    "  - [Prepocess the raw dataset](#toc4_1__)    \n",
-    "  - [Train random forests and gradient boosting regressor models](#toc4_2__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc4_3__)    \n",
-    "  - [Initialize the model objects](#toc4_4__)    \n",
-    "  - [Assign predictions to the datasets](#toc4_5__)    \n",
-    "  - [Run the full suite of tests](#toc4_6__)    \n",
-    "- [Next steps](#toc5__)    \n",
-    "  - [Work with your model documentation](#toc5_1__)    \n",
-    "  - [Discover more learning resources](#toc5_2__)    \n",
-    "- [Upgrade ValidMind](#toc6__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Binary classification`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.ensemble import RandomForestRegressor\n",
-    "from sklearn.ensemble import RandomForestRegressor, GradientBoostingRegressor\n",
-    "from sklearn.metrics import mean_squared_error, r2_score\n",
-    "from sklearn.model_selection import train_test_split\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library. To be able to use it, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.regression import fred_timeseries \n",
-    "\n",
-    "target_column = fred_timeseries.target_column\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{target_column}'\"\n",
-    ")\n",
-    "\n",
-    "raw_df = fred_timeseries.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Document the model\n",
-    "\n",
-    "As part of documenting the model with the ValidMind Library, you need to preprocess the raw dataset, initialize some training and test datasets, initialize a model object you can use for testing, and then run the full suite of tests."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Prepocess the raw dataset\n",
-    "\n",
-    "Preprocessing performs a number of operations to get ready for the subsequent steps:\n",
-    "- **Split the dataset**: Divide the original dataset into training and test sets for the primary model with an 80/20 split, without shuffling.\n",
-    "- **Difference the data**: Calculate the first difference of the train and test datasets to remove trends and seasonality, then drop any resulting NaN values.\n",
-    "- **Extract features and target variables**: Separate the feature columns (predictors) and the target variable from the differenced train and test datasets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Split the raw dataset into training and test sets \n",
-    "train_df, test_df = train_test_split(raw_df, test_size=0.2, shuffle=False)\n",
-    "\n",
-    "# Take the first difference of the training and test sets\n",
-    "train_diff_df = train_df.diff().dropna()\n",
-    "test_diff_df = test_df.diff().dropna()\n",
-    "\n",
-    "# Extract the features and target variable from the training set\n",
-    "X_diff_train = train_diff_df.drop(target_column, axis=1)\n",
-    "y_diff_train = train_diff_df[target_column]\n",
-    "\n",
-    "# Extract the features and target variable from the test set\n",
-    "X_diff_test = test_diff_df.drop(target_column, axis=1)\n",
-    "y_diff_test = test_diff_df[target_column]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Train random forests and gradient boosting regressor models\n",
-    "\n",
-    "This section trains random forest and gradient boosting models on differenced data, transforms predictions back to the original scale, and evaluates model performance using Mean Squared Error (MSE) and R-squared (R²) scores. \n",
-    "\n",
-    "The following helper functions are used to post-process predictions and evaluate model performance:\n",
-    "\n",
-    "- `transform_to_levels`: Reconstructs the original values from differenced predictions by cumulatively summing them, starting from a given initial value.\n",
-    "- `evaluate_model`: Calculates the Mean Squared Error (MSE) and R-squared (R²) score to evaluate the accuracy of the predictions against the true values."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def transform_to_levels(y_diff_pred, first_value=0): \n",
-    "    y_pred = [first_value]\n",
-    "    for pred in y_diff_pred:\n",
-    "        y_pred.append(y_pred[-1] + pred)\n",
-    "    return y_pred\n",
-    "\n",
-    "def evaluate_model(y_true, y_pred):\n",
-    "    mse = mean_squared_error(y_true, y_pred)\n",
-    "    r2 = r2_score(y_true, y_pred)\n",
-    "    return mse, r2"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Fit the random forest model\n",
-    "model_rf = RandomForestRegressor(n_estimators=1500, random_state=0)\n",
-    "model_rf.fit(X_diff_train, y_diff_train)\n",
-    "\n",
-    "# Make predictions on the training and test sets\n",
-    "y_diff_train_pred = model_rf.predict(X_diff_train)\n",
-    "y_diff_test_pred = model_rf.predict(X_diff_test)\n",
-    "\n",
-    "# Transform the predictions back to the original scale\n",
-    "y_train_rf_pred = transform_to_levels(y_diff_train_pred, first_value=train_df[target_column].iloc[0])\n",
-    "y_test_rf_pred = transform_to_levels(y_diff_test_pred, first_value=test_df[target_column].iloc[0])\n",
-    "\n",
-    "# Evaluate the model's performance on the training and test sets\n",
-    "mse_train, r2_train = evaluate_model(train_df[target_column], y_train_rf_pred)\n",
-    "mse_test, r2_test = evaluate_model(test_df[target_column], y_test_rf_pred)\n",
-    "\n",
-    "print(f\"Train Mean Squared Error: {mse_train}\")\n",
-    "print(f\"Train R-Squared: {r2_train}\")\n",
-    "print(f\"Test Mean Squared Error: {mse_test}\")\n",
-    "print(f\"Test R-Squared: {r2_test}\")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Fit the gradient boost model\n",
-    "model_gb = GradientBoostingRegressor(n_estimators=1500, random_state=0)\n",
-    "model_gb.fit(X_diff_train, y_diff_train)\n",
-    "\n",
-    "# Make predictions on the training and test sets\n",
-    "y_diff_train_pred = model_gb.predict(X_diff_train)\n",
-    "y_diff_test_pred = model_gb.predict(X_diff_test)\n",
-    "\n",
-    "# Transform the predictions back to the original scale\n",
-    "y_train_gb_pred = transform_to_levels(y_diff_train_pred, first_value=train_df[target_column].iloc[0])\n",
-    "y_test_gb_pred = transform_to_levels(y_diff_test_pred, first_value=test_df[target_column].iloc[0])\n",
-    "\n",
-    "# Evaluate the model's performance on the training and test sets\n",
-    "mse_train, r2_train = evaluate_model(train_df[target_column], y_train_gb_pred)\n",
-    "mse_test, r2_test = evaluate_model(test_df[target_column], y_test_gb_pred)\n",
-    "\n",
-    "print(f\"Train Mean Squared Error: {mse_train}\")\n",
-    "print(f\"Train R-Squared: {r2_train}\")\n",
-    "print(f\"Test Mean Squared Error: {mse_test}\")\n",
-    "print(f\"Test R-Squared: {r2_test}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset` — the raw dataset that you want to provide as input to tests\n",
-    "- `input_id` - a unique identifier that allows tracking what inputs are used when running each individual test\n",
-    "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
-    "\n",
-    "With all dataframes ready, you can now initialize the ValidMind datasets objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):\n",
-    "\n",
-    "- `vm_raw_ds`: contains the raw, unprocessed data with the specified target column.\n",
-    "- `vm_train_diff_ds`: contains the training data with the differenced target column, excluding the first row to remove NaN values caused by differencing.\n",
-    "- `vm_test_diff_ds`: contains the test data with the differenced target column, excluding the first row to remove NaN values caused by differencing.\n",
-    "- `vm_train_ds`:  contains the training data, excluding the first row to align with the differenced data.\n",
-    "- `vm_test_ds`: includes the test data split from the raw dataset."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_ds = vm.init_dataset(\n",
-    "    input_id=\"raw_ds\",\n",
-    "    dataset=raw_df,\n",
-    "    target_column=target_column,\n",
-    ")\n",
-    "\n",
-    "vm_train_diff_ds = vm.init_dataset(\n",
-    "    input_id=\"train_diff_ds\",\n",
-    "    dataset=train_diff_df,\n",
-    "    target_column=target_column,\n",
-    ")\n",
-    "\n",
-    "vm_test_diff_ds = vm.init_dataset(\n",
-    "    input_id=\"test_diff_ds\",\n",
-    "    dataset=test_diff_df,\n",
-    "    target_column=target_column,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_ds\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=target_column,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_ds\",\n",
-    "    dataset=test_df,\n",
-    "    target_column=target_column,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4__'></a>\n",
-    "\n",
-    "### Initialize the model objects\n",
-    "\n",
-    "Additionally, you need to initialize a ValidMind model object (`vm_model`) for each model, that can be passed to other functions for analysis and tests on the data. You simply intialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_model_rf = vm.init_model(\n",
-    "    model_rf,\n",
-    "    input_id=\"random_forests_model\",\n",
-    ")\n",
-    "\n",
-    "vm_model_gb = vm.init_model(\n",
-    "    model_gb,\n",
-    "    input_id=\"gradient_boosting_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_5__'></a>\n",
-    "\n",
-    "### Assign predictions to the datasets\n",
-    "\n",
-    "We can now use the assign_predictions() method from the Dataset object to link existing predictions to any model. If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model_rf,\n",
-    "    prediction_values=y_train_rf_pred,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_model_rf,\n",
-    "    prediction_values=y_test_rf_pred,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model_gb,\n",
-    "    prediction_values=y_train_gb_pred,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_model_gb,\n",
-    "    prediction_values=y_test_gb_pred,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_6__'></a>\n",
-    "\n",
-    "### Run the full suite of tests\n",
-    "\n",
-    "This is where it all comes together: you are now ready to run the documentation tests for the model as defined by the documentation template you looked at earlier.\n",
-    "\n",
-    "The [`vm.run_documentation_tests`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests) function finds and runs every test specified in the template and then uploads all the documentation and test artifacts that get generated to the ValidMind Platform.\n",
-    "\n",
-    "The function requires information about the inputs to use on every test. These inputs can be passed as an `inputs` argument if we want to use the same inputs for all tests. It's also possible to pass a `config` argument that has information about the `params` and `inputs` that each test requires. The `config` parameter is a dictionary with the following structure:\n",
-    "\n",
-    "```python\n",
-    "config = {\n",
-    "    \"<test-id>\": {\n",
-    "        \"params\": {\n",
-    "            \"param1\": \"value1\",\n",
-    "            \"param2\": \"value2\",\n",
-    "            ...\n",
-    "        },\n",
-    "        \"inputs\": {\n",
-    "            \"input1\": \"value1\",\n",
-    "            \"input2\": \"value2\",\n",
-    "            ...\n",
-    "        }\n",
-    "    },\n",
-    "    ...\n",
-    "}\n",
-    "```\n",
-    "\n",
-    "Each `<test-id>` above corresponds to the test driven block identifiers shown by `vm.preview_template()`. For this model, we will use the default parameters for all tests, but we'll need to specify the input configuration for each one. The method `get_demo_test_config()` below constructs the default input configuration for our demo."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.utils import preview_test_config\n",
-    "\n",
-    "test_config = fred_timeseries.get_demo_test_config()\n",
-    "preview_test_config(test_config)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "Now we can pass the input configuration to `vm.run_documentation_tests()` and run the full suite of tests. The variable `full_suite` then holds the result of these tests."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "full_suite = vm.run_documentation_tests(config=test_config)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Model Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. Click and expand the **Model Development** section.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/model-documentation/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-b9c8d56383ed44cfa943d32f12fc037c",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "validmind-eEL8LtKG-py3.10",
-   "language": "python",
-   "name": "python3"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Document a time series forecasting model\n",
+        "\n",
+        "Use the [FRED](https://fred.stlouisfed.org/) sample dataset to train a simple time series model and document that model with the ValidMind Library.\n",
+        "\n",
+        "As part of the notebook, you will learn how to train a simple model while exploring how the documentation process works:\n",
+        "\n",
+        "- Initializing the ValidMind Library\n",
+        "- Loading a sample dataset provided by the library to train a simple time series model\n",
+        "- Running a ValidMind test suite to quickly generate documentation about the data and model"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_4__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "- [Document the model](#toc4__)    \n",
+        "  - [Preprocess the raw dataset](#toc4_1__)    \n",
+        "  - [Train random forests and gradient boosting regressor models](#toc4_2__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc4_3__)    \n",
+        "  - [Initialize the ValidMind models](#toc4_4__)    \n",
+        "  - [Assign predictions to the datasets](#toc4_5__)    \n",
+        "  - [Run the full suite of tests](#toc4_6__)    \n",
+        "- [Next steps](#toc5__)    \n",
+        "  - [Work with your documentation](#toc5_1__)    \n",
+        "  - [Discover more learning resources](#toc5_2__)    \n",
+        "- [Upgrade ValidMind](#toc6__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Time Series Forecasting with ML`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from sklearn.ensemble import RandomForestRegressor\n",
+        "from sklearn.ensemble import RandomForestRegressor, GradientBoostingRegressor\n",
+        "from sklearn.metrics import mean_squared_error, r2_score\n",
+        "from sklearn.model_selection import train_test_split\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind Library. To be able to use it, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.datasets.regression import fred_timeseries \n",
+        "\n",
+        "target_column = fred_timeseries.target_column\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{target_column}'\"\n",
+        ")\n",
+        "\n",
+        "raw_df = fred_timeseries.load_data()\n",
+        "raw_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Document the model\n",
+        "\n",
+        "As part of documenting the model with the ValidMind Library, you need to preprocess the raw dataset, initialize some training and test datasets, initialize a model object you can use for testing, and then run the full suite of tests."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Preprocess the raw dataset\n",
+        "\n",
+        "Preprocessing performs a number of operations to get ready for the subsequent steps:\n",
+        "- **Split the dataset**: Divide the original dataset into training and test sets for the primary model with an 80/20 split, without shuffling.\n",
+        "- **Difference the data**: Calculate the first difference of the train and test datasets to remove trends and seasonality, then drop any resulting NaN values.\n",
+        "- **Extract features and target variables**: Separate the feature columns (predictors) and the target variable from the differenced train and test datasets."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Split the raw dataset into training and test sets \n",
+        "train_df, test_df = train_test_split(raw_df, test_size=0.2, shuffle=False)\n",
+        "\n",
+        "# Take the first difference of the training and test sets\n",
+        "train_diff_df = train_df.diff().dropna()\n",
+        "test_diff_df = test_df.diff().dropna()\n",
+        "\n",
+        "# Extract the features and target variable from the training set\n",
+        "X_diff_train = train_diff_df.drop(target_column, axis=1)\n",
+        "y_diff_train = train_diff_df[target_column]\n",
+        "\n",
+        "# Extract the features and target variable from the test set\n",
+        "X_diff_test = test_diff_df.drop(target_column, axis=1)\n",
+        "y_diff_test = test_diff_df[target_column]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Train random forests and gradient boosting regressor models\n",
+        "\n",
+        "This section trains random forest and gradient boosting models on differenced data, transforms predictions back to the original scale, and evaluates model performance using Mean Squared Error (MSE) and R-squared (R²) scores. \n",
+        "\n",
+        "The following helper functions are used to post-process predictions and evaluate model performance:\n",
+        "\n",
+        "- `transform_to_levels`: Reconstructs the original values from differenced predictions by cumulatively summing them, starting from a given initial value.\n",
+        "- `evaluate_model`: Calculates the Mean Squared Error (MSE) and R-squared (R²) score to evaluate the accuracy of the predictions against the true values."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def transform_to_levels(y_diff_pred, first_value=0): \n",
+        "    y_pred = [first_value]\n",
+        "    for pred in y_diff_pred:\n",
+        "        y_pred.append(y_pred[-1] + pred)\n",
+        "    return y_pred\n",
+        "\n",
+        "def evaluate_model(y_true, y_pred):\n",
+        "    mse = mean_squared_error(y_true, y_pred)\n",
+        "    r2 = r2_score(y_true, y_pred)\n",
+        "    return mse, r2"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Fit the random forest model\n",
+        "model_rf = RandomForestRegressor(n_estimators=1500, random_state=0)\n",
+        "model_rf.fit(X_diff_train, y_diff_train)\n",
+        "\n",
+        "# Make predictions on the training and test sets\n",
+        "y_diff_train_pred = model_rf.predict(X_diff_train)\n",
+        "y_diff_test_pred = model_rf.predict(X_diff_test)\n",
+        "\n",
+        "# Transform the predictions back to the original scale\n",
+        "y_train_rf_pred = transform_to_levels(y_diff_train_pred, first_value=train_df[target_column].iloc[0])\n",
+        "y_test_rf_pred = transform_to_levels(y_diff_test_pred, first_value=test_df[target_column].iloc[0])\n",
+        "\n",
+        "# Evaluate the model's performance on the training and test sets\n",
+        "mse_train, r2_train = evaluate_model(train_df[target_column], y_train_rf_pred)\n",
+        "mse_test, r2_test = evaluate_model(test_df[target_column], y_test_rf_pred)\n",
+        "\n",
+        "print(f\"Train Mean Squared Error: {mse_train}\")\n",
+        "print(f\"Train R-Squared: {r2_train}\")\n",
+        "print(f\"Test Mean Squared Error: {mse_test}\")\n",
+        "print(f\"Test R-Squared: {r2_test}\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Fit the gradient boost model\n",
+        "model_gb = GradientBoostingRegressor(n_estimators=1500, random_state=0)\n",
+        "model_gb.fit(X_diff_train, y_diff_train)\n",
+        "\n",
+        "# Make predictions on the training and test sets\n",
+        "y_diff_train_pred = model_gb.predict(X_diff_train)\n",
+        "y_diff_test_pred = model_gb.predict(X_diff_test)\n",
+        "\n",
+        "# Transform the predictions back to the original scale\n",
+        "y_train_gb_pred = transform_to_levels(y_diff_train_pred, first_value=train_df[target_column].iloc[0])\n",
+        "y_test_gb_pred = transform_to_levels(y_diff_test_pred, first_value=test_df[target_column].iloc[0])\n",
+        "\n",
+        "# Evaluate the model's performance on the training and test sets\n",
+        "mse_train, r2_train = evaluate_model(train_df[target_column], y_train_gb_pred)\n",
+        "mse_test, r2_test = evaluate_model(test_df[target_column], y_test_gb_pred)\n",
+        "\n",
+        "print(f\"Train Mean Squared Error: {mse_train}\")\n",
+        "print(f\"Train R-Squared: {r2_train}\")\n",
+        "print(f\"Test Mean Squared Error: {mse_test}\")\n",
+        "print(f\"Test R-Squared: {r2_test}\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset` — the raw dataset that you want to provide as input to tests\n",
+        "- `input_id` — a unique identifier that allows tracking what inputs are used when running each individual test\n",
+        "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
+        "\n",
+        "With all dataframes ready, you can now initialize the ValidMind datasets objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):\n",
+        "\n",
+        "- `vm_raw_ds`: contains the raw, unprocessed data with the specified target column.\n",
+        "- `vm_train_diff_ds`: contains the training data with the differenced target column, excluding the first row to remove NaN values caused by differencing.\n",
+        "- `vm_test_diff_ds`: contains the test data with the differenced target column, excluding the first row to remove NaN values caused by differencing.\n",
+        "- `vm_train_ds`: contains the training data split from the raw dataset.\n",
+        "- `vm_test_ds`: includes the test data split from the raw dataset."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_ds = vm.init_dataset(\n",
+        "    input_id=\"raw_ds\",\n",
+        "    dataset=raw_df,\n",
+        "    target_column=target_column,\n",
+        ")\n",
+        "\n",
+        "vm_train_diff_ds = vm.init_dataset(\n",
+        "    input_id=\"train_diff_ds\",\n",
+        "    dataset=train_diff_df,\n",
+        "    target_column=target_column,\n",
+        ")\n",
+        "\n",
+        "vm_test_diff_ds = vm.init_dataset(\n",
+        "    input_id=\"test_diff_ds\",\n",
+        "    dataset=test_diff_df,\n",
+        "    target_column=target_column,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_ds\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=target_column,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_ds\",\n",
+        "    dataset=test_df,\n",
+        "    target_column=target_column,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind models\n",
+        "\n",
+        "You'll also need to initialize ValidMind model objects (`vm_model`) that can be passed to other functions for analysis and tests on the data for our models.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_model_rf = vm.init_model(\n",
+        "    model_rf,\n",
+        "    input_id=\"random_forests_model\",\n",
+        ")\n",
+        "\n",
+        "vm_model_gb = vm.init_model(\n",
+        "    model_gb,\n",
+        "    input_id=\"gradient_boosting_model\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_5__'></a>\n",
+        "\n",
+        "### Assign predictions to the datasets\n",
+        "\n",
+        "We can now use the `assign_predictions()` method from the `Dataset` object to link existing predictions to any model. If no prediction values are passed, the method will compute predictions automatically:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model_rf,\n",
+        "    prediction_values=y_train_rf_pred,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_model_rf,\n",
+        "    prediction_values=y_test_rf_pred,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model_gb,\n",
+        "    prediction_values=y_train_gb_pred,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_model_gb,\n",
+        "    prediction_values=y_test_gb_pred,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_6__'></a>\n",
+        "\n",
+        "### Run the full suite of tests\n",
+        "\n",
+        "This is where it all comes together: you are now ready to run the documentation tests for the model as defined by the documentation template you looked at earlier.\n",
+        "\n",
+        "The [`vm.run_documentation_tests`](https://docs.validmind.ai/validmind/validmind.html#run_documentation_tests) function finds and runs every test specified in the template and then uploads all the documentation and test artifacts that get generated to the ValidMind Platform.\n",
+        "\n",
+        "The function requires information about the inputs to use on every test. These inputs can be passed as an `inputs` argument if we want to use the same inputs for all tests. It's also possible to pass a `config` argument that has information about the `params` and `inputs` that each test requires. The `config` parameter is a dictionary with the following structure:\n",
+        "\n",
+        "```python\n",
+        "config = {\n",
+        "    \"<test-id>\": {\n",
+        "        \"params\": {\n",
+        "            \"param1\": \"value1\",\n",
+        "            \"param2\": \"value2\",\n",
+        "            ...\n",
+        "        },\n",
+        "        \"inputs\": {\n",
+        "            \"input1\": \"value1\",\n",
+        "            \"input2\": \"value2\",\n",
+        "            ...\n",
+        "        }\n",
+        "    },\n",
+        "    ...\n",
+        "}\n",
+        "```\n",
+        "\n",
+        "Each `<test-id>` above corresponds to the test-driven block identifiers shown by `vm.preview_template()`. For this model, we will use the default parameters for all tests, but we'll need to specify the input configuration for each one. The method `get_demo_test_config()` below constructs the default input configuration for our demo."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.utils import preview_test_config\n",
+        "\n",
+        "test_config = fred_timeseries.get_demo_test_config()\n",
+        "preview_test_config(test_config)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Now we can pass the input configuration to `vm.run_documentation_tests()` and run the full suite of tests. The variable `full_suite` then holds the result of these tests."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "full_suite = vm.run_documentation_tests(config=test_config)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (**Learn more:** [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. Click and expand the **Model Development** section.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-ab56373aa7ee4e15909017ab135ceaae"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "validmind-eEL8LtKG-py3.10",
+      "language": "python",
+      "name": "python3"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/use_cases/time_series/quickstart_time_series_high_code.ipynb b/site/notebooks/use_cases/time_series/quickstart_time_series_high_code.ipynb
index 87610c5f9e..1dfae1e06e 100644
--- a/site/notebooks/use_cases/time_series/quickstart_time_series_high_code.ipynb
+++ b/site/notebooks/use_cases/time_series/quickstart_time_series_high_code.ipynb
@@ -1,1008 +1,1023 @@
 {
- "cells": [
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "# Document a time series forecasting model\n",
-    "\n",
-    "Use the [FRED](https://fred.stlouisfed.org/) sample dataset to train a simple time series model and document that model with the ValidMind Library.\n",
-    "\n",
-    "As part of the notebook, you will learn how to train a simple model while exploring how the documentation process works:\n",
-    "\n",
-    "- Initializing the ValidMind Library\n",
-    "- Loading a sample dataset provided by the library to train a simple time series model\n",
-    "- Running a ValidMind test suite to quickly generate documentation about the data and model"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "::: {.content-hidden when-format=\"html\"}\n",
-    "## Contents    \n",
-    "- [About ValidMind](#toc1__)    \n",
-    "  - [Before you begin](#toc1_1__)    \n",
-    "  - [New to ValidMind?](#toc1_2__)    \n",
-    "  - [Key concepts](#toc1_3__)    \n",
-    "- [Setting up](#toc2__)    \n",
-    "  - [Install the ValidMind Library](#toc2_1__)    \n",
-    "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
-    "    - [Register sample model](#toc2_2_1__)    \n",
-    "    - [Apply documentation template](#toc2_2_2__)    \n",
-    "    - [Get your code snippet](#toc2_2_3__)    \n",
-    "  - [Initialize the Python environment](#toc2_3__)    \n",
-    "  - [Preview the documentation template](#toc2_4__)    \n",
-    "- [Load the sample dataset](#toc3__)    \n",
-    "- [Document the model](#toc4__)    \n",
-    "  - [Prepocess the raw dataset](#toc4_1__)    \n",
-    "  - [Train random forests and gradient boosting regressor models](#toc4_2__)    \n",
-    "  - [Initialize the ValidMind datasets](#toc4_3__)    \n",
-    "  - [Initialize the model objects](#toc4_4__)    \n",
-    "  - [Assign predictions to the datasets](#toc4_5__)    \n",
-    "  - [Run data validation tests](#toc4_6__)    \n",
-    "  - [Run model validation tests](#toc4_7__)    \n",
-    "- [Next steps](#toc5__)    \n",
-    "  - [Work with your model documentation](#toc5_1__)    \n",
-    "  - [Discover more learning resources](#toc5_2__)    \n",
-    "- [Upgrade ValidMind](#toc6__)    \n",
-    "\n",
-    ":::\n",
-    "<!-- jn-toc-notebook-config\n",
-    "\tnumbering=false\n",
-    "\tanchor=true\n",
-    "\tflat=false\n",
-    "\tminLevel=2\n",
-    "\tmaxLevel=4\n",
-    "\t/jn-toc-notebook-config -->\n",
-    "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc1__'></a>\n",
-    "\n",
-    "## About ValidMind\n",
-    "\n",
-    "ValidMind is a suite of tools for managing model risk, including risk associated with AI and statistical models.\n",
-    "\n",
-    "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on model documentation. Together, these products simplify model risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and model validators.\n",
-    "\n",
-    "<a id='toc1_1__'></a>\n",
-    "\n",
-    "### Before you begin\n",
-    "\n",
-    "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
-    "\n",
-    "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
-    "\n",
-    "<a id='toc1_2__'></a>\n",
-    "\n",
-    "### New to ValidMind?\n",
-    "\n",
-    "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting models and running tests, as well as find code samples and our Python Library API reference.\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
-    "<br></br>\n",
-    "<a href=\"https://docs.validmind.ai/guide/configuration/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
-    "\n",
-    "<a id='toc1_3__'></a>\n",
-    "\n",
-    "### Key concepts\n",
-    "\n",
-    "**Model documentation**: A structured and detailed record pertaining to a model, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. It serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the model’s application.\n",
-    "\n",
-    "**Documentation template**: Functions as a test suite and lays out the structure of model documentation, segmented into various sections and sub-sections. Documentation templates define the structure of your model documentation, specifying the tests that should be run, and how the results should be displayed.\n",
-    "\n",
-    "**Tests**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or model. Tests are the building blocks of ValidMind, used to evaluate and document models and datasets, and can be run individually or as part of a suite defined by your model documentation template.\n",
-    "\n",
-    "**Metrics**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
-    "\n",
-    "**Custom metrics**: Custom metrics are functions that you define to evaluate your model or dataset. These functions can be registered via the ValidMind Library to be used with the ValidMind Platform.\n",
-    "\n",
-    "**Inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
-    "\n",
-    "  - **model**: A single model that has been initialized in ValidMind with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model).\n",
-    "  - **dataset**: Single dataset that has been initialized in ValidMind with [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
-    "  - **models**: A list of ValidMind models - usually this is used when you want to compare multiple models in your custom metric.\n",
-    "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom metric. See this [example](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html) for more information.\n",
-    "\n",
-    "**Parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a metric, customize its behavior, or provide additional context.\n",
-    "\n",
-    "**Outputs**: Custom metrics can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures.\n",
-    "\n",
-    "**Test suites**: Collections of tests designed to run together to automate and generate model documentation end-to-end for specific use-cases.\n",
-    "\n",
-    "Example: the [`classifier_full_suite`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html#ClassifierFullSuite) test suite runs tests from the [`tabular_dataset`](https://docs.validmind.ai/validmind/validmind/test_suites/tabular_datasets.html) and [`classifier`](https://docs.validmind.ai/validmind/validmind/test_suites/classifier.html) test suites to fully document the data and model sections for binary classification model use-cases."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2__'></a>\n",
-    "\n",
-    "## Setting up"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_1__'></a>\n",
-    "\n",
-    "### Install the ValidMind Library\n",
-    "\n",
-    "To install the library:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip install -q validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind Library"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_1__'></a>\n",
-    "\n",
-    "#### Register sample model\n",
-    "\n",
-    "Let's first register a sample model for use with this notebook:\n",
-    "\n",
-    "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/configuration/log-in-to-validmind.html).\n",
-    "\n",
-    "2. In the left sidebar, navigate to **Inventory** and click **+ Register Model**.\n",
-    "\n",
-    "3. Enter the model details and click **Next >** to continue to assignment of model stakeholders. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/register-models-in-inventory.html))\n",
-    "\n",
-    "4. Select your own name under the **MODEL OWNER** drop-down.\n",
-    "\n",
-    "5. Click **Register Model** to add the model to your inventory."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_2__'></a>\n",
-    "\n",
-    "#### Apply documentation template\n",
-    "\n",
-    "Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.\n",
-    "\n",
-    "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
-    "\n",
-    "2. Under **TEMPLATE**, select `Time Series Forecasting with ML`.\n",
-    "\n",
-    "3. Click **Use Template** to apply the template."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_2_3__'></a>\n",
-    "\n",
-    "#### Get your code snippet\n",
-    "\n",
-    "Initialize the ValidMind Library with the *code snippet* unique to each model per document, ensuring your test results are uploaded to the correct model and automatically populated in the right document in the ValidMind Platform when you run this notebook.\n",
-    "\n",
-    "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
-    "2. Click **Copy snippet to clipboard**.\n",
-    "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/model-documentation/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Load your model identifier credentials from an `.env` file\n",
-    "\n",
-    "%load_ext dotenv\n",
-    "%dotenv .env\n",
-    "\n",
-    "# Or replace with your code snippet\n",
-    "\n",
-    "import validmind as vm\n",
-    "\n",
-    "vm.init(\n",
-    "    # api_host=\"...\",\n",
-    "    # api_key=\"...\",\n",
-    "    # api_secret=\"...\",\n",
-    "    # model=\"...\",\n",
-    "    document=\"documentation\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_3__'></a>\n",
-    "\n",
-    "### Initialize the Python environment\n",
-    "\n",
-    "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from sklearn.ensemble import RandomForestRegressor, GradientBoostingRegressor\n",
-    "from sklearn.metrics import mean_squared_error, r2_score\n",
-    "from sklearn.model_selection import train_test_split\n",
-    "\n",
-    "%matplotlib inline"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc2_4__'></a>\n",
-    "\n",
-    "### Preview the documentation template\n",
-    "\n",
-    "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
-    "\n",
-    "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind library and note the empty sections:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm.preview_template()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc3__'></a>\n",
-    "\n",
-    "## Load the sample dataset\n",
-    "\n",
-    "The sample dataset used here is provided by the ValidMind library. To be able to use it, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.datasets.regression import fred_timeseries \n",
-    "\n",
-    "target_column = fred_timeseries.target_column\n",
-    "\n",
-    "print(\n",
-    "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{target_column}'\"\n",
-    ")\n",
-    "\n",
-    "raw_df = fred_timeseries.load_data()\n",
-    "raw_df.head()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4__'></a>\n",
-    "\n",
-    "## Document the model\n",
-    "\n",
-    "As part of documenting the model with the ValidMind Library, you need to preprocess the raw dataset, initialize some training and test datasets, initialize a model object you can use for testing, and then run the full suite of tests."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_1__'></a>\n",
-    "\n",
-    "### Prepocess the raw dataset\n",
-    "\n",
-    "Preprocessing performs a number of operations to get ready for the subsequent steps:\n",
-    "- **Split the dataset**: Divide the original dataset into training and test sets for the primary model with an 80/20 split, without shuffling.\n",
-    "- **Difference the data**: Calculate the first difference of the train and test datasets to remove trends and seasonality, then drop any resulting NaN values.\n",
-    "- **Extract features and target variables**: Separate the feature columns (predictors) and the target variable from the differenced train and test datasets."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Split the raw dataset into training and test sets \n",
-    "train_df, test_df = train_test_split(raw_df, test_size=0.2, shuffle=False)\n",
-    "\n",
-    "# Take the first difference of the training and test sets\n",
-    "train_diff_df = train_df.diff().dropna()\n",
-    "test_diff_df = test_df.diff().dropna()\n",
-    "\n",
-    "# Extract the features and target variable from the training set\n",
-    "X_diff_train = train_diff_df.drop(target_column, axis=1)\n",
-    "y_diff_train = train_diff_df[target_column]\n",
-    "\n",
-    "# Extract the features and target variable from the test set\n",
-    "X_diff_test = test_diff_df.drop(target_column, axis=1)\n",
-    "y_diff_test = test_diff_df[target_column]"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_2__'></a>\n",
-    "\n",
-    "### Train random forests and gradient boosting regressor models\n",
-    "\n",
-    "This section trains random forest and gradient boosting models on differenced data, transforms predictions back to the original scale, and evaluates model performance using Mean Squared Error (MSE) and R-squared (R²) scores. \n",
-    "\n",
-    "The following helper functions are used to post-process predictions and evaluate model performance:\n",
-    "\n",
-    "- `transform_to_levels`: Reconstructs the original values from differenced predictions by cumulatively summing them, starting from a given initial value.\n",
-    "- `evaluate_model`: Calculates the Mean Squared Error (MSE) and R-squared (R²) score to evaluate the accuracy of the predictions against the true values."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "def transform_to_levels(y_diff_pred, first_value=0): \n",
-    "    y_pred = [first_value]\n",
-    "    for pred in y_diff_pred:\n",
-    "        y_pred.append(y_pred[-1] + pred)\n",
-    "    return y_pred\n",
-    "\n",
-    "def evaluate_model(y_true, y_pred):\n",
-    "    mse = mean_squared_error(y_true, y_pred)\n",
-    "    r2 = r2_score(y_true, y_pred)\n",
-    "    return mse, r2"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Fit the random forest model\n",
-    "model_rf = RandomForestRegressor(n_estimators=1500, random_state=0)\n",
-    "model_rf.fit(X_diff_train, y_diff_train)\n",
-    "\n",
-    "# Make predictions on the training and test sets\n",
-    "y_diff_train_pred = model_rf.predict(X_diff_train)\n",
-    "y_diff_test_pred = model_rf.predict(X_diff_test)\n",
-    "\n",
-    "# Transform the predictions back to the original scale\n",
-    "y_train_rf_pred = transform_to_levels(y_diff_train_pred, first_value=train_df[target_column].iloc[0])\n",
-    "y_test_rf_pred = transform_to_levels(y_diff_test_pred, first_value=test_df[target_column].iloc[0])\n",
-    "\n",
-    "# Evaluate the model's performance on the training and test sets\n",
-    "mse_train, r2_train = evaluate_model(train_df[target_column], y_train_rf_pred)\n",
-    "mse_test, r2_test = evaluate_model(test_df[target_column], y_test_rf_pred)\n",
-    "\n",
-    "print(f\"Train Mean Squared Error: {mse_train}\")\n",
-    "print(f\"Train R-Squared: {r2_train}\")\n",
-    "print(f\"Test Mean Squared Error: {mse_test}\")\n",
-    "print(f\"Test R-Squared: {r2_test}\")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "# Fit the gradient boost model\n",
-    "model_gb = GradientBoostingRegressor(n_estimators=1500, random_state=0)\n",
-    "model_gb.fit(X_diff_train, y_diff_train)\n",
-    "\n",
-    "# Make predictions on the training and test sets\n",
-    "y_diff_train_pred = model_gb.predict(X_diff_train)\n",
-    "y_diff_test_pred = model_gb.predict(X_diff_test)\n",
-    "\n",
-    "# Transform the predictions back to the original scale\n",
-    "y_train_gb_pred = transform_to_levels(y_diff_train_pred, first_value=train_df[target_column].iloc[0])\n",
-    "y_test_gb_pred = transform_to_levels(y_diff_test_pred, first_value=test_df[target_column].iloc[0])\n",
-    "\n",
-    "# Evaluate the model's performance on the training and test sets\n",
-    "mse_train, r2_train = evaluate_model(train_df[target_column], y_train_gb_pred)\n",
-    "mse_test, r2_test = evaluate_model(test_df[target_column], y_test_gb_pred)\n",
-    "\n",
-    "print(f\"Train Mean Squared Error: {mse_train}\")\n",
-    "print(f\"Train R-Squared: {r2_train}\")\n",
-    "print(f\"Test Mean Squared Error: {mse_test}\")\n",
-    "print(f\"Test R-Squared: {r2_test}\")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_3__'></a>\n",
-    "\n",
-    "### Initialize the ValidMind datasets\n",
-    "\n",
-    "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
-    "\n",
-    "This function takes a number of arguments:\n",
-    "\n",
-    "- `dataset` — the raw dataset that you want to provide as input to tests\n",
-    "- `input_id` - a unique identifier that allows tracking what inputs are used when running each individual test\n",
-    "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
-    "\n",
-    "With all dataframes ready, you can now initialize the ValidMind datasets objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):\n",
-    "\n",
-    "- `vm_raw_ds`: contains the raw, unprocessed data with the specified target column.\n",
-    "- `vm_train_diff_ds`: contains the training data with the differenced target column, excluding the first row to remove NaN values caused by differencing.\n",
-    "- `vm_test_diff_ds`: contains the test data with the differenced target column, excluding the first row to remove NaN values caused by differencing.\n",
-    "- `vm_train_ds`:  contains the training data, excluding the first row to align with the differenced data.\n",
-    "- `vm_test_ds`: includes the test data split from the raw dataset."
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_raw_ds = vm.init_dataset(\n",
-    "    input_id=\"raw_ds\",\n",
-    "    dataset=raw_df,\n",
-    "    target_column=target_column,\n",
-    ")\n",
-    "\n",
-    "vm_train_diff_ds = vm.init_dataset(\n",
-    "    input_id=\"train_diff_ds\",\n",
-    "    dataset=train_diff_df,\n",
-    "    target_column=target_column,\n",
-    ")\n",
-    "\n",
-    "vm_test_diff_ds = vm.init_dataset(\n",
-    "    input_id=\"test_diff_ds\",\n",
-    "    dataset=test_diff_df,\n",
-    "    target_column=target_column,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds = vm.init_dataset(\n",
-    "    input_id=\"train_ds\",\n",
-    "    dataset=train_df,\n",
-    "    target_column=target_column,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds = vm.init_dataset(\n",
-    "    input_id=\"test_ds\",\n",
-    "    dataset=test_df,\n",
-    "    target_column=target_column,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_4__'></a>\n",
-    "\n",
-    "### Initialize the model objects\n",
-    "\n",
-    "Additionally, you need to initialize a ValidMind model object (`vm_model`) for each model, that can be passed to other functions for analysis and tests on the data. You simply intialize this model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_model_rf = vm.init_model(\n",
-    "    model_rf,\n",
-    "    input_id=\"random_forests_model\",\n",
-    ")\n",
-    "\n",
-    "vm_model_gb = vm.init_model(\n",
-    "    model_gb,\n",
-    "    input_id=\"gradient_boosting_model\",\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_5__'></a>\n",
-    "\n",
-    "### Assign predictions to the datasets\n",
-    "\n",
-    "We can now use the assign_predictions() method from the Dataset object to link existing predictions to any model. If no prediction values are passed, the method will compute predictions automatically:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model_rf,\n",
-    "    prediction_values=y_train_rf_pred,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_model_rf,\n",
-    "    prediction_values=y_test_rf_pred,\n",
-    ")\n",
-    "\n",
-    "vm_train_ds.assign_predictions(\n",
-    "    model=vm_model_gb,\n",
-    "    prediction_values=y_train_gb_pred,\n",
-    ")\n",
-    "\n",
-    "vm_test_ds.assign_predictions(\n",
-    "    model=vm_model_gb,\n",
-    "    prediction_values=y_test_gb_pred,\n",
-    ")"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "from validmind.utils import preview_test_config\n",
-    "\n",
-    "test_config = fred_timeseries.get_demo_test_config()\n",
-    "preview_test_config(test_config)"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_6__'></a>\n",
-    "\n",
-    "### Run data validation tests"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.TimeSeriesDescription\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"raw_ds\", \"train_diff_ds\", \"test_diff_ds\", \"train_ds\", \"test_ds\"],\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.TimeSeriesLinePlot\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"raw_ds\"],\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.TimeSeriesMissingValues\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"raw_ds\", \"train_diff_ds\", \"test_diff_ds\", \"train_ds\", \"test_ds\"],\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.SeasonalDecompose\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"raw_ds\"],\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.TimeSeriesDescriptiveStatistics\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"train_diff_ds\", \"test_diff_ds\"],\n",
-    "    },\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.TimeSeriesOutliers\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"train_diff_ds\", \"test_diff_ds\"],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"zscore_threshold\": 4\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.TimeSeriesHistogram\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [ \"train_diff_ds\", \"test_diff_ds\"],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"nbins\": 100\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.data_validation.DatasetSplit\",\n",
-    "    inputs={\n",
-    "        \"datasets\": [\"train_diff_ds\", \"test_diff_ds\"],\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc4_7__'></a>\n",
-    "\n",
-    "### Run model validation tests"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.ModelMetadata\",\n",
-    "    input_grid={\n",
-    "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.RegressionErrors\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
-    "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.RegressionR2Square\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
-    "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.TimeSeriesR2SquareBySegments:train_data\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"train_ds\"],\n",
-    "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.TimeSeriesR2SquareBySegments:test_data\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"test_ds\"],\n",
-    "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
-    "    },\n",
-    "    params={\n",
-    "        \"segments\":{\n",
-    "            \"start_date\": [\"2012-11-01\",\"2018-02-01\"],\n",
-    "            \"end_date\": [\"2018-01-01\",\"2023-03-01\"]\n",
-    "        }\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.TimeSeriesPredictionsPlot\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
-    "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.TimeSeriesPredictionWithCI\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
-    "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.ModelPredictionResiduals\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
-    "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.FeatureImportance\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
-    "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "test = vm.tests.run_test(\n",
-    "    \"validmind.model_validation.sklearn.PermutationFeatureImportance\",\n",
-    "    input_grid={\n",
-    "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
-    "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
-    "    }\n",
-    ")\n",
-    "test.log()"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc5__'></a>\n",
-    "\n",
-    "## Next steps\n",
-    "\n",
-    "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
-    "\n",
-    "<a id='toc5_1__'></a>\n",
-    "\n",
-    "### Work with your model documentation\n",
-    "\n",
-    "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. ([Need more help?](https://docs.validmind.ai/guide/model-inventory/working-with-model-inventory.html))\n",
-    "\n",
-    "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
-    "\n",
-    "What you see is the full draft of your model documentation in a more easily consumable version. From here, you can make qualitative edits to model documentation, view guidelines, collaborate with validators, and submit your model documentation for approval when it's ready. [Learn more ...](https://docs.validmind.ai/guide/working-with-model-documentation.html)\n",
-    "\n",
-    "<a id='toc5_2__'></a>\n",
-    "\n",
-    "### Discover more learning resources\n",
-    "\n",
-    "We offer many interactive notebooks to help you automate testing, documenting, validating, and more:\n",
-    "\n",
-    "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
-    "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
-    "- [Code samples by use case](https://docs.validmind.ai/guide/samples-jupyter-notebooks.html)\n",
-    "\n",
-    "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "<a id='toc6__'></a>\n",
-    "\n",
-    "## Upgrade ValidMind\n",
-    "\n",
-    "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
-    "\n",
-    "Retrieve the information for the currently installed version of ValidMind:"
-   ]
-  },
-  {
-   "cell_type": "code",
-   "execution_count": null,
-   "metadata": {},
-   "outputs": [],
-   "source": [
-    "%pip show validmind"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
-    "\n",
-    "```bash\n",
-    "%pip install --upgrade validmind\n",
-    "```"
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "metadata": {},
-   "source": [
-    "You may need to restart your kernel after running the upgrade package for changes to be applied."
-   ]
-  },
-  {
-   "cell_type": "markdown",
-   "id": "copyright-4f0137500d9c49d3b6641ef3779aa140",
-   "metadata": {},
-   "source": [
-    "<!-- VALIDMIND COPYRIGHT -->\n",
-    "\n",
-    "<small>\n",
-    "\n",
-    "***\n",
-    "\n",
-    "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
-    "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
-    "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
-   ]
-  }
- ],
- "metadata": {
-  "kernelspec": {
-   "display_name": "ValidMind Library",
-   "language": "python",
-   "name": "validmind"
-  },
-  "language_info": {
-   "codemirror_mode": {
-    "name": "ipython",
-    "version": 3
-   },
-   "file_extension": ".py",
-   "mimetype": "text/x-python",
-   "name": "python",
-   "nbconvert_exporter": "python",
-   "pygments_lexer": "ipython3",
-   "version": "3.10.13"
-  }
- },
- "nbformat": 4,
- "nbformat_minor": 2
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Document a time series forecasting model\n",
+        "\n",
+        "Use the [FRED](https://fred.stlouisfed.org/) sample dataset to train a simple time series model and document that model with the ValidMind Library.\n",
+        "\n",
+        "As part of the notebook, you will learn how to train a simple model while exploring how the documentation process works:\n",
+        "\n",
+        "- Initializing the ValidMind Library\n",
+        "- Loading a sample dataset provided by the library to train a simple time series model\n",
+        "- Running a ValidMind test suite to quickly generate documentation about the data and model"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_1__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_2__)    \n",
+        "    - [Register sample model](#toc2_2_1__)    \n",
+        "    - [Apply documentation template](#toc2_2_2__)    \n",
+        "    - [Get your code snippet](#toc2_2_3__)    \n",
+        "  - [Initialize the Python environment](#toc2_3__)    \n",
+        "  - [Preview the documentation template](#toc2_4__)    \n",
+        "- [Load the sample dataset](#toc3__)    \n",
+        "- [Document the model](#toc4__)    \n",
+        "  - [Preprocess the raw dataset](#toc4_1__)    \n",
+        "  - [Train random forests and gradient boosting regressor models](#toc4_2__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc4_3__)    \n",
+        "  - [Initialize the ValidMind models](#toc4_4__)    \n",
+        "  - [Assign predictions to the datasets](#toc4_5__)    \n",
+        "  - [Run data validation tests](#toc4_6__)    \n",
+        "  - [Run model validation tests](#toc4_7__)    \n",
+        "- [Next steps](#toc5__)    \n",
+        "  - [Work with your documentation](#toc5_1__)    \n",
+        "  - [Discover more learning resources](#toc5_2__)    \n",
+        "- [Upgrade ValidMind](#toc6__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate documentation and validation tests, and then use the ValidMind Platform to collaborate on documentation. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and validators.\n",
+        "\n",
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html).\n",
+        "\n",
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about documenting records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>\n",
+        "\n",
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**documentation, model documentation**: A structured and detailed document pertaining to a record, encompassing key components such as its underlying assumptions, methodologies, data sources, inputs, performance metrics, evaluations, limitations, and intended uses. Within the realm of risk management, this documentation serves to ensure transparency, adherence to regulatory requirements, and a clear understanding of potential risks associated with the record's application.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**documentation template**: A default ValidMind document type that serves as a standardized framework for developing and documenting records, including sections designated for record details, data descriptions, test results, and performance metrics. By outlining required documentation and recommended analyses, document templates ensure consistency and completeness across documentation and help guide developers through a systematic development process while promoting comparability and traceability of development outcomes.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_1__'></a>\n",
+        "\n",
+        "#### Register sample model\n",
+        "\n",
+        "Let's first register a sample record (model) for use with this notebook:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_2__'></a>\n",
+        "\n",
+        "#### Apply documentation template\n",
+        "\n",
+        "Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Development**.\n",
+        "\n",
+        "    If you cannot locate your Development document, make sure Development type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Time Series Forecasting with ML`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2_3__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Development` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"documentation\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Initialize the Python environment\n",
+        "\n",
+        "Next, let's import the necessary libraries and set up your Python environment for data analysis:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from sklearn.ensemble import RandomForestRegressor, GradientBoostingRegressor\n",
+        "from sklearn.metrics import mean_squared_error, r2_score\n",
+        "from sklearn.model_selection import train_test_split\n",
+        "\n",
+        "%matplotlib inline"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Preview the documentation template\n",
+        "\n",
+        "Let's verify that you have connected the ValidMind Library to the ValidMind Platform and that the appropriate *template* is selected for your model.\n",
+        "\n",
+        "You will upload documentation and test results unique to your model based on this template later on. For now, **take a look at the default structure that the template provides with [the `vm.preview_template()` function](https://docs.validmind.ai/validmind/validmind.html#preview_template)** from the ValidMind Library and note the empty sections:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.preview_template()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Load the sample dataset\n",
+        "\n",
+        "The sample dataset used here is provided by the ValidMind Library. To be able to use it, you need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.datasets.regression import fred_timeseries \n",
+        "\n",
+        "target_column = fred_timeseries.target_column\n",
+        "\n",
+        "print(\n",
+        "    f\"Loaded demo dataset with: \\n\\n\\t• Target column: '{target_column}'\"\n",
+        ")\n",
+        "\n",
+        "raw_df = fred_timeseries.load_data()\n",
+        "raw_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Document the model\n",
+        "\n",
+        "As part of documenting the model with the ValidMind Library, you need to preprocess the raw dataset, initialize some training and test datasets, initialize a model object you can use for testing, and then run the full suite of tests."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Preprocess the raw dataset\n",
+        "\n",
+        "Preprocessing performs a number of operations to get ready for the subsequent steps:\n\n",
+        "- **Split the dataset**: Divide the original dataset into training and test sets for the primary model with an 80/20 split, without shuffling.\n",
+        "- **Difference the data**: Calculate the first difference of the train and test datasets to remove trends and seasonality, then drop any resulting NaN values.\n",
+        "- **Extract features and target variables**: Separate the feature columns (predictors) and the target variable from the differenced train and test datasets."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Split the raw dataset into training and test sets \n",
+        "train_df, test_df = train_test_split(raw_df, test_size=0.2, shuffle=False)\n",
+        "\n",
+        "# Take the first difference of the training and test sets\n",
+        "train_diff_df = train_df.diff().dropna()\n",
+        "test_diff_df = test_df.diff().dropna()\n",
+        "\n",
+        "# Extract the features and target variable from the training set\n",
+        "X_diff_train = train_diff_df.drop(target_column, axis=1)\n",
+        "y_diff_train = train_diff_df[target_column]\n",
+        "\n",
+        "# Extract the features and target variable from the test set\n",
+        "X_diff_test = test_diff_df.drop(target_column, axis=1)\n",
+        "y_diff_test = test_diff_df[target_column]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Train random forests and gradient boosting regressor models\n",
+        "\n",
+        "This section trains random forest and gradient boosting models on differenced data, transforms predictions back to the original scale, and evaluates model performance using Mean Squared Error (MSE) and R-squared (R²) scores. \n",
+        "\n",
+        "The following helper functions are used to post-process predictions and evaluate model performance:\n",
+        "\n",
+        "- `transform_to_levels`: Reconstructs the original values from differenced predictions by cumulatively summing them, starting from a given initial value.\n",
+        "- `evaluate_model`: Calculates the Mean Squared Error (MSE) and R-squared (R²) score to evaluate the accuracy of the predictions against the true values."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "def transform_to_levels(y_diff_pred, first_value=0): \n",
+        "    y_pred = [first_value]\n",
+        "    for pred in y_diff_pred:\n",
+        "        y_pred.append(y_pred[-1] + pred)\n",
+        "    return y_pred\n",
+        "\n",
+        "def evaluate_model(y_true, y_pred):\n",
+        "    mse = mean_squared_error(y_true, y_pred)\n",
+        "    r2 = r2_score(y_true, y_pred)\n",
+        "    return mse, r2"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Fit the random forest model\n",
+        "model_rf = RandomForestRegressor(n_estimators=1500, random_state=0)\n",
+        "model_rf.fit(X_diff_train, y_diff_train)\n",
+        "\n",
+        "# Make predictions on the training and test sets\n",
+        "y_diff_train_pred = model_rf.predict(X_diff_train)\n",
+        "y_diff_test_pred = model_rf.predict(X_diff_test)\n",
+        "\n",
+        "# Transform the predictions back to the original scale\n",
+        "y_train_rf_pred = transform_to_levels(y_diff_train_pred, first_value=train_df[target_column].iloc[0])\n",
+        "y_test_rf_pred = transform_to_levels(y_diff_test_pred, first_value=test_df[target_column].iloc[0])\n",
+        "\n",
+        "# Evaluate the model's performance on the training and test sets\n",
+        "mse_train, r2_train = evaluate_model(train_df[target_column], y_train_rf_pred)\n",
+        "mse_test, r2_test = evaluate_model(test_df[target_column], y_test_rf_pred)\n",
+        "\n",
+        "print(f\"Train Mean Squared Error: {mse_train}\")\n",
+        "print(f\"Train R-Squared: {r2_train}\")\n",
+        "print(f\"Test Mean Squared Error: {mse_test}\")\n",
+        "print(f\"Test R-Squared: {r2_test}\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Fit the gradient boost model\n",
+        "model_gb = GradientBoostingRegressor(n_estimators=1500, random_state=0)\n",
+        "model_gb.fit(X_diff_train, y_diff_train)\n",
+        "\n",
+        "# Make predictions on the training and test sets\n",
+        "y_diff_train_pred = model_gb.predict(X_diff_train)\n",
+        "y_diff_test_pred = model_gb.predict(X_diff_test)\n",
+        "\n",
+        "# Transform the predictions back to the original scale\n",
+        "y_train_gb_pred = transform_to_levels(y_diff_train_pred, first_value=train_df[target_column].iloc[0])\n",
+        "y_test_gb_pred = transform_to_levels(y_diff_test_pred, first_value=test_df[target_column].iloc[0])\n",
+        "\n",
+        "# Evaluate the model's performance on the training and test sets\n",
+        "mse_train, r2_train = evaluate_model(train_df[target_column], y_train_gb_pred)\n",
+        "mse_test, r2_test = evaluate_model(test_df[target_column], y_test_gb_pred)\n",
+        "\n",
+        "print(f\"Train Mean Squared Error: {mse_train}\")\n",
+        "print(f\"Train R-Squared: {r2_train}\")\n",
+        "print(f\"Test Mean Squared Error: {mse_test}\")\n",
+        "print(f\"Test R-Squared: {r2_test}\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you must first initialize a ValidMind dataset object using the [`init_dataset`](https://docs.validmind.ai/validmind/validmind.html#init_dataset) function from the ValidMind (`vm`) module.\n",
+        "\n",
+        "This function takes a number of arguments:\n",
+        "\n",
+        "- `dataset` — the raw dataset that you want to provide as input to tests\n",
+        "- `input_id` — a unique identifier that allows tracking what inputs are used when running each individual test\n",
+        "- `target_column` — a required argument if tests require access to true values. This is the name of the target column in the dataset\n",
+        "\n",
+        "With all dataframes ready, you can now initialize the ValidMind datasets objects using [`vm.init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset):\n",
+        "\n",
+        "- `vm_raw_ds`: contains the raw, unprocessed data with the specified target column.\n",
+        "- `vm_train_diff_ds`: contains the training data with the differenced target column, excluding the first row to remove NaN values caused by differencing.\n",
+        "- `vm_test_diff_ds`: contains the test data with the differenced target column, excluding the first row to remove NaN values caused by differencing.\n",
+        "- `vm_train_ds`: contains the training data split from the raw dataset, in its original (undifferenced) levels.\n",
+        "- `vm_test_ds`: includes the test data split from the raw dataset."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_raw_ds = vm.init_dataset(\n",
+        "    input_id=\"raw_ds\",\n",
+        "    dataset=raw_df,\n",
+        "    target_column=target_column,\n",
+        ")\n",
+        "\n",
+        "vm_train_diff_ds = vm.init_dataset(\n",
+        "    input_id=\"train_diff_ds\",\n",
+        "    dataset=train_diff_df,\n",
+        "    target_column=target_column,\n",
+        ")\n",
+        "\n",
+        "vm_test_diff_ds = vm.init_dataset(\n",
+        "    input_id=\"test_diff_ds\",\n",
+        "    dataset=test_diff_df,\n",
+        "    target_column=target_column,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    input_id=\"train_ds\",\n",
+        "    dataset=train_df,\n",
+        "    target_column=target_column,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    input_id=\"test_ds\",\n",
+        "    dataset=test_df,\n",
+        "    target_column=target_column,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind models\n",
+        "\n",
+        "You'll also need to initialize ValidMind model objects (`vm_model`) that can be passed to other functions for analysis and tests on the data for our models.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model object with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_model_rf = vm.init_model(\n",
+        "    model_rf,\n",
+        "    input_id=\"random_forests_model\",\n",
+        ")\n",
+        "\n",
+        "vm_model_gb = vm.init_model(\n",
+        "    model_gb,\n",
+        "    input_id=\"gradient_boosting_model\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_5__'></a>\n",
+        "\n",
+        "### Assign predictions to the datasets\n",
+        "\n",
+        "You can now use the `assign_predictions()` method from the `Dataset` object to link existing predictions to any model. If no prediction values are passed, the method will compute predictions automatically:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model_rf,\n",
+        "    prediction_values=y_train_rf_pred,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_model_rf,\n",
+        "    prediction_values=y_test_rf_pred,\n",
+        ")\n",
+        "\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_model_gb,\n",
+        "    prediction_values=y_train_gb_pred,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_model_gb,\n",
+        "    prediction_values=y_test_gb_pred,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.utils import preview_test_config\n",
+        "\n",
+        "test_config = fred_timeseries.get_demo_test_config()\n",
+        "preview_test_config(test_config)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_6__'></a>\n",
+        "\n",
+        "### Run data validation tests"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.TimeSeriesDescription\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"raw_ds\", \"train_diff_ds\", \"test_diff_ds\", \"train_ds\", \"test_ds\"],\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.TimeSeriesLinePlot\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"raw_ds\"],\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.TimeSeriesMissingValues\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"raw_ds\", \"train_diff_ds\", \"test_diff_ds\", \"train_ds\", \"test_ds\"],\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.SeasonalDecompose\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"raw_ds\"],\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.TimeSeriesDescriptiveStatistics\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"train_diff_ds\", \"test_diff_ds\"],\n",
+        "    },\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.TimeSeriesOutliers\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"train_diff_ds\", \"test_diff_ds\"],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"zscore_threshold\": 4\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.TimeSeriesHistogram\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [ \"train_diff_ds\", \"test_diff_ds\"],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"nbins\": 100\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.data_validation.DatasetSplit\",\n",
+        "    inputs={\n",
+        "        \"datasets\": [\"train_diff_ds\", \"test_diff_ds\"],\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_7__'></a>\n",
+        "\n",
+        "### Run model validation tests"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.ModelMetadata\",\n",
+        "    input_grid={\n",
+        "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.RegressionErrors\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
+        "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.RegressionR2Square\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
+        "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.TimeSeriesR2SquareBySegments:train_data\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"train_ds\"],\n",
+        "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.TimeSeriesR2SquareBySegments:test_data\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"test_ds\"],\n",
+        "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
+        "    },\n",
+        "    params={\n",
+        "        \"segments\":{\n",
+        "            \"start_date\": [\"2012-11-01\",\"2018-02-01\"],\n",
+        "            \"end_date\": [\"2018-01-01\",\"2023-03-01\"]\n",
+        "        }\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.TimeSeriesPredictionsPlot\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
+        "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.TimeSeriesPredictionWithCI\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
+        "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.ModelPredictionResiduals\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
+        "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.FeatureImportance\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
+        "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.PermutationFeatureImportance\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [\"train_ds\", \"test_ds\"],\n",
+        "        \"model\": [\"random_forests_model\", \"gradient_boosting_model\"],\n",
+        "    }\n",
+        ")\n",
+        "test.log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Next steps\n",
+        "\n",
+        "You can look at the results of this test suite right in the notebook where you ran the code, as you would expect. But there is a better way — use the ValidMind Platform to work with your model documentation.\n",
+        "\n",
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Work with your documentation\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you registered earlier. (Learn more: [Working with the inventory](https://docs.validmind.ai/guide/inventory/working-with-the-inventory.html))\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Development** under Documents.\n",
+        "\n",
+        "What you see is the full draft of your documentation in a more easily consumable version. From here, you can make qualitative edits to documentation, view guidelines, collaborate with validators, and submit your documentation for approval when it's ready. (**Learn more:** [Working with documentation](https://docs.validmind.ai/guide/documentation/working-with-documentation.html))\n",
+        "\n",
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for the changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-d549f9055f374ee392fb42facfd75cb9"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "codemirror_mode": {
+        "name": "ipython",
+        "version": 3
+      },
+      "file_extension": ".py",
+      "mimetype": "text/x-python",
+      "name": "python",
+      "nbconvert_exporter": "python",
+      "pygments_lexer": "ipython3",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
 }
diff --git a/site/notebooks/use_cases/validation/validate_application_scorecard.ipynb b/site/notebooks/use_cases/validation/validate_application_scorecard.ipynb
new file mode 100644
index 0000000000..563c622a21
--- /dev/null
+++ b/site/notebooks/use_cases/validation/validate_application_scorecard.ipynb
@@ -0,0 +1,1893 @@
+{
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "# Validate an application scorecard model\n",
+        "\n",
+        "Learn how to independently assess an application scorecard model developed using the ValidMind Library as a validator. You'll evaluate the development of the model by conducting thorough testing and analysis, including the use of challenger models to benchmark performance.\n",
+        "\n",
+        "An *application scorecard model* is a type of statistical model used in credit scoring to evaluate the creditworthiness of potential borrowers by generating a score based on various characteristics of an applicant such as credit history, income, employment status, and other relevant financial data.\n",
+        "\n",
+        " - This score assists lenders in making informed decisions about whether to approve or reject loan applications, as well as in determining the terms of the loan, including interest rates and credit limits.\n",
+        " - Effective validation of application scorecard models ensures that lenders can manage risk efficiently while maintaining a fast and transparent loan application process for applicants.\n",
+        "\n",
+        "This interactive notebook provides a step-by-step guide for:\n",
+        "\n",
+        "- Verifying the data quality steps performed by the development team\n",
+        "- Independently replicating the champion's results and conducting additional tests to assess performance, stability, and robustness\n",
+        "- Setting up test inputs and challenger models for comparative analysis\n",
+        "- Running validation tests, analyzing results, and logging artifacts (findings) to ValidMind"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "::: {.content-hidden when-format=\"html\"}\n",
+        "## Contents    \n",
+        "- [About ValidMind](#toc1__)    \n",
+        "  - [Before you begin](#toc1_1__)    \n",
+        "  - [New to ValidMind?](#toc1_2__)    \n",
+        "  - [Key concepts](#toc1_3__)    \n",
+        "- [Setting up](#toc2__)    \n",
+        "  - [Register a sample model](#toc2_1__)    \n",
+        "    - [Assign validator credentials](#toc2_1_1__)    \n",
+        "    - [Apply validation report template](#toc2_1_2__)    \n",
+        "  - [Install the ValidMind Library](#toc2_2__)    \n",
+        "  - [Initialize the ValidMind Library](#toc2_3__)    \n",
+        "    - [Get your code snippet](#toc2_3_1__)    \n",
+        "  - [Importing the champion model](#toc2_4__)    \n",
+        "  - [Load the sample dataset](#toc2_5__)    \n",
+        "    - [Preprocess the dataset](#toc2_5_1__)    \n",
+        "    - [Apply feature engineering to the dataset](#toc2_5_2__)    \n",
+        "  - [Split the feature engineered dataset](#toc2_6__)    \n",
+        "- [Developing potential challenger models](#toc3__)    \n",
+        "  - [Train potential challenger models](#toc3_1__)    \n",
+        "    - [Random forest classification model](#toc3_1_1__)    \n",
+        "    - [Logistic regression model](#toc3_1_2__)    \n",
+        "  - [Extract predicted probabilities](#toc3_2__)    \n",
+        "    - [Compute binary predictions](#toc3_2_1__)    \n",
+        "- [Initializing the ValidMind objects](#toc4__)    \n",
+        "  - [Initialize the ValidMind datasets](#toc4_1__)    \n",
+        "  - [Initialize the ValidMind models](#toc4_2__)    \n",
+        "  - [Assign predictions](#toc4_3__)    \n",
+        "  - [Compute credit risk scores](#toc4_4__)    \n",
+        "- [Running data quality tests](#toc5__)    \n",
+        "  - [Identify relevant data quality tests](#toc5_1__)    \n",
+        "  - [Run and log an individual data quality test](#toc5_2__)    \n",
+        "  - [Log multiple data quality tests](#toc5_3__)    \n",
+        "  - [Run data quality comparison tests](#toc5_4__)    \n",
+        "- [Running performance tests](#toc6__)    \n",
+        "  - [Identify relevant performance tests](#toc6_1__)    \n",
+        "  - [Run and log an individual performance test](#toc6_2__)    \n",
+        "  - [Log multiple performance tests](#toc6_3__)    \n",
+        "  - [Evaluate performance of the champion model](#toc6_4__)    \n",
+        "  - [Evaluate performance of challenger models](#toc6_5__)    \n",
+        "    - [Enable custom context for test descriptions](#toc6_5_1__)    \n",
+        "    - [Run performance comparison tests](#toc6_5_2__)    \n",
+        "- [Adjust a ValidMind test](#toc7__)    \n",
+        "- [Run diagnostic tests](#toc8__)    \n",
+        "- [Run feature importance tests](#toc9__)    \n",
+        "- [Implement a custom test](#toc10__)    \n",
+        "- [Verify test runs](#toc11__)    \n",
+        "- [Next steps](#toc12__)    \n",
+        "  - [Work with your validation report](#toc12_1__)    \n",
+        "  - [Discover more learning resources](#toc12_2__)    \n",
+        "- [Upgrade ValidMind](#toc13__)    \n",
+        "\n",
+        ":::\n",
+        "<!-- jn-toc-notebook-config\n",
+        "\tnumbering=false\n",
+        "\tanchor=true\n",
+        "\tflat=false\n",
+        "\tminLevel=2\n",
+        "\tmaxLevel=4\n",
+        "\t/jn-toc-notebook-config -->\n",
+        "<!-- THIS CELL WILL BE REPLACED ON TOC UPDATE. DO NOT WRITE YOUR TEXT IN THIS CELL -->"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1__'></a>\n",
+        "\n",
+        "## About ValidMind\n",
+        "\n",
+        "ValidMind is a suite of tools for managing risk, including risk associated with AI and statistical models.\n",
+        "\n",
+        "You use the ValidMind Library to automate comparison and other validation tests, and then use the ValidMind Platform to submit compliance assessments of champions via comprehensive validation reports. Together, these products simplify risk management, facilitate compliance with regulations and institutional standards, and enhance collaboration between yourself and developers."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_1__'></a>\n",
+        "\n",
+        "### Before you begin\n",
+        "\n",
+        "This notebook assumes you have basic familiarity with Python, including an understanding of how functions work. If you are new to Python, you can still run the notebook but we recommend further familiarizing yourself with the language. \n",
+        "\n",
+        "If you encounter errors due to missing modules in your Python environment, install the modules with `pip install`, and then re-run the notebook. For more help, refer to [Installing Python Modules](https://docs.python.org/3/installing/index.html)."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_2__'></a>\n",
+        "\n",
+        "### New to ValidMind?\n",
+        "\n",
+        "If you haven't already seen our documentation on the [ValidMind Library](https://docs.validmind.ai/developer/validmind-library.html), we recommend you begin by exploring the available resources in this section. There, you can learn more about validating records such as models and running tests, as well as find code samples and our Python Library API reference.\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>For access to all features available in this notebook, you'll need access to a ValidMind account.</b></span>\n",
+        "<br></br>\n",
+        "<a href=\"https://docs.validmind.ai/guide/access/register-with-validmind.html\" style=\"color: #DE257E;\"><b>Register with ValidMind</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc1_3__'></a>\n",
+        "\n",
+        "### Key concepts\n",
+        "\n",
+        "**record**: A tool tracked in the ValidMind inventory, such as a model. Records include traditional statistical models, legacy systems, artificial intelligence/machine learning models, large language models (LLMs), agentic AI systems, and other documentable items that benefit from oversight, testing, and lifecycle management.\n",
+        "\n",
+        "**model**: [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm) (which supersedes SR 11-7) defines a model as a \"complex quantitative method, system, or approach that applies statistical, economic, or financial theories to process input data into quantitative estimates.\" Simple arithmetic, deterministic rule-based processes, or software without statistical, economic, or financial theories underpinning their design or use are generally outside SR 26-2’s definition of a model. Within ValidMind, a model is a type of record tracked in the inventory.\n",
+        "\n",
+        "**validation report**: A validation report is a comprehensive and structured review evaluating a record's accuracy, performance, and suitability for its intended purpose. A report follows established validation guidelines to ensure consistency and adherence to internal and regulatory standards — encompassing the process of risk assessment, identifying areas of potential error or risk within the record's components, supporting transparency, regulatory compliance, and informed decision-making by documenting the validator’s independent review and conclusions.\n",
+        "\n",
+        "**document template**: Lays out the structure of documents, segmented into various sections and sub-sections, and functions as a test suite specifying the tests that should be run, and how the results should be displayed. Document templates help automate your development, validation, monitoring, and other risk management processes. Document templates are available for default ValidMind document types as well as custom document types.\n",
+        "\n",
+        "**validation report template**: A default ValidMind document template that serves as a standardized framework for conducting and documenting validation, including sections designated for attaching test results, evidence, or artifacts (findings). By outlining required documentation, recommended analyses, and expected validation tests, validation report templates ensure consistency and completeness across validation reports and help guide validators through a systematic review process while promoting comparability and traceability of validation outcomes.\n",
+        "\n",
+        "**artifacts (findings)**: Observations or issues identified during validation, including any deviations from expected performance or standards. Artifacts are organized by type — default types provided by ValidMind include Validation Issue, Policy Exception, and Limitation. Custom artifact types can be created to track other categories relevant to your organization.\n",
+        "\n",
+        "**test**: A function contained in the ValidMind Library, designed to run a specific quantitative test on the dataset or record. Test results are logged to the ValidMind Platform, where they are attached to documents. Tests are the building blocks of ValidMind, used to evaluate and document records and datasets, and can be run individually or as part of a suite defined by your templates.\n",
+        "\n",
+        "**test suite**: A collection of tests designed to run together to automate and generate documentation end-to-end for specific use cases. (Learn more: [`test_suites`](https://docs.validmind.ai/validmind/validmind/test_suites.html))\n",
+        "\n",
+        "**metric**: A subset of tests that do not have thresholds. In the context of this notebook, metrics and tests can be thought of as interchangeable concepts.\n",
+        "\n",
+        "**custom test**: Functions that you define to evaluate your record or dataset. These functions can be registered with the ValidMind Library to be used in the ValidMind Platform.\n",
+        "\n",
+        "**inputs**: Objects to be evaluated and documented in the ValidMind Library. They can be any of the following:\n",
+        "\n",
+        "  - **model**: A single record that has been initialized in ValidMind with [`init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model). Despite the naming convention, model objects can be any type of record you want to test, document, validate, or monitor with ValidMind.\n",
+        "  - **dataset**: A single dataset that has been initialized in ValidMind with [`init_dataset()`](https://docs.validmind.ai/validmind/validmind.html#init_dataset).\n",
+        "  - **models**: A list of ValidMind records - usually this is used when you want to compare multiple records in your custom tests.\n",
+        "  - **datasets**: A list of ValidMind datasets - usually this is used when you want to compare multiple datasets in your custom tests. (Learn more: [Run tests with multiple datasets](https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/run_tests_that_require_multiple_datasets.html))\n",
+        "\n",
+        "**parameters**: Additional arguments that can be passed when running a ValidMind test, used to pass additional information to a test, customize its behavior, or provide additional context.\n",
+        "\n",
+        "**outputs**: Custom tests can return elements like tables or plots. Tables may be a list of dictionaries (each representing a row) or a pandas DataFrame. Plots may be matplotlib or plotly figures."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2__'></a>\n",
+        "\n",
+        "## Setting up"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1__'></a>\n",
+        "\n",
+        "### Register a sample model\n",
+        "\n",
+        "In a usual lifecycle, a champion will have been independently registered in your inventory and submitted to you for validation by your development team as part of the effective challenge process. (**Learn more:** [Submit documents](https://docs.validmind.ai/guide/documentation/submit-documents.html))\n",
+        "\n",
+        "For this notebook, we'll have you register a dummy record (model) in the ValidMind Platform inventory and assign yourself as the validator to familiarize you with the ValidMind interface and circumvent the need for an existing model:\n",
+        "\n",
+        "1. In a browser, [log in to ValidMind](https://docs.validmind.ai/guide/access/log-in-to-validmind.html).\n",
+        "\n",
+        "2. In the left sidebar, select **Inventory**.\n",
+        "\n",
+        "3. Under the **RECORD TYPE** drop-down, select `Model` and click **+ Register Model**. (Learn more: [Register records in the inventory](https://docs.validmind.ai/guide/inventory/register-records-in-inventory.html))\n",
+        "\n",
+        "4. Enter the model details and click **Next >** to continue to assignment of inventory record stakeholders.\n",
+        "\n",
+        "5. Select your own name under the **RECORD OWNER** drop-down — don’t worry, we’ll adjust these permissions next for validation.\n",
+        "\n",
+        "6. Click **Register Model** to add the model to your inventory."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1_1__'></a>\n",
+        "\n",
+        "#### Assign validator credentials\n",
+        "\n",
+        "In order to log tests as a validator instead of as a developer, on the details page that appears after you've successfully registered your sample model:\n",
+        "\n",
+        "1. Remove yourself as an owner:\n",
+        "\n",
+        "    - Click on the **OWNERS** tile.\n",
+        "    - Click the **x** next to your name to remove yourself from that model's role.\n",
+        "    - Click **Save** to apply your changes to that role.\n",
+        "\n",
+        "2. Remove yourself as a developer:\n",
+        "\n",
+        "    - Click on the **DEVELOPERS** tile.\n",
+        "    - Click the **x** next to your name to remove yourself from that model's role.\n",
+        "    - Click **Save** to apply your changes to that role.\n",
+        "\n",
+        "3. Add yourself as a validator:\n",
+        "\n",
+        "    - Click on the **VALIDATORS** tile.\n",
+        "    - Select your name from the drop-down menu.\n",
+        "    - Click **Save** to apply your changes to that role."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_1_2__'></a>\n",
+        "\n",
+        "#### Apply validation report template\n",
+        "\n",
+        "Next, let's select a validation report template. A template predefines sections for your report and provides a general outline to follow, making the validation process much easier.\n",
+        "\n",
+        "1. In the left sidebar that appears for your model, click **Documents** and select **Validation**.\n",
+        "\n",
+        "    If you cannot locate your Validation document, make sure Validation type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents))\n",
+        "\n",
+        "2. Under **TEMPLATE**, select `Generic Validation Report`.\n",
+        "\n",
+        "3. Click **Use Template** to apply the template."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_2__'></a>\n",
+        "\n",
+        "### Install the ValidMind Library\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Recommended Python versions</b></span>\n",
+        "<br></br>\n",
+        "Python 3.8 <= x <= 3.14</div>\n",
+        "\n",
+        "To install the library:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip install -q validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind Library"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_3_1__'></a>\n",
+        "\n",
+        "#### Get your code snippet\n",
+        "\n",
+        "Initialize the ValidMind Library with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the ValidMind Platform when you run the Library.\n",
+        "\n",
+        "1. On the left sidebar that appears for your model, select **Getting Started** and select `Validation` from the **DOCUMENT** drop-down menu.\n",
+        "\n",
+        "2. Click **Copy snippet to clipboard**.\n",
+        "\n",
+        "3. Next, [load your model identifier credentials from an `.env` file](https://docs.validmind.ai/developer/quickstart/store-credentials-in-env-file.html) or replace the placeholder with your own code snippet:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Load your model identifier credentials from an `.env` file\n",
+        "\n",
+        "%load_ext dotenv\n",
+        "%dotenv .env\n",
+        "\n",
+        "# Or replace with your code snippet\n",
+        "\n",
+        "import validmind as vm\n",
+        "\n",
+        "vm.init(\n",
+        "    # api_host=\"...\",\n",
+        "    # api_key=\"...\",\n",
+        "    # api_secret=\"...\",\n",
+        "    # model=\"...\",\n",
+        "    document=\"validation-report\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_4__'></a>\n",
+        "\n",
+        "### Importing the champion model\n",
+        "\n",
+        "With the ValidMind Library set up and ready to go, let's go ahead and import the champion submitted by the development team in the format of a `.pkl` file: **[xgb_model_champion.pkl](xgb_model_champion.pkl)**"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import xgboost as xgb\n",
+        "\n",
+        "# Load the saved model\n",
+        "xgb_model = xgb.XGBClassifier()\n",
+        "xgb_model.load_model(\"xgb_model_champion.pkl\")\n",
+        "xgb_model"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Ensure that we have the appropriate order of feature names between the champion model and the dataset\n",
+        "cols_when_model_builds = xgb_model.get_booster().feature_names"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_5__'></a>\n",
+        "\n",
+        "### Load the sample dataset\n",
+        "\n",
+        "Let's next import the public [Lending Club](https://www.kaggle.com/datasets/devanshi23/loan-data-2007-2014/data) dataset from Kaggle, which was used to develop the dummy champion model.\n",
+        "\n",
+        "- We'll use this dataset to review steps that should have been conducted during the initial development and documentation of the model to ensure that the model was built correctly.\n",
+        "- By independently performing steps such as preprocessing and feature engineering, we can confirm whether the model was built using appropriate and properly processed data.\n",
+        "\n",
+        "To be able to use the dataset, you'll need to import the dataset and load it into a pandas [DataFrame](https://pandas.pydata.org/docs/reference/api/pandas.DataFrame.html), a two-dimensional tabular data structure that makes use of rows and columns:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "from validmind.datasets.credit_risk import lending_club\n",
+        "\n",
+        "df = lending_club.load_data(source=\"offline\")\n",
+        "df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_5_1__'></a>\n",
+        "\n",
+        "#### Preprocess the dataset\n",
+        "\n",
+        "We'll first quickly preprocess the dataset for data quality testing purposes using `lending_club.preprocess`. This function performs the following operations:\n",
+        "\n",
+        "- Filters the dataset to include only loans for debt consolidation or credit card purposes\n",
+        "- Removes loans classified under the riskier grades \"F\" and \"G\"\n",
+        "- Excludes uncommon home ownership types and standardizes employment length and loan terms into numerical formats\n",
+        "- Discards unnecessary fields and any entries with missing information to maintain a clean and robust dataset for modeling"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "preprocess_df = lending_club.preprocess(df)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_5_2__'></a>\n",
+        "\n",
+        "#### Apply feature engineering to the dataset\n",
+        "\n",
+        "Feature engineering improves the dataset's structure to better match what our model expects, and ensures that the model performs optimally by leveraging additional insights from raw data.\n",
+        "\n",
+        "We'll apply the following transformations using the `lending_club.feature_engineering()` function to optimize the dataset for predictive modeling in our application scorecard:\n",
+        "\n",
+        "- **WoE encoding**: Converts both numerical and categorical features into Weight of Evidence (WoE) values. WoE is a statistical measure used in scorecard modeling that quantifies the relationship between a predictor variable and the binary target variable. It calculates the ratio of the distribution of good outcomes to the distribution of bad outcomes for each category or bin of a feature. This transformation helps to ensure that the features are predictive and consistent in their contribution to the model.\n",
+        "- **Integration of WoE bins**: Ensures that the WoE transformed values are integrated throughout the dataset, replacing the original feature values while excluding the target variable from this transformation. This transformation is used to maintain a consistent scale and impact of each variable within the model, which helps make the predictions more stable and accurate."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "fe_df = lending_club.feature_engineering(preprocess_df)\n",
+        "fe_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc2_6__'></a>\n",
+        "\n",
+        "### Split the feature engineered dataset\n",
+        "\n",
+        "With our dummy model imported and our independently preprocessed and feature engineered dataset ready to go, let's now **split our dataset into train and test** to start the validation testing process.\n",
+        "\n",
+        "Splitting our dataset into training and testing is essential for proper validation testing, as this helps assess how well the model generalizes to unseen data:\n",
+        "\n",
+        "- We begin by dividing our data, which is based on Weight of Evidence (WoE) features, into training and testing sets (`train_df`, `test_df`).\n",
+        "- With `lending_club.split`, we employ a simple random split, randomly allocating data points to each set to ensure a mix of examples in both."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Split the data\n",
+        "train_df, test_df = lending_club.split(fe_df, test_size=0.2)\n",
+        "\n",
+        "x_train = train_df.drop(lending_club.target_column, axis=1)\n",
+        "y_train = train_df[lending_club.target_column]\n",
+        "\n",
+        "x_test = test_df.drop(lending_club.target_column, axis=1)\n",
+        "y_test = test_df[lending_club.target_column]\n",
+        "\n",
+        "# Now let's apply the order of features from the champion model construction\n",
+        "x_train = x_train[cols_when_model_builds]\n",
+        "x_test = x_test[cols_when_model_builds]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "cols_use = ['annual_inc_woe',\n",
+        " 'verification_status_woe',\n",
+        " 'emp_length_woe',\n",
+        " 'installment_woe',\n",
+        " 'term_woe',\n",
+        " 'home_ownership_woe',\n",
+        " 'purpose_woe',\n",
+        " 'open_acc_woe',\n",
+        " 'total_acc_woe',\n",
+        " 'int_rate_woe',\n",
+        " 'sub_grade_woe',\n",
+        " 'grade_woe','loan_status']\n",
+        "\n",
+        "\n",
+        "train_df = train_df[cols_use]\n",
+        "test_df = test_df[cols_use]\n",
+        "test_df.head()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3__'></a>\n",
+        "\n",
+        "## Developing potential challenger models"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1__'></a>\n",
+        "\n",
+        "### Train potential challenger models\n",
+        "\n",
+        "We're curious how alternate models compare to our champion model, so let's train two challenger models as a basis for our testing.\n",
+        "\n",
+        "Our selected options below offer decreased complexity in terms of implementation — such as lessened manual preprocessing — which can reduce the amount of risk for implementation. However, model risk is not calculated in isolation from a single factor, but rather in consideration with trade-offs in predictive performance, ease of interpretability, and overall alignment with business objectives."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_1__'></a>\n",
+        "\n",
+        "#### Random forest classification model\n",
+        "\n",
+        "A *random forest classification model* is an ensemble machine learning algorithm that uses multiple decision trees to classify data. In ensemble learning, multiple models are combined to improve prediction accuracy and robustness.\n",
+        "\n",
+        "Random forest classification models generally have higher accuracy because they capture complex, non-linear relationships, but as a result they lack transparency in their predictions."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Import the Random Forest Classification model\n",
+        "from sklearn.ensemble import RandomForestClassifier\n",
+        "\n",
+        "# Create the model instance with 50 decision trees\n",
+        "rf_model = RandomForestClassifier(\n",
+        "    n_estimators=50,\n",
+        "    random_state=42,\n",
+        ")\n",
+        "\n",
+        "# Train the model\n",
+        "rf_model.fit(x_train, y_train)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_1_2__'></a>\n",
+        "\n",
+        "#### Logistic regression model\n",
+        "\n",
+        "A *logistic regression model* is a statistical machine learning algorithm that uses a linear equation (straight-line relationship between variables) and the logistic function (or sigmoid function, which maps any real-valued number to a range between `0` and `1`) to classify data. In statistical modeling, a single equation is used to estimate the probability of an outcome based on input features.\n",
+        "\n",
+        "Logistic regression models are simple and interpretable because they provide clear probability estimates and feature coefficients (numerical value that represents the influence of a particular input feature on the model's prediction), but they may struggle with capturing complex, non-linear relationships in the data."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Import the Logistic Regression model\n",
+        "from sklearn.linear_model import LogisticRegression\n",
+        "\n",
+        "# Logistic Regression grid params\n",
+        "log_reg_params = {\n",
+        "    \"penalty\": [\"l1\", \"l2\"],\n",
+        "    \"C\": [0.001, 0.01, 0.1, 1, 10, 100, 1000],\n",
+        "    \"solver\": [\"liblinear\"],\n",
+        "}\n",
+        "\n",
+        "# Grid search for Logistic Regression\n",
+        "from sklearn.model_selection import GridSearchCV\n",
+        "\n",
+        "grid_log_reg = GridSearchCV(LogisticRegression(), log_reg_params)\n",
+        "grid_log_reg.fit(x_train, y_train)\n",
+        "\n",
+        "# Logistic Regression best estimator\n",
+        "log_reg = grid_log_reg.best_estimator_\n",
+        "log_reg"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2__'></a>\n",
+        "\n",
+        "### Extract predicted probabilities\n",
+        "\n",
+        "With our challenger models trained, let's extract the predicted probabilities from our three models:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Champion — Application scorecard model\n",
+        "train_xgb_prob = xgb_model.predict_proba(x_train)[:, 1]\n",
+        "test_xgb_prob = xgb_model.predict_proba(x_test)[:, 1]\n",
+        "\n",
+        "# Challenger — Random forest classification model\n",
+        "train_rf_prob = rf_model.predict_proba(x_train)[:, 1]\n",
+        "test_rf_prob = rf_model.predict_proba(x_test)[:, 1]\n",
+        "\n",
+        "# Challenger — Logistic regression model\n",
+        "train_log_prob = log_reg.predict_proba(x_train)[:, 1]\n",
+        "test_log_prob = log_reg.predict_proba(x_test)[:, 1]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc3_2_1__'></a>\n",
+        "\n",
+        "#### Compute binary predictions\n",
+        "\n",
+        "Next, we'll convert the probability predictions from our three models into binary predictions, based on a threshold of `0.3`:\n",
+        "\n",
+        "- If the probability is greater than `0.3`, the prediction becomes `1` (positive).\n",
+        "- Otherwise, it becomes `0` (negative)."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "cut_off_threshold = 0.3\n",
+        "\n",
+        "# Champion — Application scorecard model\n",
+        "train_xgb_binary_predictions = (train_xgb_prob > cut_off_threshold).astype(int)\n",
+        "test_xgb_binary_predictions = (test_xgb_prob > cut_off_threshold).astype(int)\n",
+        "\n",
+        "# Challenger — Random forest classification model\n",
+        "train_rf_binary_predictions = (train_rf_prob > cut_off_threshold).astype(int)\n",
+        "test_rf_binary_predictions = (test_rf_prob > cut_off_threshold).astype(int)\n",
+        "\n",
+        "# Challenger — Logistic regression model\n",
+        "train_log_binary_predictions = (train_log_prob > cut_off_threshold).astype(int)\n",
+        "test_log_binary_predictions = (test_log_prob > cut_off_threshold).astype(int)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4__'></a>\n",
+        "\n",
+        "## Initializing the ValidMind objects"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_1__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind datasets\n",
+        "\n",
+        "Before you can run tests, you'll need to connect your data with a ValidMind `Dataset` object. **This step is necessary every time you want to connect a dataset to documentation and produce test results through ValidMind,** but you only need to do it once per dataset.\n",
+        "\n",
+        "Initialize a ValidMind dataset object using the [`init_dataset` function](https://docs.validmind.ai/validmind/validmind.html#init_dataset) from the ValidMind (`vm`) module. For this example, we'll pass in the following arguments:\n",
+        "\n",
+        "- **`dataset`** — The raw dataset that you want to provide as input to tests.\n",
+        "- **`input_id`** — A unique identifier that allows tracking what inputs are used when running each individual test.\n",
+        "- **`target_column`** — A required argument if tests require access to true values. This is the name of the target column in the dataset."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Initialize the raw dataset\n",
+        "vm_raw_dataset = vm.init_dataset(\n",
+        "    dataset=df,\n",
+        "    input_id=\"raw_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "# Initialize the preprocessed dataset\n",
+        "vm_preprocess_dataset = vm.init_dataset(\n",
+        "    dataset=preprocess_df,\n",
+        "    input_id=\"preprocess_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "# Initialize the feature engineered dataset\n",
+        "vm_fe_dataset = vm.init_dataset(\n",
+        "    dataset=fe_df,\n",
+        "    input_id=\"fe_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "# Initialize the training dataset\n",
+        "vm_train_ds = vm.init_dataset(\n",
+        "    dataset=train_df,\n",
+        "    input_id=\"train_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")\n",
+        "\n",
+        "# Initialize the test dataset\n",
+        "vm_test_ds = vm.init_dataset(\n",
+        "    dataset=test_df,\n",
+        "    input_id=\"test_dataset\",\n",
+        "    target_column=lending_club.target_column,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "After initialization, you can pass the ValidMind `Dataset` objects `vm_raw_dataset`, `vm_preprocess_dataset`, `vm_fe_dataset`, `vm_train_ds`, and `vm_test_ds` into any ValidMind tests."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_2__'></a>\n",
+        "\n",
+        "### Initialize the ValidMind models\n",
+        "\n",
+        "You'll also need to initialize ValidMind model objects (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our three models.\n",
+        "\n",
+        "- Despite the naming convention, ValidMind model objects can be any type of record you want to test, document, validate, or monitor with the ValidMind Library.\n",
+        "- From classical statistical and machine learning models, to generative and agentic AI systems and more, the ValidMind model object provides a consistent wrapper around your record so it can be passed as a unified input to any ValidMind test or test suite, with results sent directly to the ValidMind Platform.\n",
+        "\n",
+        "Initialize your model objects with [`vm.init_model()`](https://docs.validmind.ai/validmind/validmind.html#init_model):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Initialize the champion application scorecard model\n",
+        "vm_xgb_model = vm.init_model(\n",
+        "    xgb_model,\n",
+        "    input_id=\"xgb_model_developer_champion\",\n",
+        ")\n",
+        "\n",
+        "# Initialize the challenger random forest classification model\n",
+        "vm_rf_model = vm.init_model(\n",
+        "    rf_model,\n",
+        "    input_id=\"rf_model\",\n",
+        ")\n",
+        "\n",
+        "# Initialize the challenger logistic regression model\n",
+        "vm_log_model = vm.init_model(\n",
+        "    log_reg,\n",
+        "    input_id=\"log_model\",\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_3__'></a>\n",
+        "\n",
+        "### Assign predictions\n",
+        "\n",
+        "With our models registered, we'll move on to assigning both the predictive probabilities coming directly from each model's predictions, and the binary prediction after applying the cutoff threshold described in the Compute binary predictions step above.\n",
+        "\n",
+        "- The [`assign_predictions()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#VMDataset.assign_predictions) from the `Dataset` object can link existing predictions to any number of models.\n",
+        "- This method links the model's class prediction values and probabilities to our `vm_train_ds` and `vm_test_ds` datasets."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Champion — Application scorecard model\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_xgb_model,\n",
+        "    prediction_values=train_xgb_binary_predictions,\n",
+        "    prediction_probabilities=train_xgb_prob,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_xgb_model,\n",
+        "    prediction_values=test_xgb_binary_predictions,\n",
+        "    prediction_probabilities=test_xgb_prob,\n",
+        ")\n",
+        "\n",
+        "# Challenger — Random forest classification model\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_rf_model,\n",
+        "    prediction_values=train_rf_binary_predictions,\n",
+        "    prediction_probabilities=train_rf_prob,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_rf_model,\n",
+        "    prediction_values=test_rf_binary_predictions,\n",
+        "    prediction_probabilities=test_rf_prob,\n",
+        ")\n",
+        "\n",
+        "\n",
+        "# Challenger — Logistic regression model\n",
+        "vm_train_ds.assign_predictions(\n",
+        "    model=vm_log_model,\n",
+        "    prediction_values=train_log_binary_predictions,\n",
+        "    prediction_probabilities=train_log_prob,\n",
+        ")\n",
+        "\n",
+        "vm_test_ds.assign_predictions(\n",
+        "    model=vm_log_model,\n",
+        "    prediction_values=test_log_binary_predictions,\n",
+        "    prediction_probabilities=test_log_prob,\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc4_4__'></a>\n",
+        "\n",
+        "### Compute credit risk scores\n",
+        "\n",
+        "Finally, we'll translate model predictions into actionable scores using probability estimates generated by our trained models:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Compute the scores\n",
+        "train_xgb_scores = lending_club.compute_scores(train_xgb_prob)\n",
+        "test_xgb_scores = lending_club.compute_scores(test_xgb_prob)\n",
+        "train_rf_scores = lending_club.compute_scores(train_rf_prob)\n",
+        "test_rf_scores = lending_club.compute_scores(test_rf_prob)\n",
+        "train_log_scores = lending_club.compute_scores(train_log_prob)\n",
+        "test_log_scores = lending_club.compute_scores(test_log_prob)\n",
+        "\n",
+        "# Assign scores to the datasets\n",
+        "vm_train_ds.add_extra_column(\"xgb_scores\", train_xgb_scores)\n",
+        "vm_test_ds.add_extra_column(\"xgb_scores\", test_xgb_scores)\n",
+        "vm_train_ds.add_extra_column(\"rf_scores\", train_rf_scores)\n",
+        "vm_test_ds.add_extra_column(\"rf_scores\", test_rf_scores)\n",
+        "vm_train_ds.add_extra_column(\"log_scores\", train_log_scores)\n",
+        "vm_test_ds.add_extra_column(\"log_scores\", test_log_scores)"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5__'></a>\n",
+        "\n",
+        "## Running data quality tests\n",
+        "\n",
+        "With everything ready to go, let's explore some of ValidMind's available tests. Using ValidMind’s repository of tests streamlines your validation testing, and helps you ensure that your records are being validated appropriately."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_1__'></a>\n",
+        "\n",
+        "### Identify relevant data quality tests\n",
+        "\n",
+        "We want to narrow down the tests we want to run from the selection provided by ValidMind, so we'll use the [`vm.tests.list_tasks_and_tags()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tasks_and_tags) to list which `tags` are associated with each `task` type:\n",
+        "\n",
+        "- **`tasks`** represent the kind of modeling task associated with a test. Here we'll focus on `classification` tasks.\n",
+        "- **`tags`** are free-form descriptions providing more details about the test, for example, what category the test falls into. Here we'll focus on the `data_quality` tag."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tasks_and_tags()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Then we'll call [the `vm.tests.list_tests()` function](https://docs.validmind.ai/validmind/validmind/tests.html#list_tests) to list all the data quality tests for classification:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests(\n",
+        "    tags=[\"data_quality\"], task=\"classification\"\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about navigating ValidMind tests?</b></span>\n",
+        "<br></br>\n",
+        "Refer to our notebook outlining the utilities available for viewing and understanding available ValidMind tests: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/explore_tests/explore_tests.html\" style=\"color: #DE257E;\"><b>Explore tests</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_2__'></a>\n",
+        "\n",
+        "### Run and log an individual data quality test\n",
+        "\n",
+        "Next, we'll use our previously initialized preprocessed dataset (`vm_preprocess_dataset`) as input to run an individual test, then log the result to the ValidMind Platform.\n",
+        "\n",
+        "- You run validation tests by calling [the `run_test` function](https://docs.validmind.ai/validmind/validmind/tests.html#run_test) provided by the `validmind.tests` module.\n",
+        "- Every test result returned by the `run_test()` function has a [`.log()` method](https://docs.validmind.ai/validmind/validmind/vm_models.html#TestResult.log) that can be used to send the test results to the ValidMind Platform.\n",
+        "\n",
+        "Here, we'll use the `data_validation.HighPearsonCorrelation` test as an example:\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.data_validation.HighPearsonCorrelation\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_preprocess_dataset\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Note the output returned indicating that a test-driven block doesn't currently exist in your documentation for some test IDs. </b></span>\n",
+        "<br></br>\n",
+        "That's expected, as when we run validation tests, the results logged need to be manually added to your report as part of your compliance assessment process within the ValidMind Platform. You'll continue to see this message throughout this notebook as we run and log more tests.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_3__'></a>\n",
+        "\n",
+        "### Log multiple data quality tests\n",
+        "\n",
+        "Now that we understand how to run a test with ValidMind, we want to run all the tests that were returned for our `classification` tasks focusing on `data_quality`.\n",
+        "\n",
+        "We'll store the identified tests in `dq` in preparation for batch running these tests and logging their results to the ValidMind Platform:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "dq = vm.tests.list_tests(tags=[\"data_quality\"], task=\"classification\",pretty=False)\n",
+        "dq"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "With our data quality tests stored, let's run our first batch of tests using the same preprocessed dataset (`vm_preprocess_dataset`) and log their results."
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "for test in dq:\n",
+        "    vm.tests.run_test(\n",
+        "        test,\n",
+        "        inputs={\n",
+        "            \"dataset\": vm_preprocess_dataset\n",
+        "        }\n",
+        "    ).log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc5_4__'></a>\n",
+        "\n",
+        "### Run data quality comparison tests\n",
+        "\n",
+        "Next, let's reuse the tests in `dq` to perform comparison tests between the raw (`vm_raw_dataset`) and preprocessed (`vm_preprocess_dataset`) dataset, again logging the results to the ValidMind Platform:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "for test in dq:\n",
+        "    vm.tests.run_test(\n",
+        "        test,\n",
+        "        input_grid={\n",
+        "            \"dataset\": [vm_raw_dataset,vm_preprocess_dataset]\n",
+        "        }\n",
+        "    ).log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6__'></a>\n",
+        "\n",
+        "## Running performance tests\n",
+        "\n",
+        "We'll also run some performance tests, beginning with independent testing of our champion application scorecard model, then moving on to our potential challenger models."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_1__'></a>\n",
+        "\n",
+        "### Identify relevant performance tests\n",
+        "\n",
+        "This time, use `vm.tests.list_tests()` to identify all the model performance tests for classification:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "\n",
+        "vm.tests.list_tests(tags=[\"model_performance\"], task=\"classification\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_2__'></a>\n",
+        "\n",
+        "### Run and log an individual performance test\n",
+        "\n",
+        "Before we run our batch of performance tests, we'll use our previously initialized testing dataset (`vm_test_ds`) as input to run an individual test, then log the result to the ValidMind Platform.\n",
+        "\n",
+        "When running individual tests, you can use a custom `result_id` to tag the individual result with a unique identifier by appending this `result_id` to the `test_id` with a `:` separator. We'll append an identifier for our champion model here (`xgboost_champion`).\n",
+        "\n",
+        "Here, we'll use the `model_validation.sklearn.ClassifierPerformance` test as an example:\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.model_validation.sklearn.ClassifierPerformance:xgboost_champion\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_ds, \"model\" : vm_xgb_model\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_3__'></a>\n",
+        "\n",
+        "### Log multiple performance tests\n",
+        "\n",
+        "We only want to run a few other tests that were returned for our `classification` tasks focusing on `model_performance`, so we'll isolate the specific tests we want to batch run in `mpt`:\n",
+        "\n",
+        "- `model_validation.sklearn.ClassifierPerformance`\n",
+        "- `model_validation.sklearn.ConfusionMatrix`\n",
+        "- `model_validation.sklearn.MinimumAccuracy`\n",
+        "- `model_validation.sklearn.MinimumF1Score`\n",
+        "- `model_validation.sklearn.ROCCurve`\n",
+        "\n",
+        "Note the custom `result_id`s appended to the `test_id`s for our champion model (`xgboost_champion`):\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "mpt = [\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:xgboost_champion\",\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix:xgboost_champion\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy:xgboost_champion\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score:xgboost_champion\",\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve:xgboost_champion\"\n",
+        "]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_4__'></a>\n",
+        "\n",
+        "### Evaluate performance of the champion model\n",
+        "\n",
+        "Now, let's run and log our batch of model performance tests using our testing dataset (`vm_test_ds`) for our champion model:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "for test in mpt:\n",
+        "    vm.tests.run_test(\n",
+        "        test,\n",
+        "        inputs={\n",
+        "            \"dataset\": vm_test_ds, \"model\" : vm_xgb_model\n",
+        "        },\n",
+        "    ).log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_5__'></a>\n",
+        "\n",
+        "### Evaluate performance of challenger models\n",
+        "\n",
+        "We've now conducted tests on our champion similar to those run by the development team, with the aim of verifying their test results.\n",
+        "\n",
+        "Next, let's see how our challenger models compare. We'll use the same batch of tests here as we did in `mpt`, but append a different `result_id` to indicate that these results should be associated with our challenger models:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "mpt_chall = [\n",
+        "    \"validmind.model_validation.sklearn.ClassifierPerformance:xgboost_champion_vs_challengers\",\n",
+        "    \"validmind.model_validation.sklearn.ConfusionMatrix:xgboost_champion_vs_challengers\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumAccuracy:xgboost_champion_vs_challengers\",\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score:xgboost_champion_vs_challengers\",\n",
+        "    \"validmind.model_validation.sklearn.ROCCurve:xgboost_champion_vs_challengers\"\n",
+        "]"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_5_1__'></a>\n",
+        "\n",
+        "#### Enable custom context for test descriptions"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "When you run ValidMind tests, test descriptions are automatically generated with an LLM using the test results, the test name, and the static test definitions provided in the test’s docstring. While this metadata offers valuable high-level overviews of tests, insights produced by the LLM-based descriptions may not always align with your specific use cases or incorporate organizational policy requirements.\n",
+        "\n",
+        "Before we run our next batch of tests, we'll include some custom use case context to focus on comparison testing going forward, improving the relevancy, insight, and format of the test descriptions returned. By default, custom context for LLM-generated descriptions is disabled, meaning that the output will not include any additional context. To enable custom use case context, set the `VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED` environment variable to `1`.\n",
+        "\n",
+        "This is a global setting that will affect all tests for your linked model:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import os\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\""
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Enabling use case context allows you to pass in additional context to the LLM-generated text descriptions within `context`:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import os\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT_ENABLED\"] = \"1\"\n",
+        "\n",
+        "context = \"\"\"\n",
+        "FORMAT FOR THE LLM DESCRIPTIONS: \n",
+        "    **<Test Name>** is designed to <begin with a concise overview of what the test does and its primary purpose, \n",
+        "    extracted from the test description>.\n",
+        "\n",
+        "    The test operates by <write a paragraph about the test mechanism, explaining how it works and what it measures. \n",
+        "    Include any relevant formulas or methodologies mentioned in the test description.>\n",
+        "\n",
+        "    The primary advantages of this test include <write a paragraph about the test's strengths and capabilities, \n",
+        "    highlighting what makes it particularly useful for specific scenarios.>\n",
+        "\n",
+        "    Users should be aware that <write a paragraph about the test's limitations and potential risks. \n",
+        "    Include both technical limitations and interpretation challenges. \n",
+        "    If the test description includes specific signs of high risk, incorporate these here.>\n",
+        "\n",
+        "    **Key Insights:**\n",
+        "\n",
+        "    The test results reveal:\n",
+        "\n",
+        "    - **<insight title>**: <comprehensive description of one aspect of the results>\n",
+        "    - **<insight title>**: <comprehensive description of another aspect>\n",
+        "    ...\n",
+        "\n",
+        "    Based on these results, <conclude with a brief paragraph that ties together the test results with the test's \n",
+        "    purpose and provides any final recommendations or considerations.>\n",
+        "\n",
+        "ADDITIONAL INSTRUCTIONS:\n",
+        "\n",
+        "    The champion model as the basis for comparison is called \"xgb_model_developer_champion\" and emphasis should be on the following:\n",
+        "    - The metrics for the champion model compared against the challenger models\n",
+        "    - Which model potentially outperforms the champion model based on the metrics, this should be highlighted and emphasized\n",
+        "\n",
+        "\n",
+        "    For each metric in the test results, include in the test overview:\n",
+        "    - The metric's purpose and what it measures\n",
+        "    - Its mathematical formula\n",
+        "    - The range of possible values\n",
+        "    - What constitutes good/bad performance\n",
+        "    - How to interpret different values\n",
+        "\n",
+        "    Each insight should progressively cover:\n",
+        "    1. Overall scope and distribution\n",
+        "    2. Complete breakdown of all elements with specific values\n",
+        "    3. Natural groupings and patterns\n",
+        "    4. Comparative analysis between datasets/categories\n",
+        "    5. Stability and variations\n",
+        "    6. Notable relationships or dependencies\n",
+        "\n",
+        "    Remember:\n",
+        "    - Champion model (xgb_model_developer_champion) is the selection and challenger models are used to challenge the selection\n",
+        "    - Keep all insights at the same level (no sub-bullets or nested structures)\n",
+        "    - Make each insight complete and self-contained\n",
+        "    - Include specific numerical values and ranges\n",
+        "    - Cover all elements in the results comprehensively\n",
+        "    - Maintain clear, concise language\n",
+        "    - Use only \"- **Title**: Description\" format for insights\n",
+        "    - Progress naturally from general to specific observations\n",
+        "\n",
+        "\"\"\".strip()\n",
+        "\n",
+        "os.environ[\"VALIDMIND_LLM_DESCRIPTIONS_CONTEXT\"] = context"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about setting custom context for LLM-generated test descriptions?</b></span>\n",
+        "<br></br>\n",
+        "Refer to our extended walkthrough notebook: <a href=\"https://docs.validmind.ai/notebooks/how_to/tests/run_tests/configure_tests/customize_test_result_descriptions.html\" style=\"color: #DE257E;\"><b>Add context to LLM-generated test descriptions\n",
+        "</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc6_5_2__'></a>\n",
+        "\n",
+        "#### Run performance comparison tests\n",
+        "\n",
+        "With the use case context set, we'll run each test in `mpt_chall` once for each model with the same `vm_test_ds` dataset to compare them:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "for test in mpt_chall:\n",
+        "    vm.tests.run_test(\n",
+        "        test,\n",
+        "        input_grid={\n",
+        "            \"dataset\": [vm_test_ds], \"model\" : [vm_xgb_model,vm_log_model,vm_rf_model]\n",
+        "        }\n",
+        "    ).log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Based on the performance metrics, we can conclude that the random forest classification model is not a viable candidate for our use case and can be disregarded in our tests going forward.</b></span>\n",
+        "<br></br>\n",
+        "In the next section, we'll dive a bit deeper into some tests comparing our champion application scorecard model and our remaining challenger logistic regression model, including tests that will allow us to customize parameters and thresholds for performance standards.</div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc7__'></a>\n",
+        "\n",
+        "## Adjust a ValidMind test\n",
+        "\n",
+        "Let's dig deeper into the `model_validation.sklearn.MinimumF1Score` test we ran previously in Run performance tests to ensure that the models maintain a minimum acceptable balance between *precision* and *recall*. Precision refers to how many out of the positive predictions made by the model were actually correct, and recall refers to how many out of the actual positive cases did the model correctly identify.\n",
+        "\n",
+        "Use `run_test()` with our testing dataset (`vm_test_ds`) to run the test in isolation again for our two remaining models, without logging the result, so that we have a baseline output to compare with a subsequent iteration:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score:xgboost_champion_vs_challengers\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model, vm_log_model]\n",
+        "    },\n",
+        ")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "As `model_validation.sklearn.MinimumF1Score` allows us to customize parameters and thresholds for performance standards, let's adjust the threshold to see if it improves metrics:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = vm.tests.run_test(\n",
+        "    \"validmind.model_validation.sklearn.MinimumF1Score:AdjThreshold\",\n",
+        "    input_grid={\n",
+        "        \"dataset\": [vm_test_ds],\n",
+        "        \"model\": [vm_xgb_model, vm_log_model],\n",
+        "        \"params\": {\"min_threshold\": 0.35}\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc8__'></a>\n",
+        "\n",
+        "## Run diagnostic tests\n",
+        "\n",
+        "Next, we want to compare the robustness and stability of our champion and challenger models.\n",
+        "\n",
+        "Use `list_tests()` to list all available diagnosis tests applicable to classification tasks:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.list_tests(tags=[\"model_diagnosis\"], task=\"classification\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's see if the models show any potential for *overfitting*, and identify any sub-segments where issues may exist, with the `model_validation.sklearn.OverfitDiagnosis` test.\n",
+        "\n",
+        "Overfitting occurs when a model learns the training data too well, capturing not only the true pattern but also noise and random fluctuations, resulting in excellent performance on the training dataset but poor generalization to new, unseen data.\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.model_validation.sklearn.OverfitDiagnosis:Champion_vs_LogRegression\",\n",
+        "    input_grid={\n",
+        "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
+        "        \"model\" : [vm_xgb_model,vm_log_model]\n",
+        "    }\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Let's also conduct *robustness* and *stability* testing of the two models with the `model_validation.sklearn.RobustnessDiagnosis` test.\n",
+        "\n",
+        "Robustness refers to a model's ability to maintain consistent performance, and stability refers to a model's ability to produce consistent outputs over time across different data subsets.\n"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "vm.tests.run_test(\n",
+        "    test_id=\"validmind.model_validation.sklearn.RobustnessDiagnosis:Champion_vs_LogRegression\",\n",
+        "    input_grid={\n",
+        "        \"datasets\": [[vm_train_ds,vm_test_ds]],\n",
+        "        \"model\" : [vm_xgb_model,vm_log_model]\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc9__'></a>\n",
+        "\n",
+        "## Run feature importance tests\n",
+        "\n",
+        "We also want to verify the relative influence of different input features on our models' predictions, as well as inspect the differences between our champion and challenger model to see if a certain model offers more understandable or logical importance scores for features.\n",
+        "\n",
+        "Use `list_tests()` to identify all the feature importance tests for classification:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Store the feature importance tests\n",
+        "FI = vm.tests.list_tests(tags=[\"feature_importance\"], task=\"classification\",pretty=False)\n",
+        "FI"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "# Run and log our feature importance tests for both models for the testing dataset\n",
+        "for test in FI:\n",
+        "    vm.tests.run_test(\n",
+        "        \"\".join((test,':Champion_vs_LogisticRegression')),\n",
+        "        input_grid={\n",
+        "            \"dataset\": [vm_test_ds], \"model\" : [vm_xgb_model,vm_log_model]\n",
+        "        },\n",
+        "    ).log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc10__'></a>\n",
+        "\n",
+        "## Implement a custom test\n",
+        "\n",
+        "Let's finish up testing by implementing a custom *inline test* that outputs a FICO-style score. An inline test refers to a test written and executed within the same environment as the code being tested — in this case, right in this Jupyter Notebook — without requiring a separate test file or framework.\n",
+        "\n",
+        "The [`@vm.test` wrapper](https://docs.validmind.ai/validmind/validmind.html#test) allows you to create a reusable test:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "import numpy as np\n",
+        "import pandas as pd\n",
+        "import plotly.graph_objects as go\n",
+        "\n",
+        "@vm.test(\"my_custom_tests.ScoreToOdds\")\n",
+        "def score_to_odds_analysis(dataset, score_column='score', score_bands=[410, 440, 470]):\n",
+        "    \"\"\"\n",
+        "    Analyzes the relationship between score bands and odds (good:bad ratio).\n",
+        "    Good odds = (1 - default_rate) / default_rate\n",
+        "    \n",
+        "    Higher scores should correspond to higher odds of being good.\n",
+        "\n",
+        "    If there are multiple scores provided through score_column, this means that there are two different models and the scores reflect each model\n",
+        "\n",
+        "    If there are more scores provided in the score_column then focus the assessment on the differences between the two scores and indicate through evidence which one is preferred.\n",
+        "    \"\"\"\n",
+        "    df = dataset.df\n",
+        "    \n",
+        "    # Create score bands\n",
+        "    df['score_band'] = pd.cut(\n",
+        "        df[score_column],\n",
+        "        bins=[-np.inf] + score_bands + [np.inf],\n",
+        "        labels=[f'<{score_bands[0]}'] + \n",
+        "               [f'{score_bands[i]}-{score_bands[i+1]}' for i in range(len(score_bands)-1)] +\n",
+        "               [f'>{score_bands[-1]}']\n",
+        "    )\n",
+        "    \n",
+        "    # Calculate metrics per band\n",
+        "    results = df.groupby('score_band').agg({\n",
+        "        dataset.target_column: ['mean', 'count']\n",
+        "    })\n",
+        "    \n",
+        "    results.columns = ['Default Rate', 'Total']\n",
+        "    results['Good Count'] = results['Total'] - (results['Default Rate'] * results['Total'])\n",
+        "    results['Bad Count'] = results['Default Rate'] * results['Total']\n",
+        "    results['Odds'] = results['Good Count'] / results['Bad Count']\n",
+        "    \n",
+        "    # Create visualization\n",
+        "    fig = go.Figure()\n",
+        "    \n",
+        "    # Add odds bars\n",
+        "    fig.add_trace(go.Bar(\n",
+        "        name='Odds (Good:Bad)',\n",
+        "        x=results.index,\n",
+        "        y=results['Odds'],\n",
+        "        marker_color='blue'\n",
+        "    ))\n",
+        "    \n",
+        "    fig.update_layout(\n",
+        "        title='Score-to-Odds Analysis',\n",
+        "        yaxis=dict(title='Odds Ratio (Good:Bad)'),\n",
+        "        showlegend=False\n",
+        "    )\n",
+        "    \n",
+        "    return fig"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "With the custom test available, run and log the test for our champion and challenger models with our testing dataset (`vm_test_ds`):"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "result = vm.tests.run_test(\n",
+        "    \"my_custom_tests.ScoreToOdds:Champion_vs_Challenger\",\n",
+        "    inputs={\n",
+        "        \"dataset\": vm_test_ds,\n",
+        "    },\n",
+        "    param_grid={\n",
+        "        \"score_column\": [\"xgb_scores\",\"log_scores\"],\n",
+        "        \"score_bands\": [[500, 540, 570]],\n",
+        "    },\n",
+        ").log()"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\"><span style=\"color: #083E44;\"><b>Want to learn more about custom tests?</b></span>\n",
+        "<br></br>\n",
+        "Refer to our in-depth introduction to custom tests: <a href=\"../../how_to/tests/custom_tests/implement_custom_tests.ipynb\" style=\"color: #DE257E;\"><b>Implement custom tests</b></a></div>"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc11__'></a>\n",
+        "\n",
+        "## Verify test runs\n",
+        "\n",
+        "Our final task is to verify that all the tests provided by the development team were run and reported accurately. Note the appended `result_ids` to delineate which dataset we ran the test with for the relevant tests.\n",
+        "\n",
+        "Here, we'll specify all the tests we'd like to independently rerun in a dictionary called `test_config`. **Note here that `inputs` and `input_grid` expect the `input_id` of the dataset or model as the value rather than the variable name we specified**:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "test_config = {\n",
+        "    # Run with the raw dataset\n",
+        "    'validmind.data_validation.DatasetDescription:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.DescriptiveStatistics:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.MissingValues:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percentage_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.ClassImbalance:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percent_threshold': 10}\n",
+        "    },\n",
+        "    'validmind.data_validation.Duplicates:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.HighCardinality:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {\n",
+        "            'num_threshold': 100,\n",
+        "            'percent_threshold': 0.1,\n",
+        "            'threshold_type': 'percent'\n",
+        "        }\n",
+        "    },\n",
+        "    'validmind.data_validation.Skewness:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'max_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.UniqueRows:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'min_percent_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TooManyZeroValues:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'max_percent_threshold': 0.03}\n",
+        "    },\n",
+        "    'validmind.data_validation.IQROutliersTable:raw_data': {\n",
+        "        'inputs': {'dataset': 'raw_dataset'},\n",
+        "        'params': {'threshold': 5}\n",
+        "    },\n",
+        "    # Run with the preprocessed dataset\n",
+        "    'validmind.data_validation.DescriptiveStatistics:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularDescriptionTables:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.MissingValues:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'},\n",
+        "        'params': {'min_percentage_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularNumericalHistograms:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularCategoricalBarPlots:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'}\n",
+        "    },\n",
+        "    'validmind.data_validation.TargetRateBarPlots:preprocessed_data': {\n",
+        "        'inputs': {'dataset': 'preprocess_dataset'},\n",
+        "        'params': {'default_column': 'loan_status'}\n",
+        "    },\n",
+        "    # Run with the training and test datasets\n",
+        "    'validmind.data_validation.DescriptiveStatistics:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularDescriptionTables:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
+        "    },\n",
+        "    'validmind.data_validation.ClassImbalance:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
+        "        'params': {'min_percent_threshold': 10}\n",
+        "    },\n",
+        "    'validmind.data_validation.UniqueRows:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
+        "        'params': {'min_percent_threshold': 1}\n",
+        "    },\n",
+        "    'validmind.data_validation.TabularNumericalHistograms:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
+        "    },\n",
+        "    'validmind.data_validation.MutualInformation:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
+        "        'params': {'min_threshold': 0.01}\n",
+        "    },\n",
+        "    'validmind.data_validation.PearsonCorrelationMatrix:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']}\n",
+        "    },\n",
+        "    'validmind.data_validation.HighPearsonCorrelation:development_data': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset']},\n",
+        "        'params': {'max_threshold': 0.3, 'top_n_correlations': 10}\n",
+        "    },\n",
+        "    'validmind.model_validation.ModelMetadata': {\n",
+        "        'input_grid': {'model': ['xgb_model_developer_champion', 'rf_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ModelParameters': {\n",
+        "        'input_grid': {'model': ['xgb_model_developer_champion', 'rf_model']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.ROCCurve': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model_developer_champion']}\n",
+        "    },\n",
+        "    'validmind.model_validation.sklearn.MinimumROCAUCScore': {\n",
+        "        'input_grid': {'dataset': ['train_dataset', 'test_dataset'], 'model': ['xgb_model_developer_champion']},\n",
+        "        'params': {'min_threshold': 0.5}\n",
+        "    }\n",
+        "}"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "Then batch run and log our tests in `test_config`:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "for t in test_config:\n",
+        "    print(t)\n",
+        "    try:\n",
+        "        # Check if test has input_grid\n",
+        "        if 'input_grid' in test_config[t]:\n",
+        "            # For tests with input_grid, pass the input_grid configuration\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, input_grid=test_config[t]['input_grid']).log()\n",
+        "        else:\n",
+        "            # Original logic for regular inputs\n",
+        "            if 'params' in test_config[t]:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs'], params=test_config[t]['params']).log()\n",
+        "            else:\n",
+        "                vm.tests.run_test(t, inputs=test_config[t]['inputs']).log()\n",
+        "    except Exception as e:\n",
+        "        print(f\"Error running test {t}: {str(e)}\")"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc12__'></a>\n",
+        "\n",
+        "## Next steps"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc12_1__'></a>\n",
+        "\n",
+        "### Work with your validation report\n",
+        "\n",
+        "Now that you've logged all your test results and verified the work done by the development team, head to the ValidMind Platform to wrap up your validation report:\n",
+        "\n",
+        "1. From the **Inventory** in the ValidMind Platform, go to the model you connected to earlier.\n",
+        "\n",
+        "2. In the left sidebar that appears for your model, click **Validation** under Documents.\n",
+        "\n",
+        "Include your logged test results as evidence, create risk assessment notes, add artifacts, and assess compliance, then submit your report for review when it's ready. (**Learn more:** [Preparing validation reports](https://docs.validmind.ai/guide/validation/preparing-validation-reports.html))"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc12_2__'></a>\n",
+        "\n",
+        "### Discover more learning resources\n",
+        "\n",
+        "We also offer many interactive notebooks to help you use the ValidMind Library to streamline your work:\n",
+        "\n",
+        "- [Run tests & test suites](https://docs.validmind.ai/developer/how-to/testing-overview.html)\n",
+        "- [Use ValidMind Library features](https://docs.validmind.ai/developer/how-to/feature-overview.html)\n",
+        "- [Code samples by use case](https://docs.validmind.ai/developer/samples-jupyter-notebooks.html)\n",
+        "\n",
+        "Or, visit our [documentation](https://docs.validmind.ai/) to learn more about ValidMind."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<a id='toc13__'></a>\n",
+        "\n",
+        "## Upgrade ValidMind\n",
+        "\n",
+        "<div class=\"alert alert-block alert-info\" style=\"background-color: #B5B5B510; color: black; border: 1px solid #083E44; border-left-width: 5px; box-shadow: 2px 2px 4px rgba(0, 0, 0, 0.2);border-radius: 5px;\">After installing ValidMind, you’ll want to periodically make sure you are on the latest version to access any new features and other enhancements.</div>\n",
+        "\n",
+        "Retrieve the information for the currently installed version of ValidMind:"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {},
+      "source": [
+        "%pip show validmind"
+      ],
+      "execution_count": null,
+      "outputs": []
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "If the version returned is lower than the version indicated in our [production open-source code](https://github.com/validmind/validmind-library/blob/prod/validmind/__version__.py), restart your notebook and run:\n",
+        "\n",
+        "```bash\n",
+        "%pip install --upgrade validmind\n",
+        "```"
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "You may need to restart your kernel after upgrading the package for changes to be applied."
+      ]
+    },
+    {
+      "cell_type": "markdown",
+      "metadata": {},
+      "source": [
+        "<!-- VALIDMIND COPYRIGHT -->\n",
+        "\n",
+        "<small>\n",
+        "\n",
+        "***\n",
+        "\n",
+        "Copyright © 2023-2026 ValidMind Inc. All rights reserved.<br>\n",
+        "Refer to [LICENSE](https://github.com/validmind/validmind-library/blob/main/LICENSE) for details.<br>\n",
+        "SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial</small>"
+      ],
+      "id": "copyright-7c52ad62bcf7411eaaa00aefbac6c756"
+    }
+  ],
+  "metadata": {
+    "kernelspec": {
+      "display_name": "ValidMind Library",
+      "language": "python",
+      "name": "validmind"
+    },
+    "language_info": {
+      "name": "python",
+      "version": "3.10.13"
+    }
+  },
+  "nbformat": 4,
+  "nbformat_minor": 2
+}
diff --git a/site/notebooks/use_cases/model_validation/xgb_model_champion.pkl b/site/notebooks/use_cases/validation/xgb_model_champion.pkl
similarity index 100%
rename from site/notebooks/use_cases/model_validation/xgb_model_champion.pkl
rename to site/notebooks/use_cases/validation/xgb_model_champion.pkl
diff --git a/site/releases/2023/2023-nov-09/highlights.qmd b/site/releases/2023/2023-nov-09/highlights.qmd
index f1c7e0e7be..b86f956921 100644
--- a/site/releases/2023/2023-nov-09/highlights.qmd
+++ b/site/releases/2023/2023-nov-09/highlights.qmd
@@ -151,7 +151,7 @@ You can easily switch between views using the **Display Table** or **Display Car
 
 ::: {.w-30-ns}
 
-[Test descriptions](/developer/test-descriptions.qmd){.button}
+[{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd){.button}
 
 :::
 
diff --git a/site/releases/2023/2023-oct-25/highlights.qmd b/site/releases/2023/2023-oct-25/highlights.qmd
index 029a1c34df..26d86b9730 100644
--- a/site/releases/2023/2023-oct-25/highlights.qmd
+++ b/site/releases/2023/2023-oct-25/highlights.qmd
@@ -133,9 +133,9 @@ From this page you can manage:
 
 ::: {.w-20-ns .tc}
 
-[RougeScore](/tests/model_validation/RougeScore.md){.button}
+[{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd){.button}
 
-[BertScore](/tests/model_validation/BertScore.md){.button}
+Includes `RougeScore` and `BertScore`.
 
 :::
 
@@ -161,9 +161,9 @@ We introduced several new tests to evaluate safety and bias risks in text summar
 
 ::: {.w-30-ns}
 
-[ToxicityScore](/tests/model_validation/ToxicityScore.md){.button}
+[{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd){.button}
 
-[RegardScore](/tests/model_validation/RegardScore.md){.button}
+Includes `ToxicityScore` and `RegardScore`.
 
 :::
 
@@ -215,7 +215,7 @@ We now programmatically embed our Jupyter Notebooks in our documentation site an
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-70-ns}
-We expanded our platform overview to provide more background information about what {{< var vm.product >}} offers and how we enable you to comply with policies and regulations such as SR 11-7 and SS1/23. 
+We expanded our platform overview to provide more background information about what {{< var vm.product >}} offers and how we enable you to comply with policies and regulations such as SR 26-2 and SS1/23. 
 
 :::
 
@@ -235,7 +235,7 @@ We updated the quickstart section of our documentation to reflect recent {{< var
 :::
 
 ::: {.w-20-ns .tc}
-[Quickstart — Model Development](/get-started/developer/quickstart-developer.qmd){.button}
+[Quickstart — Development](/get-started/developer/quickstart-developer.qmd){.button}
 
 :::
 
diff --git a/site/releases/2023/2023-sep-27/highlights.qmd b/site/releases/2023/2023-sep-27/highlights.qmd
index 6e1d0f074c..a970802e1b 100644
--- a/site/releases/2023/2023-sep-27/highlights.qmd
+++ b/site/releases/2023/2023-sep-27/highlights.qmd
@@ -125,7 +125,7 @@ We also updated the quickstart notebook to have a consistent experience.
 :::
 
 ::: {.w-40-ns}
-[Quickstart for model documentation](/notebooks/quickstart/quickstart_model_documentation.ipynb){.button .button-green}
+[Quickstart for documentation](/notebooks/quickstart/quickstart_documentation.ipynb){.button .button-green}
 
 :::
 
@@ -265,9 +265,9 @@ We made a number of changes to tests to improve the developer experience:
 
 [run_documentation_tests()](/validmind/validmind.qmd#run_documentation_tests){.button target="_blank"}
 
-[ClassifierPerformance](/tests/model_validation/sklearn/ClassifierPerformance.md){.button}
+[{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd){.button target="_blank"}
 
-[MinimumF1Score](/tests/model_validation/sklearn/MinimumF1Score.md){.button}
+Includes `ClassifierPerformance` and `MinimumF1Score`.
 
 :::
 
@@ -285,7 +285,7 @@ We made a number of changes to tests to improve the developer experience:
 :::
 
 ::: {.w-20-ns}
-[Test descriptions](/developer/test-descriptions.qmd){.button}
+[{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd){.button}
 
 :::
 
diff --git a/site/releases/2023/release-notes-2023-jul-24.qmd b/site/releases/2023/release-notes-2023-jul-24.qmd
index a47cc470f4..5c9bdc6b02 100644
--- a/site/releases/2023/release-notes-2023-jul-24.qmd
+++ b/site/releases/2023/release-notes-2023-jul-24.qmd
@@ -109,7 +109,7 @@ We've now enhanced the flexibility of documenting models by allowing you to swap
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-50-ns .tc}
-[Install and initialize the {{< var validmind.developer >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd){.button .button-green}
+[Install and initialize the {{< var validmind.developer >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd){.button .button-green}
 
 [Working with model findings](/guide/validation/working-with-artifacts.qmd){.button .button-green}
 
diff --git a/site/releases/2023/release-notes-2023-jun-22.qmd b/site/releases/2023/release-notes-2023-jun-22.qmd
index eeb5fa428a..dd13a76447 100644
--- a/site/releases/2023/release-notes-2023-jun-22.qmd
+++ b/site/releases/2023/release-notes-2023-jun-22.qmd
@@ -106,7 +106,7 @@ We revised our quickstart guide to be more modular and to highlight that our sug
 :::
 
 ::: {.w-20-ns .tc}
-[Quickstart — Model Development](/get-started/developer/quickstart-developer.qmd){.button}
+[Quickstart — Development](/get-started/developer/quickstart-developer.qmd){.button}
 
 :::
 
diff --git a/site/releases/2023/release-notes-2023-may-30.qmd b/site/releases/2023/release-notes-2023-may-30.qmd
index 31eecb08ec..775616f5da 100644
--- a/site/releases/2023/release-notes-2023-may-30.qmd
+++ b/site/releases/2023/release-notes-2023-may-30.qmd
@@ -34,7 +34,7 @@ Plots and visual outputs have been enhanced with the Plotly package. Users can n
 :::
 
 ::: {.w-30-ns .tc}
-[Test descriptions](/developer/test-descriptions.qmd){.button .button-green}
+[{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd){.button .button-green}
 
 :::
 
diff --git a/site/releases/2024/2024-aug-13/release-notes.qmd b/site/releases/2024/2024-aug-13/release-notes.qmd
index 0110c52e8e..3302c709e4 100644
--- a/site/releases/2024/2024-aug-13/release-notes.qmd
+++ b/site/releases/2024/2024-aug-13/release-notes.qmd
@@ -32,7 +32,7 @@ To make comparison tests easier to analyze, we've added support to specify an in
 ::: {.w-30-ns}
 
 ::: {.tc}
-[Run comparison tests](/notebooks/how_to/tests/run_tests/2_run_comparison_tests.ipynb){.button .button-green}
+[Run comparison tests](/notebooks/how_to/tests/run_tests/2-run_comparison_tests.ipynb){.button .button-green}
 :::
 
 :::
@@ -192,7 +192,7 @@ Manage both upstream and downstream model interdependencies:
 
 ::: {.w-50-ns}
 
-![Model dependency management](manage-model-interdependencies.png){fig-alt="An screenshot showcasing the Manage Model Interdependences screen" .screenshot group="interdependencies"}
+![Model dependency management](manage-model-interdependencies.png){fig-alt="A screenshot showcasing the Manage Model Interdependencies screen" .screenshot group="interdependencies"}
 
 :::
 
@@ -208,7 +208,7 @@ URL: https://github.com/validmind/validmind-library/pull/140
 Labels: bug
 --->
 
-- We've excluded categorical and binary features from the outlier tests [`IQROutliersTable`](/tests/data_validation/IQROutliersTable.md) and [`IQROutliersBarPlot`](/tests/data_validation/IQROutliersBarPlot.md).
+- We've excluded categorical and binary features from the outlier tests `IQROutliersTable` and `IQROutliersBarPlot` (see the [{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd) for descriptions).
 - This fix ensures that outlier detection is applied correctly and appropriately, improving computational efficiency and leading to more relevant, accurate, and meaningful insights from the data.
 
 <!---
diff --git a/site/releases/2024/2024-dec-06/release-notes.qmd b/site/releases/2024/2024-dec-06/release-notes.qmd
index 5ec54b7efd..653ce046b3 100644
--- a/site/releases/2024/2024-dec-06/release-notes.qmd
+++ b/site/releases/2024/2024-dec-06/release-notes.qmd
@@ -13,7 +13,7 @@ listing:
     max-description-length: 250
     # image-height: 100%
     contents:
-      - path: ../../../about/overview-model-documentation.qmd
+      - path: ../../../about/overview-documentation.qmd
         title: "Learn more — {{< var validmind.developer >}}"
         description: "The {{< var validmind.developer >}} is a Python library and documentation engine designed to streamline the process of documenting various types of models."
     fields: [title, description]
@@ -23,9 +23,9 @@ listing:
     max-description-length: 250
     # image-height: 100%
     contents:
-      - path: ../../../about/overview-model-risk-management.qmd
+      - path: ../../../about/library-and-platform.qmd
         title: "Learn more — <br>{{< var validmind.platform >}}"
-        description: "The {{< var validmind.platform >}} offers an integrated solution to manage validation reports, track findings, and report on model risk compliance across your model portfolio."
+        description: "The {{< var validmind.platform >}} is an easy-to-use web-based interface that enables you to track the model lifecycle, customize workflows, and collaborate on documentation and validation."
     fields: [title, description]
   - id: academy
     type: grid
@@ -216,7 +216,7 @@ You can now add, edit, or remove custom data to your analytics within the {{< va
 :::
 
 ::: {.w-50-ns .tc}
-![Example setup for a custom stacked bar chart](/guide/reporting/custom-visualization-setup.png){width=85% fig-alt="An screenshot of an example setup for a custom stacked bar chart" .screenshot}
+![Example setup for a custom stacked bar chart](/guide/reporting/custom-visualization-setup.png){width=85% fig-alt="A screenshot of an example setup for a custom stacked bar chart" .screenshot}
 
 :::
 
@@ -713,7 +713,7 @@ If more than one set of test results has been logged with the {{< var validmind.
 
 ::::
 
-![Historical test result filters](test-result-filters.png){ fig-alt="An screenshot of the historical test result filters" .screenshot width=90%}
+![Historical test result filters](test-result-filters.png){ fig-alt="A screenshot of the historical test result filters" .screenshot width=90%}
 
 
 <!---
@@ -1031,7 +1031,7 @@ We've refined our developer guide on how to use the {{< var validmind.developer
 :::
 
 ::: {.w-30-ns .tc}
-[Documenting models](/developer/model-documentation/documenting-models.qmd){.button}
+[Documenting models](/developer/quickstart/documenting-models.qmd){.button}
 
 :::
 
@@ -1050,7 +1050,7 @@ In our Jupyter Notebook samples, we've now included information within the noteb
 :::
 
 ::: {.w-30-ns .tc}
-[Upgrade {{< var vm.product >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd#upgrade){.button}
+[Upgrade {{< var vm.product >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd#upgrade){.button}
 
 :::
 
diff --git a/site/releases/2024/2024-dec-24/release-notes.qmd b/site/releases/2024/2024-dec-24/release-notes.qmd
index a9bd930fd3..ffc2466be9 100644
--- a/site/releases/2024/2024-dec-24/release-notes.qmd
+++ b/site/releases/2024/2024-dec-24/release-notes.qmd
@@ -319,7 +319,7 @@ Our documentation guides have also been updated to match this new experience:
 :::
 
 ::: {.w-40-ns .tc}
-[Store model credentials in `.env` files](/developer/model-documentation/store-credentials-in-env-file.qmd){.button}
+[Store model credentials in `.env` files](/developer/quickstart/store-credentials-in-env-file.qmd){.button}
 
 :::
 
diff --git a/site/releases/2024/2024-feb-14/highlights.qmd b/site/releases/2024/2024-feb-14/highlights.qmd
index 251aa2817f..ca223cc2e9 100644
--- a/site/releases/2024/2024-feb-14/highlights.qmd
+++ b/site/releases/2024/2024-feb-14/highlights.qmd
@@ -173,7 +173,7 @@ To enable model developers to know what task types and tags are available to fil
 
 [init_dataset()](/validmind/validmind.qmd#init_dataset){.button target="_blank" .button-green}
 
-[init_model()](/validmind/validmind.qmd#init_model){.button target="_blank".button-green} 
+[init_model()](/validmind/validmind.qmd#init_model){.button target="_blank" .button-green}
 
 :::
 
@@ -203,7 +203,7 @@ We simplified the instructions for getting started with the {{< var validmind.de
 :::
 
 ::: {.w-50-ns}
-[Install and initalize the {{< var validmind.developer >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd){.button .button-green}
+[Install and initialize the {{< var validmind.developer >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd){.button .button-green}
 
 :::
 
@@ -252,7 +252,7 @@ You can now narrow down models in your **{{< fa cubes >}} Inventory** with our a
 :::
 
 ::: {.w-30-ns .tc}
-[Search, filter, and sort models](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-models){.button}
+[Search, filter, and sort records](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){.button}
 
 :::
 
diff --git a/site/releases/2024/2024-jul-22/release-notes.qmd b/site/releases/2024/2024-jul-22/release-notes.qmd
index c48cea4673..71b8cdb63f 100644
--- a/site/releases/2024/2024-jul-22/release-notes.qmd
+++ b/site/releases/2024/2024-jul-22/release-notes.qmd
@@ -44,7 +44,7 @@ You can now run comparison tests with the {{< var validmind.developer >}}.
 :::
 
 ::: {.w-30-ns}
-[Run comparison tests](/notebooks/how_to/tests/run_tests/2_run_comparison_tests.ipynb){.button .button-green}
+[Run comparison tests](/notebooks/how_to/tests/run_tests/2-run_comparison_tests.ipynb){.button .button-green}
 
 :::
 
@@ -294,7 +294,7 @@ We fixed a number of missing test descriptions that were caused by a scripting i
 
 ::: {.w-20-ns}
 
-[Test descriptions](/developer/test-descriptions.qmd){.button}
+[{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd){.button}
 
 :::
 
diff --git a/site/releases/2024/2024-mar-27/highlights.qmd b/site/releases/2024/2024-mar-27/highlights.qmd
index c1ab680729..893de5aa54 100644
--- a/site/releases/2024/2024-mar-27/highlights.qmd
+++ b/site/releases/2024/2024-mar-27/highlights.qmd
@@ -442,7 +442,7 @@ The user guide sections for working with model documentation and preparing valid
 
 ::: {.w-40-ns}
 
-[Quickstart — Model Development](/get-started/developer/quickstart-developer.qmd){.button}
+[Quickstart — Development](/get-started/developer/quickstart-developer.qmd){.button}
 
 :::
 
@@ -458,7 +458,7 @@ We improved our supported models documentation with additional information about
 :::
 
 ::: {.w-30-ns .tc}
-[Supported models and frameworks](/developer/supported-models-and-frameworks.qmd){.button}
+[Supported records and frameworks](/developer/supported-records-and-frameworks.qmd){.button}
 
 :::
 
diff --git a/site/releases/2024/2024-may-22/release-notes.qmd b/site/releases/2024/2024-may-22/release-notes.qmd
index aeea16fdec..6a7e6319af 100644
--- a/site/releases/2024/2024-may-22/release-notes.qmd
+++ b/site/releases/2024/2024-may-22/release-notes.qmd
@@ -43,7 +43,7 @@ You can use this notebook to learn how the end-to-end documentation process work
 
 ::: {.w-40-ns}
 
-[Try notebook on JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/101-set_up_validmind.ipynb){.button .button-green}
+[Try notebook on JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/1-set_up_validmind.ipynb){.button .button-green}
 
 :::
 
@@ -547,12 +547,12 @@ Labels: enhancement
 --->
 #### New text data validation tests
 
-The following tests for text data validation have been added:
+The following tests for text data validation have been added (browse descriptions in the [{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd)):
 
-- [`validmind.data_validation.nlp.LanguageDetection`](/tests/data_validation/nlp/LanguageDetection.md)
-- [`validmind.data_validation.nlp.Toxicity`](/tests/data_validation/nlp/Toxicity.md)
-- [`validmind.data_validation.nlp.PolarityAndSubjectivity`](/tests/data_validation/nlp/PolarityAndSubjectivity.md)
-- [`validmind.data_validation.nlp.Sentiment`](/tests/data_validation/nlp/Sentiment.md)
+- `validmind.data_validation.nlp.LanguageDetection`
+- `validmind.data_validation.nlp.Toxicity`
+- `validmind.data_validation.nlp.PolarityAndSubjectivity`
+- `validmind.data_validation.nlp.Sentiment`
 
 <!--- NR TO DO This notebook is not in main
 To test run notebook: `rag_langchain_demo.ipynb` --->
@@ -820,7 +820,7 @@ Also available is an improved look and functionality for filtering the **{{< fa
 
 ::: {.w-40-ns}
 
-[Search, filter, and sort models](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-models){.button}
+[Search, filter, and sort records](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){.button}
 
 
 :::
@@ -1097,5 +1097,5 @@ These features provide a rich context for testing and evaluation. You can use re
 
 <!-- FOOTNOTES -->
 
-[^1]: See the full list of tests at [Test descriptions](/developer/test-descriptions.qmd) or try the [Test sandbox](/developer/how-to/test-sandbox.qmd).
+[^1]: Browse tests and read descriptions in the [{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd).
 
diff --git a/site/releases/2024/2024-oct-22/release-notes.qmd b/site/releases/2024/2024-oct-22/release-notes.qmd
index cbf0130253..4bcff311ff 100644
--- a/site/releases/2024/2024-oct-22/release-notes.qmd
+++ b/site/releases/2024/2024-oct-22/release-notes.qmd
@@ -33,7 +33,7 @@ Labels: documentation
 --->
 ### Support for ongoing monitoring
 
-Monitoring is a critical component of model risk management, as emphasized in regulations such as SR 11-7, SS1/23, and E-24. With this release of {{< var vm.product >}}, we officially support ongoing monitoring. You can enable this feature for both existing and new models.
+Monitoring is a critical component of model risk management, as emphasized in regulations such as SR 26-2, SS1/23, and E-24. With this release of {{< var vm.product >}}, we officially support ongoing monitoring. You can enable this feature for both existing and new models.
 
 ![Ongoing monitoring of a model](/releases/2024/2024-oct-22/358433496-02a6d5b9-0521-4110-b45c-b91e06798a97.png){fig-alt="An image showing some ongoing monitoring data on the ValidMind Platform" .screenshot}
 
@@ -174,7 +174,7 @@ When you need to decommission models that you no longer need, you can now archiv
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-70-ns}
-You now have new stages for inventory models, including `ACTIVE`, `ARCHIVED`, and `DELETED`, which are shown as a new column in the model inventory and as field in the model overview. 
+You now have new stages for inventory models, including `ACTIVE`, `ARCHIVED`, and `DELETED`, which are shown as a new column in the model inventory and as a field in the model overview. 
 
 :::
 
diff --git a/site/releases/2025/2025-apr-24/release-notes.qmd b/site/releases/2025/2025-apr-24/release-notes.qmd
index 041f8062b5..7c105dfde2 100644
--- a/site/releases/2025/2025-apr-24/release-notes.qmd
+++ b/site/releases/2025/2025-apr-24/release-notes.qmd
@@ -8,8 +8,8 @@ listing:
     grid-columns: 1
     max-description-length: 250
     contents:
-    - path: ../../../developer/validmind-library.qmd#for-model-development
-      title: "{{< var vm.product >}} for model development {{< fa chevron-right >}}"
+    - path: ../../../developer/validmind-library.qmd#development
+      title: "{{< var vm.product >}} for development {{< fa chevron-right >}}"
       description: "Learn how to use {{< var vm.product >}} for your end-to-end model documentation process based on common model development scenarios with our series of four introductory notebooks."
 ---
 
@@ -45,7 +45,7 @@ We've revamped our old *Introduction for model developers* notebook into a serie
 :::
 
 ::: {.w-40-ns .tc}
-[{{< fa brands github >}} Access Notebooks on GitHub](https://github.com/validmind/validmind-library/tree/main/notebooks/tutorials/model_development){.button .button-green target="_blank"}
+[{{< fa brands github >}} Access Notebooks on GitHub](https://github.com/validmind/validmind-library/tree/main/notebooks/tutorials/development){.button .button-green target="_blank"}
 
 :::
 
diff --git a/site/releases/2025/2025-jan-31/release-notes.qmd b/site/releases/2025/2025-jan-31/release-notes.qmd
index 543ba4acf5..eecdd7e308 100644
--- a/site/releases/2025/2025-jan-31/release-notes.qmd
+++ b/site/releases/2025/2025-jan-31/release-notes.qmd
@@ -18,15 +18,15 @@ listing:
     max-description-length: 250
     # image-height: 100%
     contents:
-      - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/code_samples/credit_risk/application_scorecard_with_ml.ipynb
+      - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/use_cases/credit_risk/application_scorecard_with_ml.ipynb
         title: "Document an application scorecard model"
         categories: ["Individual Tests"]
         description: "Open notebook in JupyterHub {{< fa chevron-right >}}"
-      - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/code_samples/credit_risk/application_scorecard_full_suite.ipynb
+      - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/use_cases/credit_risk/application_scorecard_full_suite.ipynb
         title: "Document an application scorecard model"
         categories: ["Full Test Suite"]
         description: "Open notebook in JupyterHub {{< fa chevron-right >}}"
-      - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/code_samples/credit_risk/application_scorecard_executive.ipynb
+      - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/use_cases/credit_risk/application_scorecard_executive.ipynb
         title: "Document an application scorecard model"
         categories: ["Single Function"]
         description: "Open notebook in JupyterHub {{< fa chevron-right >}}"
@@ -36,7 +36,7 @@ listing:
     max-description-length: 250
     # image-height: 100%
     contents:
-      - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/code_samples/ongoing_monitoring/application_scorecard_ongoing_monitoring.ipynb
+      - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/use_cases/ongoing_monitoring/application_scorecard_ongoing_monitoring.ipynb
         title: "Ongoing monitoring for application scorecard"
         description: "Open notebook in JupyterHub {{< fa chevron-right >}}"
   - id: e2e-template
@@ -178,16 +178,16 @@ We've introduced enhancements to the {{< var validmind.developer >}} that focus
 
 :::
 
-- **New tests**:
+- **New tests** (browse descriptions in the [{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd)):
 
-  - [`MutualInformation`](/tests/data_validation/MutualInformation.md): Evaluates feature relevance by calculating mutual information scores between features and the target variable.  
-  - [`ScoreBandDefaultRates`](/tests/data_validation/ScoreBandDefaultRates.md): Analyzes default rates and population distribution across credit score bands.  
-  - [`CalibrationCurve`](/tests/model_validation/sklearn/CalibrationCurve.md): Assesses calibration by comparing predicted probabilities against observed frequencies.  
-  - [`ClassifierThresholdOptimization`](/tests/model_validation/sklearn/ClassifierThresholdOptimization.md): Visualizes threshold optimization methods for binary classification models.  
-  - [`ModelParameters`](/tests/model_validation/sklearn/ModelParameters.md): Extracts and displays model parameters for transparency and reproducibility.  
-  - [`ScoreProbabilityAlignment`](/tests/model_validation/sklearn/ScoreProbabilityAlignment.md): Evaluates alignment between credit scores and predicted probabilities.
+  - `MutualInformation`: Evaluates feature relevance by calculating mutual information scores between features and the target variable.  
+  - `ScoreBandDefaultRates`: Analyzes default rates and population distribution across credit score bands.  
+  - `CalibrationCurve`: Assesses calibration by comparing predicted probabilities against observed frequencies.  
+  - `ClassifierThresholdOptimization`: Visualizes threshold optimization methods for binary classification models.  
+  - `ModelParameters`: Extracts and displays model parameters for transparency and reproducibility.  
+  - `ScoreProbabilityAlignment`: Evaluates alignment between credit scores and predicted probabilities.
 
-Modifications have also been made to existing tests to improve functionality and accuracy. The [`TooManyZeroValues`](/tests/data_validation/TooManyZeroValues.md) test now includes a row count and applies a percentage threshold for zero values.
+Modifications have also been made to existing tests to improve functionality and accuracy. The `TooManyZeroValues` test now includes a row count and applies a percentage threshold for zero values.
 
 The [`split`](/validmind/validmind/datasets/regression/lending_club.qmd#preprocess){target="_blank"} function in `lending_club.py` has been enhanced to support an optional validation set, allowing for more flexible dataset splitting.
 
@@ -214,25 +214,25 @@ Several enhancements to the {{< var validmind.developer >}} focus on ongoing mon
 
 - **Custom tests**: Define and run your own tests using the {{< var vm.developer >}}:
 
-   - [`ScoreBandDiscriminationMetrics.py`](https://github.com/validmind/validmind-library/blob/main/notebooks/code_samples/credit_risk/custom_tests/ScoreBandDiscriminationMetrics.py): Evaluates discrimination metrics across different score bands.  
+   - [`ScoreBandDiscriminationMetrics.py`](https://github.com/validmind/validmind-library/blob/main/notebooks/use_cases/credit_risk/custom_tests/ScoreBandDiscriminationMetrics.py): Evaluates discrimination metrics across different score bands.  
 
-- **New tests**:
+- **New tests** (browse descriptions in the [{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd)):
    
-   - [`CalibrationCurveDrift`](/tests/ongoing_monitoring/CalibrationCurveDrift.md): Evaluates changes in probability calibration.  
-   - [`ClassDiscriminationDrift`](/tests/ongoing_monitoring/ClassDiscriminationDrift.md): Compares classification discrimination metrics.  
-   - [`ClassImbalanceDrift`](/tests/ongoing_monitoring/ClassImbalanceDrift.md): Evaluates drift in class distribution.  
-   - [`ClassificationAccuracyDrift`](/tests/ongoing_monitoring/ClassificationAccuracyDrift.md): Compares classification accuracy metrics.  
-   - [`ConfusionMatrixDrift`](/tests/ongoing_monitoring/ConfusionMatrixDrift.md): Compares confusion matrix metrics.  
-   - [`CumulativePredictionProbabilitiesDrift`](/tests/ongoing_monitoring/CumulativePredictionProbabilitiesDrift.md): Compares cumulative prediction probability distributions.  
-   - [`FeatureDrift`](/tests/ongoing_monitoring/FeatureDrift.md): Evaluates changes in feature distribution.  
-   - [`PredictionAcrossEachFeature`](/tests/ongoing_monitoring/PredictionAcrossEachFeature.md): Assesses prediction distributions across features.  
-   - [`PredictionCorrelation`](/tests/ongoing_monitoring/PredictionCorrelation.md): Assesses correlation changes between predictions and features.  
-   - [`PredictionProbabilitiesHistogramDrift`](/tests/ongoing_monitoring/PredictionProbabilitiesHistogramDrift.md): Compares prediction probability distributions.  
-   - [`PredictionQuantilesAcrossFeatures`](/tests/ongoing_monitoring/PredictionQuantilesAcrossFeatures.md): Assesses prediction distributions across features using quantiles.  
-   - [`ROCCurveDrift`](/tests/ongoing_monitoring/ROCCurveDrift.md): Compares ROC curves.  
-   - [`ScoreBandsDrift`](/tests/ongoing_monitoring/ScoreBandsDrift.md): Analyzes drift in score bands.  
-   - [`ScorecardHistogramDrift`](/tests/ongoing_monitoring/ScorecardHistogramDrift.md): Compares score distributions.  
-   - [`TargetPredictionDistributionPlot`](/tests/ongoing_monitoring/TargetPredictionDistributionPlot.md): Assesses differences in prediction distributions.  
+   - `CalibrationCurveDrift`: Evaluates changes in probability calibration.  
+   - `ClassDiscriminationDrift`: Compares classification discrimination metrics.  
+   - `ClassImbalanceDrift`: Evaluates drift in class distribution.  
+   - `ClassificationAccuracyDrift`: Compares classification accuracy metrics.  
+   - `ConfusionMatrixDrift`: Compares confusion matrix metrics.  
+   - `CumulativePredictionProbabilitiesDrift`: Compares cumulative prediction probability distributions.  
+   - `FeatureDrift`: Evaluates changes in feature distribution.  
+   - `PredictionAcrossEachFeature`: Assesses prediction distributions across features.  
+   - `PredictionCorrelation`: Assesses correlation changes between predictions and features.  
+   - `PredictionProbabilitiesHistogramDrift`: Compares prediction probability distributions.  
+   - `PredictionQuantilesAcrossFeatures`: Assesses prediction distributions across features using quantiles.  
+   - `ROCCurveDrift`: Compares ROC curves.  
+   - `ScoreBandsDrift`: Analyzes drift in score bands.  
+   - `ScorecardHistogramDrift`: Compares score distributions.  
+   - `TargetPredictionDistributionPlot`: Assesses differences in prediction distributions.  
    
 We also improved dataset loading, preprocessing, and feature engineering functions with verbosity control for cleaner output.  
 
@@ -357,7 +357,7 @@ This enhancement makes it easier to distinguish between ValidMind's standard tes
 :::
 
 ::: {.w-30-ns .tr} 
-[Test descriptions](/developer/test-descriptions.qmd){.button target="_blank"}
+[{{< var vm.product >}} test sandbox](/developer/how-to/test-sandbox.qmd){.button target="_blank"}
 :::
 
 ::::
@@ -540,7 +540,7 @@ We replaced the plugin for the editor of mathematical equations and formulas. Th
 The new editor also includes a real-time preview and common mathematical symbols for easier equation creation.
 
 ::: {.tc}
-[Add mathematical formulas](/guide/documentation/work-with-content-blocks.html#add-mathematical-formulas.qmd){.button}
+[Add mathematical formulas](/guide/documentation/work-with-content-blocks.qmd#insert-mathematical-formulas){.button}
 :::
 
 :::
diff --git a/site/releases/_metadata.yml b/site/releases/_metadata.yml
index 623ad3459e..e521a2dd9a 100644
--- a/site/releases/_metadata.yml
+++ b/site/releases/_metadata.yml
@@ -2,8 +2,6 @@
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
 
-search: false
-
 filters:
   - category-filter
 
diff --git a/site/scripts/__pycache__/generate_chatbot_product_map.cpython-314.pyc b/site/scripts/__pycache__/generate_chatbot_product_map.cpython-314.pyc
new file mode 100644
index 0000000000..b898ef5f9d
Binary files /dev/null and b/site/scripts/__pycache__/generate_chatbot_product_map.cpython-314.pyc differ
diff --git a/site/scripts/__pycache__/test_generate_chatbot_product_map.cpython-314.pyc b/site/scripts/__pycache__/test_generate_chatbot_product_map.cpython-314.pyc
new file mode 100644
index 0000000000..80669ed834
Binary files /dev/null and b/site/scripts/__pycache__/test_generate_chatbot_product_map.cpython-314.pyc differ
diff --git a/site/scripts/generate_chatbot_product_map.py b/site/scripts/generate_chatbot_product_map.py
new file mode 100644
index 0000000000..e1d6f51dd5
--- /dev/null
+++ b/site/scripts/generate_chatbot_product_map.py
@@ -0,0 +1,679 @@
+#!/usr/bin/env python3
+# Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+# Refer to the LICENSE file in the root of this repository for details.
+# SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
+"""
+Generate a product-to-documentation map for the in-app chatbot (LanceDB / RAG).
+
+Correlates frontend routes and help links with documentation pages and headings.
+
+Usage (from documentation repo root):
+    # CI / default: build map from committed frontend snapshot (no frontend checkout)
+    python site/scripts/generate_chatbot_product_map.py
+
+    # Refresh snapshot + map when frontend sources change (local frontend checkout)
+    python site/scripts/generate_chatbot_product_map.py --from-frontend
+    python site/scripts/generate_chatbot_product_map.py --from-frontend --frontend-root ../frontend
+"""
+
+from __future__ import annotations
+
+import argparse
+import json
+import re
+from dataclasses import dataclass, field
+from datetime import datetime, timezone
+from pathlib import Path
+
+try:
+    import yaml
+except ImportError:  # pragma: no cover
+    yaml = None  # type: ignore
+
+
+DOCS_URL_PATTERN = re.compile(  # group 1: doc path, group 2: anchor (optional)
+    r"(?:VALIDMIND_DOCS_URL|docs\.validmind\.ai)"
+    r'[^`"\']*?'
+    r'(/(?:guide|get-started|developer|faq|support|training|about|reference)[^`"\')\s#]+)'
+    r"(?:#([a-zA-Z0-9_-]+))?"
+)
+
+HELP_LINK_PATTERN = re.compile(  # group 1: doc path, group 2: anchor (optional)
+    r"helpLink=\{?`(?:\$\{CONFIG\.VALIDMIND_DOCS_URL\}|https://docs\.validmind\.ai)"
+    r'(/[^`"\')\s#]+)(?:#([a-zA-Z0-9_-]+))?`?\}?'
+)
+
+DOCUMENTATION_LINK_PATTERN = re.compile(  # group 1: doc path, group 2: anchor (optional)
+    r'documentationLink=\{?`(?:\$\{CONFIG\.VALIDMIND_DOCS_URL\}|https://docs\.validmind\.ai)'
+    r'(/[^`"\')\s#]+)(?:#([a-zA-Z0-9_-]+))?`?\}?'
+)
+
+LINK_PROP_PATTERN = re.compile(  # group 1: doc path, group 2: anchor (optional)
+    r'link=\{?`(?:\$\{CONFIG\.VALIDMIND_DOCS_URL\}|https://docs\.validmind\.ai)'
+    r'(/[^`"\')\s#]+)(?:#([a-zA-Z0-9_-]+))?`?\}?'
+)
+
+SETTING_GROUP_TITLE_PATTERN = re.compile(  # group 1: title attribute value
+    r'<SettingGroup\b[^>]*\btitle="([^"]+)"',
+)
+
+SETTING_LINK_PATTERN = re.compile(  # group 1: title, group 2: path (title must precede path)
+    r'<SettingLink\b[^>]*\btitle="([^"]+)"[^>]*\bpath="([^"]+)"',
+)
+
+ATTR_PATTERN = re.compile(r'(\w+)=["{`]([^"`}]+)["`}]')  # group 1: name, group 2: value
+
+HEADING_PATTERN = re.compile(r"^(#{2,3})\s+(.+)$", re.MULTILINE)  # group 1: "##"/"###", group 2: title
+
+SIDEBAR_PATH_PATTERN = re.compile(  # group 1: quoted path starting with "/"
+    r"(?:path|documentationLink):\s*['\"](/[^'\"]+)['\"]"
+)
+SIDEBAR_LABEL_PATTERN = re.compile(  # group 1: quoted label; None when the copy(...) form matched
+    r"label:\s*(?:copy\([^)]+\)|['\"]([^'\"]+)['\"])"
+)
+
+# Frontend help URLs that do not match published doc paths, keyed to the path used instead.
+DOC_PATH_ALIASES: dict[str, str] = {
+    "/guide/model-workflows/setting-up-model-workflows.html": (
+        "/guide/workflows/setting-up-workflows.html"
+    ),
+}
+
+RELATED_DOC_PREFIXES = (
+    "/guide/",
+    "/get-started/",
+    "/support/",
+    "/faq/faq-",
+    "/about/contributing/",
+)
+
+# Map settings link titles (lowercase) to likely guide doc path segments for related docs.
+RELATED_DOC_KEYWORDS: dict[str, list[str]] = {
+    "workflows": ["workflows", "model-workflows"],
+    "workflow": ["workflows", "model-workflows"],
+    "roles": ["configuration/manage-roles", "configuration/managing-users"],
+    "permissions": ["configuration/manage-permissions", "configuration/managing-users"],
+    "groups": ["configuration/manage-groups", "configuration/managing-users"],
+    "users": ["configuration/managing-users", "configuration/manage-users"],
+    "invitation": ["configuration/managing-users", "configuration/manage-users"],
+    "integrations": ["integrations", "configuration"],
+    "templates": ["templates", "model-documentation"],
+    "document": ["templates", "model-documentation"],
+    "inventory": ["inventory", "model-inventory"],
+    "finding": ["model-validation", "findings"],
+    "artifact": ["model-validation", "templates"],
+    "attestation": ["attestation"],
+    "regulation": ["templates/customize-virtual-document-validator", "model-validation"],
+    "risk": ["model-validation/manage-validation-guidelines"],
+    "authentication": ["configuration/managing-your-organization"],
+    "organization": ["configuration/managing-your-organization"],
+    "profile": ["configuration/manage-your-profile", "configuration/personalizing-validmind"],
+    "analytics": ["reporting", "monitoring"],
+    "dashboard": ["configuration/customize-your-dashboard"],
+}
+
+
+@dataclass
+class DocRef:
+    path: str  # URL path like /guide/foo/bar.html
+    anchor: str | None = None  # fragment id without the leading "#"; None for a whole page
+
+    @property
+    def key(self) -> str:  # "path#anchor", or just the path when anchor is empty/None
+        return f"{self.path}#{self.anchor}" if self.anchor else self.path
+
+
+@dataclass
+class ProductRoute:
+    path: str  # product route, e.g. /settings/workflows
+    label: str  # display title (the SettingLink title for settings routes)
+    group: str | None = None  # enclosing SettingGroup title, when one was found
+    primary_docs: list[DocRef] = field(default_factory=list)  # refs parsed from frontend source near the link
+    related_docs: list[DocRef] = field(default_factory=list)
+    notes: list[str] = field(default_factory=list)
+
+
+def find_repo_root() -> Path:
+    """Return the nearest ancestor of this file that holds a ``.git`` directory."""
+    script = Path(__file__).resolve()
+    # Fallback when no ancestor has a .git directory: two levels above this file's folder.
+    fallback = script.parent.parent.parent
+    return next((d for d in script.parents if (d / ".git").is_dir()), fallback)
+
+
+def html_path_to_qmd(site_dir: Path, doc_path: str) -> Path | None:
+    """Resolve a docs URL path to its ``.qmd`` source file under ``site_dir``.
+
+    ``/guide/foo/bar.html`` -> ``site_dir/guide/foo/bar.qmd``; ``None`` if no such file.
+    """
+    stem = doc_path.strip().lstrip("/")
+    if stem.endswith(".html"):
+        stem = stem[: -len(".html")]
+    source = site_dir / f"{stem}.qmd"
+    return source if source.is_file() else None
+
+
+def extract_headings(qmd_path: Path, max_level: int = 3) -> list[str]:
+    """Return up to 12 cleaned heading titles no deeper than ``max_level`` from a file."""
+    headings: list[str] = []
+    for match in HEADING_PATTERN.finditer(qmd_path.read_text(encoding="utf-8")):
+        if len(match.group(1)) > max_level:
+            continue
+        # Drop whole {{< ... >}} shortcodes first, or the next rule leaves a stray "}".
+        title = re.sub(r"\{\{<.*?>\}\}", "", match.group(2).strip())
+        title = re.sub(r"\{[^}]*\}", "", title)  # {#id .class} attribute blocks
+        title = re.sub(r"\[([^\]]+)\]\([^)]+\)", r"\1", title)  # [text](url) -> text
+        title = re.sub(r"\s+", " ", title).strip()
+        if title:
+            headings.append(title)
+    return headings[:12]
+
+
+def parse_doc_refs_from_text(text: str) -> list[DocRef]:
+    """Collect the unique doc references found in ``text``, in first-seen order.
+
+    The helpLink, documentationLink and link props are scanned before the generic
+    docs-URL pattern; paths gain ``.html`` when missing and are alias-resolved.
+    """
+    found: dict[str, DocRef] = {}
+    patterns = (
+        HELP_LINK_PATTERN,
+        DOCUMENTATION_LINK_PATTERN,
+        LINK_PROP_PATTERN,
+        DOCS_URL_PATTERN,
+    )
+    for pattern in patterns:
+        for hit in pattern.finditer(text):
+            raw_path, anchor = hit.group(1), hit.group(2)
+            if not raw_path.endswith(".html"):
+                raw_path = raw_path.rstrip("/") + ".html"
+            ref = DocRef(path=resolve_doc_path(raw_path), anchor=anchor)
+            found.setdefault(ref.key, ref)  # keep the first occurrence of each key
+    return list(found.values())
+
+
+def resolve_doc_path(path: str) -> str:
+    return DOC_PATH_ALIASES.get(path, path)  # paths without an alias are returned unchanged
+
+
+def parse_settings_index(frontend_root: Path) -> list[ProductRoute]:
+    """Build one ProductRoute per unique ``/settings...`` SettingLink path.
+
+    Reads ``src/pages/Settings/index.tsx`` under ``frontend_root``; returns ``[]`` if absent.
+    """
+    index_tsx = frontend_root / "src/pages/Settings/index.tsx"
+    if not index_tsx.is_file():
+        return []
+    source = index_tsx.read_text(encoding="utf-8")
+
+    # (offset, title) for every SettingGroup match, in document order.
+    groups = [
+        (found.start(), found.group(1))
+        for found in SETTING_GROUP_TITLE_PATTERN.finditer(source)
+    ]
+
+    def group_for_position(pos: int) -> str | None:
+        """Title of the last group starting at or before ``pos`` (None if none)."""
+        current = None
+        for start, name in groups:
+            if start > pos:
+                break
+            current = name
+        return current
+
+    routes: list[ProductRoute] = []
+    visited: set[str] = set()
+    for link in SETTING_LINK_PATTERN.finditer(source):
+        label, path = link.group(1).strip(), link.group(2).strip()
+        if path in visited or not path.startswith("/settings"):
+            continue
+        visited.add(path)
+        offset = link.start()
+        # A group-level helpLink precedes the group's SettingLinks, so look for
+        # doc references in the (up to) 1200 characters just before this link.
+        nearby_docs = parse_doc_refs_from_text(source[max(0, offset - 1200) : offset])
+        route = ProductRoute(
+            path=path,
+            label=label,
+            group=group_for_position(offset),
+        )
+        route.primary_docs.extend(nearby_docs)
+        routes.append(route)
+    return routes
+
+
+def file_to_route_hint(file_path: Path) -> str | None:
+    """Infer the product route served by a frontend page ``index.tsx`` file.
+
+    Only ``index.tsx`` files that live under a ``pages`` directory (and not
+    under any ``components`` directory) are considered:
+
+    * ``pages/Settings/index.tsx`` -> ``/settings``
+    * ``pages/Settings/<Name>/.../index.tsx`` -> ``/settings/<name>``
+    * ``pages/<Name>/index.tsx`` -> ``/<name>``
+
+    Directory names are converted to kebab-case (``ModelInventory`` ->
+    ``model-inventory``, ``custom_fields`` -> ``custom-fields``).
+
+    Args:
+        file_path: Path of a frontend source file.
+
+    Returns:
+        The inferred route, or ``None`` when no route can be inferred (for
+        example nested non-settings pages, or ``pages/index.tsx`` itself).
+    """
+    if file_path.name != "index.tsx":
+        return None
+    parts = file_path.parts
+    if "pages" not in parts or "components" in parts:
+        return None
+
+    def to_kebab(name: str) -> str:
+        # CamelCase -> kebab-case, then treat underscores as word separators
+        # and collapse any doubled hyphens that result from combining both.
+        kebab = re.sub(r"(?<!^)(?=[A-Z])", "-", name).lower().replace("_", "-")
+        return re.sub(r"-{2,}", "-", kebab)
+
+    # Directories between "pages" and the file itself. The trailing
+    # "index.tsx" is sliced off so it is not counted as a path segment.
+    page_dirs = parts[parts.index("pages") + 1 : -1]
+    if not page_dirs:
+        return None
+    if page_dirs[0] == "Settings":
+        if len(page_dirs) == 1:
+            return "/settings"
+        # Settings/Workflows/index.tsx -> /settings/workflows
+        return f"/settings/{to_kebab(page_dirs[1])}"
+    if len(page_dirs) > 1:
+        # Only top-level page directories map to a route.
+        return None
+    return f"/{to_kebab(page_dirs[0])}"
+
+
+def scan_frontend_doc_links(frontend_root: Path) -> dict[str, list[DocRef]]:
+    """Map approximate product route -> doc refs found in frontend source files.
+
+    Walks every ``.tsx``/``.ts`` file under ``<frontend_root>/src`` (skipping
+    ``node_modules`` and ``*.test.*`` files), infers a route for each file
+    with ``file_to_route_hint`` and gathers the doc links of the files that
+    map to a route. Files are visited in sorted path order so the result does
+    not depend on filesystem enumeration order.
+
+    Args:
+        frontend_root: Root of the frontend checkout.
+
+    Returns:
+        Route -> de-duplicated doc refs; empty when ``src`` does not exist.
+    """
+    by_route: dict[str, list[DocRef]] = {}
+    src = frontend_root / "src"
+    if not src.is_dir():
+        return by_route
+
+    # rglob order is filesystem-dependent; sorting keeps the per-route ref
+    # order (which ends up in the committed snapshot) reproducible.
+    candidates = sorted([*src.rglob("*.tsx"), *src.rglob("*.ts")])
+    for path in candidates:
+        if "node_modules" in path.parts or ".test." in path.name:
+            continue
+        if path.name != "index.tsx" and "Settings" not in path.parts:
+            continue
+        # Resolve the route first: a file without one contributes nothing,
+        # so there is no point in reading and scanning it.
+        route_hint = file_to_route_hint(path)
+        if not route_hint:
+            continue
+        text = path.read_text(encoding="utf-8", errors="ignore")
+        refs = parse_doc_refs_from_text(text)
+        if not refs:
+            continue
+        existing = by_route.setdefault(route_hint, [])
+        seen = {r.key for r in existing}
+        for ref in refs:
+            if ref.key not in seen:
+                seen.add(ref.key)
+                existing.append(ref)
+    return by_route
+
+
+def parse_sidebar_nav(frontend_root: Path) -> list[ProductRoute]:
+    """Extract main-navigation routes from the Sidebar component source.
+
+    The sidebar file is split on ``{ key: '...`` object openers; every chunk
+    that contains a ``path: '...'`` entry becomes a ``ProductRoute`` in the
+    "Main navigation" group. The label comes from ``label: copy('...')`` or
+    ``label: '...'`` and falls back to the path. If the chunk carries a
+    documentation link, it is attached as the route's primary doc after the
+    same normalization ``parse_doc_refs_from_text`` applies (``.html`` suffix
+    plus ``resolve_doc_path`` aliases), so sidebar links and links scanned
+    from other files share one canonical path.
+
+    Args:
+        frontend_root: Root of the frontend checkout.
+
+    Returns:
+        Routes in source order, or an empty list when the file is missing.
+    """
+    sidebar_file = frontend_root / "src/components/Sidebar/index.tsx"
+    if not sidebar_file.is_file():
+        return []
+    content = sidebar_file.read_text(encoding="utf-8")
+    routes: list[ProductRoute] = []
+    # Match menu item objects with path and label. The text before the first
+    # "{ key:" opener is not a menu item, hence blocks[1:].
+    blocks = re.split(r"\{\s*key:\s*['\"]", content)
+    for block in blocks[1:]:
+        path_m = re.search(r"path:\s*['\"]([^'\"]+)['\"]", block)
+        if not path_m:
+            continue
+        path = path_m.group(1)  # never empty: the pattern requires 1+ characters
+        label_m = re.search(r"label:\s*(?:copy\(['\"]([^'\"]+)['\"]\)|['\"]([^'\"]+)['\"])", block)
+        label = (label_m.group(1) or label_m.group(2) or path) if label_m else path
+        route = ProductRoute(path=path, label=label, group="Main navigation")
+        doc_m = DOCUMENTATION_LINK_PATTERN.search(block)
+        if doc_m:
+            doc_path = doc_m.group(1)
+            if not doc_path.endswith(".html"):
+                doc_path = doc_path.rstrip("/") + ".html"
+            route.primary_docs.append(
+                DocRef(path=resolve_doc_path(doc_path), anchor=doc_m.group(2))
+            )
+        routes.append(route)
+    return routes
+
+
+def collect_all_doc_qmd_paths(site_dir: Path) -> list[str]:
+    """List every ``.qmd`` page under ``site_dir`` as a site-relative HTML URL.
+
+    Files under ``internal/``, ``tests/``, ``notebooks/`` and ``llm/`` are
+    left out. ``guide/foo.qmd`` is reported as ``/guide/foo.html``.
+
+    Returns:
+        The URL paths, sorted.
+    """
+    excluded_roots = ("internal/", "tests/", "notebooks/", "llm/")
+    relative_sources = (
+        source.relative_to(site_dir).as_posix() for source in site_dir.rglob("*.qmd")
+    )
+    return sorted(
+        "/" + rel_source[:-4] + ".html"  # swap the 4-character ".qmd" suffix
+        for rel_source in relative_sources
+        if not rel_source.startswith(excluded_roots)
+    )
+
+
+def is_user_facing_doc(path: str) -> bool:
+    """Tell whether a doc URL path may be offered as related documentation.
+
+    A path qualifies when it is not under ``/_source/``, none of its segments
+    starts with an underscore, and it starts with one of
+    ``RELATED_DOC_PREFIXES``.
+    """
+    if "/_source/" in path:
+        return False
+    segments = [segment for segment in path.split("/") if segment]
+    has_private_segment = any(segment[0] == "_" for segment in segments)
+    return (not has_private_segment) and path.startswith(RELATED_DOC_PREFIXES)
+
+
+def suggest_related_docs(route: ProductRoute, all_doc_paths: list[str]) -> list[DocRef]:
+    """Propose up to six related docs for ``route`` by keyword matching.
+
+    Each ``RELATED_DOC_KEYWORDS`` keyword that occurs in the lower-cased
+    route path, label or group contributes its doc segments. A doc path is
+    suggested when it is user-facing, is not already one of the route's
+    primary docs, and its lower-cased form contains one of those segments.
+
+    Returns:
+        At most six ``DocRef`` objects (no anchors), sorted by path.
+    """
+    searchable = f"{route.path} {route.label} {route.group or ''}".lower()
+    wanted_segments: set[str] = set()
+    for keyword, doc_segments in RELATED_DOC_KEYWORDS.items():
+        if keyword in searchable:
+            wanted_segments.update(doc_segments)
+
+    already_primary = {doc.path for doc in route.primary_docs}
+    matches = [
+        DocRef(path=candidate)
+        for candidate in all_doc_paths
+        if candidate not in already_primary
+        and is_user_facing_doc(candidate)
+        and any(segment in candidate.lower() for segment in wanted_segments)
+    ]
+    return sorted(matches, key=lambda ref: ref.path)[:6]
+
+
+# File name of the frontend snapshot JSON; main() looks for it under site/llm/ by default.
+DEFAULT_SNAPSHOT_NAME = "chatbot-product-map-frontend-snapshot.json"
+
+
+def doc_ref_to_dict(ref: DocRef) -> dict[str, str | None]:
+    """Serialize a ``DocRef`` to a JSON-friendly dict with ``path`` and ``anchor``."""
+    return dict(path=ref.path, anchor=ref.anchor)
+
+
+def doc_ref_from_dict(data: dict[str, str | None]) -> DocRef:
+    """Rebuild a ``DocRef`` from its dict form; ``path`` is required, ``anchor`` optional."""
+    doc_path = data["path"]
+    anchor = data.get("anchor")
+    return DocRef(path=doc_path, anchor=anchor)
+
+
+def route_to_dict(route: ProductRoute) -> dict:
+    """Serialize a route's path, label, group and primary docs for the snapshot."""
+    serialized_docs = list(map(doc_ref_to_dict, route.primary_docs))
+    return dict(
+        path=route.path,
+        label=route.label,
+        group=route.group,
+        primary_docs=serialized_docs,
+    )
+
+
+def route_from_dict(data: dict) -> ProductRoute:
+    """Rebuild a ``ProductRoute`` from its snapshot dict.
+
+    ``path`` and ``label`` are required; ``group`` defaults to ``None`` and
+    ``primary_docs`` to an empty list.
+    """
+    route_path = data["path"]
+    label = data["label"]
+    group = data.get("group")
+    docs = [doc_ref_from_dict(entry) for entry in data.get("primary_docs", [])]
+    return ProductRoute(path=route_path, label=label, group=group, primary_docs=docs)
+
+
+def extract_frontend_snapshot(frontend_root: Path) -> dict:
+    """Gather route/help-link data from a frontend checkout as a JSON-ready payload.
+
+    The payload is meant to be vendored in the docs repo. It holds a format
+    ``version`` (1), a UTC ISO-8601 ``generated_at`` timestamp, the serialized
+    ``settings`` and ``nav`` routes, and ``file_links`` (route -> serialized
+    doc refs, with routes in sorted order).
+    """
+    settings_routes = parse_settings_index(frontend_root)
+    nav_routes = parse_sidebar_nav(frontend_root)
+    links_by_route = scan_frontend_doc_links(frontend_root)
+
+    snapshot: dict = {"version": 1}
+    snapshot["generated_at"] = datetime.now(timezone.utc).isoformat()
+    snapshot["settings"] = list(map(route_to_dict, settings_routes))
+    snapshot["nav"] = list(map(route_to_dict, nav_routes))
+    snapshot["file_links"] = {
+        route_path: list(map(doc_ref_to_dict, doc_refs))
+        for route_path, doc_refs in sorted(links_by_route.items())
+    }
+    return snapshot
+
+
+def load_frontend_snapshot(snapshot_path: Path) -> tuple[list[ProductRoute], list[ProductRoute], dict[str, list[DocRef]]]:
+    """Read a snapshot JSON file back into route and doc-ref objects.
+
+    Missing ``settings``, ``nav`` or ``file_links`` keys are treated as empty.
+
+    Returns:
+        ``(settings_routes, nav_routes, file_links)``.
+    """
+    raw = json.loads(snapshot_path.read_text(encoding="utf-8"))
+
+    def routes_under(key: str) -> list[ProductRoute]:
+        return [route_from_dict(entry) for entry in raw.get(key, [])]
+
+    settings = routes_under("settings")
+    nav = routes_under("nav")
+    file_links: dict[str, list[DocRef]] = {}
+    for route_path, entries in raw.get("file_links", {}).items():
+        file_links[route_path] = [doc_ref_from_dict(entry) for entry in entries]
+    return settings, nav, file_links
+
+
+def write_frontend_snapshot(snapshot_path: Path, payload: dict) -> None:
+    """Write ``payload`` as 2-space-indented JSON plus a final newline, creating parent folders."""
+    target_dir = snapshot_path.parent
+    target_dir.mkdir(parents=True, exist_ok=True)
+    serialized = json.dumps(payload, indent=2)
+    snapshot_path.write_text(f"{serialized}\n", encoding="utf-8")
+
+
+def resolve_frontend_root(repo_root: Path, explicit: Path | None) -> Path:
+    """Locate the frontend checkout.
+
+    An ``explicit`` path is used when given and must be a directory. Otherwise
+    ``<repo_root>/frontend`` and then ``<repo_root>/../frontend`` are tried.
+
+    Returns:
+        The resolved frontend directory.
+
+    Raises:
+        SystemExit: If no candidate is an existing directory.
+    """
+    if explicit is not None:
+        chosen = explicit.resolve()
+        if not chosen.is_dir():
+            raise SystemExit(f"Frontend root not found: {chosen}")
+        return chosen
+
+    defaults = [repo_root / "frontend", repo_root.parent / "frontend"]
+    located = next((option for option in defaults if option.is_dir()), None)
+    if located is None:
+        raise SystemExit(
+            "Frontend root not found. Use --from-frontend with a local checkout, or rely on "
+            f"the committed snapshot at site/llm/{DEFAULT_SNAPSHOT_NAME}."
+        )
+    return located.resolve()
+
+
+def merge_routes(
+    settings: list[ProductRoute],
+    nav: list[ProductRoute],
+    file_links: dict[str, list[DocRef]],
+) -> dict[str, ProductRoute]:
+    """Combine settings routes, nav routes and per-file doc links by route path.
+
+    Settings routes are registered first, then nav routes. When a path shows
+    up again, the first route object is kept; it takes over the newcomer's
+    label only if its own label is still just the path, and the newcomer's
+    group only if it has none. Finally, doc refs from ``file_links`` are
+    appended to the matching route's primary docs (skipping refs whose
+    ``key`` is already present); unknown paths get a new "Main navigation"
+    route labeled with the path.
+
+    Returns:
+        Routes keyed by path, in registration order.
+    """
+    merged: dict[str, ProductRoute] = {}
+
+    for incoming in [*settings, *nav]:
+        kept = merged.setdefault(incoming.path, incoming)
+        if kept is incoming:
+            # Newly registered (or the very same object again): nothing to merge.
+            continue
+        if incoming.label and kept.label == incoming.path:
+            kept.label = incoming.label
+        if incoming.group and not kept.group:
+            kept.group = incoming.group
+
+    for route_path, doc_refs in file_links.items():
+        if route_path not in merged:
+            merged[route_path] = ProductRoute(
+                path=route_path, label=route_path, group="Main navigation"
+            )
+        target = merged[route_path]
+        present = {doc.key for doc in target.primary_docs}
+        for doc in doc_refs:
+            if doc.key in present:
+                continue
+            present.add(doc.key)
+            target.primary_docs.append(doc)
+
+    return merged
+
+
+def format_doc_line(
+    ref: DocRef, site_dir: Path, llm_output_dir: Path | None
+) -> str:
+    """Render one doc reference as a markdown bullet with optional sub-bullets.
+
+    The bullet shows the doc path (and anchor, if any). When the matching
+    ``.qmd`` source exists, up to eight of its headings are listed, and a note
+    is added if ``llm_output_dir`` is given but lacks the corresponding
+    ``.md`` file. When no ``.qmd`` source is found, a note says so.
+    """
+    bullet = f"- `{ref.path}`"
+    if ref.anchor:
+        bullet += f" (section: #{ref.anchor})"
+    pieces = [bullet]
+
+    source_qmd = html_path_to_qmd(site_dir, ref.path)
+    if not source_qmd:
+        pieces.append("  - Note: no matching `.qmd` source found")
+        return "\n".join(pieces)
+
+    section_titles = extract_headings(source_qmd)
+    if section_titles:
+        pieces.append(f"  - Sections: {'; '.join(section_titles[:8])}")
+    if llm_output_dir:
+        relative_md = source_qmd.relative_to(site_dir).with_suffix(".md").as_posix()
+        if not (llm_output_dir / relative_md).is_file():
+            pieces.append("  - Note: not yet in `_llm-output` (run `make render-llm`)")
+    return "\n".join(pieces)
+
+
+def render_markdown(
+    routes: dict[str, ProductRoute],
+    site_dir: Path,
+    all_doc_paths: list[str],
+    llm_output_dir: Path | None,
+) -> str:
+    """Render the product-to-documentation map as a markdown document.
+
+    Routes are listed under "Settings" (paths starting with ``/settings``,
+    with a sub-heading whenever the group changes) and "Main application"
+    (everything else), each sorted by path. Per route, primary docs come
+    first, then up to six related docs, then any notes.
+
+    Side effects: for a route without primary docs, a note is appended to
+    ``route.notes`` and, when keyword suggestions exist, they are stored in
+    ``route.related_docs``.
+
+    Returns:
+        The markdown text, ending with a newline.
+    """
+    out = [
+        "# ValidMind product-to-documentation map",
+        "",
+        "> Auto-generated. Maps in-product routes to documentation URLs and key sections.",
+        "> For how documentation is organized by topic, see `AGENTS.md` and",
+        "> [Using the documentation](/about/using-the-documentation.html).",
+        "",
+    ]
+
+    # sorted() is stable, so sorting once and then splitting gives the same
+    # order as sorting each half on its own.
+    ordered = sorted(routes.values(), key=lambda route: route.path)
+    settings_routes = [route for route in ordered if route.path.startswith("/settings")]
+    other_routes = [route for route in ordered if not route.path.startswith("/settings")]
+
+    def doc_block(heading: str, refs: list[DocRef]) -> list[str]:
+        block = [heading, ""]
+        block.extend(format_doc_line(ref, site_dir, llm_output_dir) for ref in refs)
+        block.append("")
+        return block
+
+    def render_section(title: str, section_routes: list[ProductRoute]) -> None:
+        if not section_routes:
+            return
+        out.extend([f"## {title}", ""])
+        show_groups = title == "Settings"
+        current_group: str | None = None
+        for route in section_routes:
+            if show_groups and route.group and route.group != current_group:
+                current_group = route.group
+                out.extend([f"### {current_group}", ""])
+            out.extend([f"#### `{route.path}` — {route.label}", ""])
+
+            inferred: list[DocRef] | None = None
+            if route.primary_docs:
+                out.extend(doc_block("**Docs (primary):**", route.primary_docs))
+            else:
+                inferred = suggest_related_docs(route, all_doc_paths)
+                if inferred:
+                    route.related_docs = inferred
+                    route.notes.append(
+                        "No direct help link in frontend; related docs inferred from keywords."
+                    )
+                else:
+                    route.notes.append(
+                        "No direct help link; content may be covered under scattered guide sections."
+                    )
+
+            related = route.related_docs
+            if not related:
+                # Reuse the lookup made above when there was one; it would
+                # return the same suggestions again.
+                if inferred is not None:
+                    related = inferred
+                else:
+                    related = suggest_related_docs(route, all_doc_paths)
+            # Exclude primary from related
+            primary_paths = {doc.path for doc in route.primary_docs}
+            related = [ref for ref in related if ref.path not in primary_paths]
+            if related:
+                out.extend(doc_block("**Docs (related):**", related[:6]))
+            out.extend(f"- *{note}*" for note in route.notes)
+            if route.notes:
+                out.append("")
+
+    render_section("Settings", settings_routes)
+    render_section("Main application", other_routes)
+
+    out += [
+        "## Documentation index (human-oriented)",
+        "",
+        "See `AGENTS.md` and `about/using-the-documentation.md` in the "
+        "LLM corpus for guides organized by feature area (Configuration, Workflows, "
+        "Inventory, etc.).",
+        "",
+    ]
+    return "\n".join(out)
+
+
+def main() -> int:
+    """Command-line entry point: build the chatbot product-to-docs map.
+
+    With ``--from-frontend`` the route/help-link data is re-extracted from a
+    frontend checkout and the snapshot file is rewritten first; otherwise an
+    existing snapshot is required. The merged routes are rendered to markdown
+    and, if ``--json-output`` is given, also dumped as JSON.
+
+    Returns:
+        0 on success.
+
+    Raises:
+        SystemExit: If the snapshot (or, with ``--from-frontend``, the
+            frontend checkout) cannot be found.
+    """
+    parser = argparse.ArgumentParser(description="Generate chatbot product-to-docs map")
+    parser.add_argument(
+        "--from-frontend",
+        action="store_true",
+        help="Re-extract route/help-link data from frontend and update the committed snapshot",
+    )
+    parser.add_argument(
+        "--frontend-root",
+        type=Path,
+        default=None,
+        help="Path to validmind/frontend (only with --from-frontend)",
+    )
+    parser.add_argument(
+        "--snapshot",
+        type=Path,
+        default=None,
+        help=f"Frontend snapshot JSON (default: site/llm/{DEFAULT_SNAPSHOT_NAME})",
+    )
+    parser.add_argument(
+        "--site-dir",
+        type=Path,
+        default=None,
+        help="Path to documentation site/ (default: <repo>/site)",
+    )
+    parser.add_argument(
+        "--output",
+        type=Path,
+        default=None,
+        help="Output markdown path (default: site/llm/chatbot-product-map.md)",
+    )
+    parser.add_argument(
+        "--json-output",
+        type=Path,
+        default=None,
+        help="Optional JSON output of merged routes (debug/tooling)",
+    )
+    args = parser.parse_args()
+
+    repo_root = find_repo_root()
+    site_dir = (args.site_dir or repo_root / "site").resolve()
+    snapshot_path = (
+        args.snapshot or site_dir / "llm" / DEFAULT_SNAPSHOT_NAME
+    ).resolve()
+    output_path = (args.output or site_dir / "llm/chatbot-product-map.md").resolve()
+    llm_output = site_dir / "llm/_llm-output"
+
+    if args.from_frontend:
+        frontend_root = resolve_frontend_root(repo_root, args.frontend_root)
+        payload = extract_frontend_snapshot(frontend_root)
+        write_frontend_snapshot(snapshot_path, payload)
+        print(f"Wrote {snapshot_path}")
+    elif not snapshot_path.is_file():
+        raise SystemExit(
+            f"Frontend snapshot not found: {snapshot_path}\n"
+            "Run with --from-frontend and a local validmind/frontend checkout to create it."
+        )
+    # Always read the snapshot back from disk, even right after writing it,
+    # so both modes work from exactly what is stored in the file.
+    settings, nav, file_links = load_frontend_snapshot(snapshot_path)
+
+    routes = merge_routes(settings, nav, file_links)
+    all_doc_paths = collect_all_doc_qmd_paths(site_dir)
+
+    md = render_markdown(routes, site_dir, all_doc_paths, llm_output if llm_output.is_dir() else None)
+    output_path.parent.mkdir(parents=True, exist_ok=True)
+    output_path.write_text(md, encoding="utf-8")
+    print(f"Wrote {output_path} ({len(routes)} routes)")
+
+    if args.json_output:
+        payload = {
+            path: {
+                "label": r.label,
+                "group": r.group,
+                "primary_docs": [doc_ref_to_dict(d) for d in r.primary_docs],
+                "related_docs": [doc_ref_to_dict(d) for d in r.related_docs],
+                "notes": r.notes,
+            }
+            for path, r in sorted(routes.items())
+        }
+        # Like the markdown output above: create missing parent folders first.
+        args.json_output.parent.mkdir(parents=True, exist_ok=True)
+        args.json_output.write_text(json.dumps(payload, indent=2) + "\n", encoding="utf-8")
+        print(f"Wrote {args.json_output}")
+
+    return 0
+
+
+# Script entry point: exit the process with main()'s return value as its status.
+if __name__ == "__main__":
+    raise SystemExit(main())
diff --git a/site/scripts/lighthouse_urls.py b/site/scripts/lighthouse_urls.py
new file mode 100644
index 0000000000..b7aa13619b
--- /dev/null
+++ b/site/scripts/lighthouse_urls.py
@@ -0,0 +1,314 @@
+#!/usr/bin/env python3
+"""Generate Lighthouse preview URLs from PR diffs or sitemap depth."""
+
+from __future__ import annotations
+
+import argparse
+import fnmatch
+import json
+import os
+import re
+import subprocess
+import sys
+import xml.etree.ElementTree as ET
+from pathlib import Path
+from urllib.parse import urlparse
+
+import requests
+
+# Top-level landing pages. They are the audit set when a site-wide file
+# changes (see GLOBAL_PATTERNS) and when sitemap mode runs with depth 0.
+ROOT_PAGES = [
+    "index.html",
+    "get-started/get-started.html",
+    "guide/guides.html",
+    "developer/validmind-library.html",
+    "support/support.html",
+    "releases/all-releases.html",
+    "training/training.html",
+]
+
+# fnmatch-style patterns for changed files that are treated as affecting the
+# whole site rather than a single page (checked by _matches_global_pattern).
+GLOBAL_PATTERNS = [
+    "site/_quarto.yml",
+    "site/_quarto-*.yml",
+    "site/_variables.yml",
+    "site/theme.scss",
+    "site/styles.css",
+    "site/_extensions/**",
+]
+
+# Matches a whole `output-file: <name>.html` line in a .qmd file. Group 1 is
+# the file name, captured after skipping at most one leading underscore.
+OUTPUT_FILE_RE = re.compile(
+    r"^\s*output-file:\s*[_]?([^\s#]+\.html)\s*$",
+    re.MULTILINE,
+)
+
+# Namespace prefix map used for the ElementTree queries on sitemap.xml.
+SITEMAP_NS = {"sm": "http://www.sitemaps.org/schemas/sitemap/0.9"}
+
+
+def _matches_global_pattern(path: str) -> bool:
+    """Return True when ``path`` matches at least one entry of ``GLOBAL_PATTERNS``."""
+    return any(fnmatch.fnmatch(path, candidate) for candidate in GLOBAL_PATTERNS)
+
+
+def _parse_output_file(qmd_path: Path) -> str | None:
+    """Return the HTML path set by an ``output-file:`` line in a ``.qmd`` file.
+
+    Args:
+        qmd_path: Path to the source file, expected to be relative and to
+            start with ``site/`` (it is rebased against ``Path("site")``).
+
+    Returns:
+        The site-relative HTML path, with forward slashes and any leading
+        underscores removed from the file name, or ``None`` when the file
+        cannot be read or decoded, has no ``output-file`` line, or does not
+        live under ``site/``.
+    """
+    try:
+        text = qmd_path.read_text(encoding="utf-8")
+    except (OSError, UnicodeDecodeError):
+        # Best effort: an unreadable or non-UTF-8 file simply has no override.
+        return None
+    match = OUTPUT_FILE_RE.search(text)
+    if not match:
+        return None
+    name = match.group(1).lstrip("_")
+    try:
+        parent = qmd_path.parent.relative_to(Path("site"))
+    except ValueError:
+        # Not under the relative "site" directory: no site-relative path exists.
+        return None
+    return str(parent / name).replace("\\", "/")
+
+
+def qmd_path_to_html(path: str) -> str | None:
+    """Translate a ``.qmd`` source path under ``site/`` into its preview HTML path.
+
+    ``site/guide/foo.qmd`` becomes ``guide/foo.html``. Paths outside
+    ``site/`` and paths that are not ``.qmd`` files yield ``None``.
+    """
+    prefix = "site/"
+    if not path.startswith(prefix):
+        return None
+
+    source = Path(path[len(prefix) :])
+    if source.suffix != ".qmd":
+        return None
+    # index.qmd needs no special case: swapping the suffix already yields
+    # index.html in the same directory.
+    return str(source.with_suffix(".html")).replace("\\", "/")
+
+
+def asset_path_to_html(path: str) -> str | None:
+    """Find the page that a co-located asset under ``site/`` belongs to.
+
+    A ``.qmd`` path is delegated to ``qmd_path_to_html``. For any other file,
+    the asset's directory is inspected on disk (relative to the current
+    working directory): its ``index.qmd`` wins if present, otherwise the
+    first other ``.qmd`` file in sorted order is used.
+
+    Returns:
+        The page's HTML path, or ``None`` for paths outside ``site/``, files
+        directly in ``site/``, and directories without any ``.qmd`` file.
+    """
+    if not path.startswith("site/"):
+        return None
+    asset = Path(path[len("site/") :])
+    if asset.suffix == ".qmd":
+        return qmd_path_to_html(path)
+
+    folder = asset.parent
+    if folder == Path("."):
+        return None
+
+    folder_on_disk = Path("site") / folder
+    if (folder_on_disk / "index.qmd").exists():
+        page = "index.html"
+    else:
+        siblings = sorted(
+            source for source in folder_on_disk.glob("*.qmd") if source.name != "index.qmd"
+        )
+        if not siblings:
+            return None
+        page = f"{siblings[0].stem}.html"
+    return str(folder / page).replace("\\", "/")
+
+
+def changed_file_to_html(path: str) -> list[str]:
+    """List the HTML pages affected by one changed file.
+
+    * Site-wide files (see ``GLOBAL_PATTERNS``) -> a copy of ``ROOT_PAGES``.
+    * ``.qmd`` files -> their HTML path plus, if the file exists and declares
+      a different ``output-file``, that path as well.
+    * Anything else -> the page owning the asset, if one can be found.
+    """
+    if _matches_global_pattern(path):
+        return list(ROOT_PAGES)
+
+    if not path.endswith(".qmd"):
+        owner = asset_path_to_html(path)
+        return [owner] if owner else []
+
+    default_html = qmd_path_to_html(path)
+    if not default_html:
+        return []
+    pages = [default_html]
+    source = Path(path)
+    if source.exists():
+        override = _parse_output_file(source)
+        if override and override != default_html:
+            pages.append(override)
+    return pages
+
+
+def git_changed_files(base_ref: str) -> list[str]:
+    """Return the files under ``site/`` that differ between ``origin/<base_ref>`` and HEAD.
+
+    ``base_ref`` is fetched from ``origin`` first; the comparison is a
+    three-dot ``git diff --name-only`` restricted to the top-level ``site/``
+    directory.
+
+    Raises:
+        subprocess.CalledProcessError: If either git command fails.
+    """
+    fetch_cmd = ["git", "fetch", "origin", base_ref]
+    subprocess.run(fetch_cmd, check=True, capture_output=True)
+
+    diff_cmd = [
+        "git",
+        "diff",
+        "--name-only",
+        f"origin/{base_ref}...HEAD",
+        "--",
+        ":(top)site/",
+    ]
+    completed = subprocess.run(diff_cmd, check=True, capture_output=True, text=True)
+    names = (raw.strip() for raw in completed.stdout.splitlines())
+    return [name for name in names if name]
+
+
+def urls_from_changed_files(base_ref: str) -> tuple[list[str], bool]:
+    """Return sorted HTML paths for the changed files and a global-fallback flag.
+
+    If any changed file matches a global pattern, only the sorted
+    ``ROOT_PAGES`` are returned and the flag is True. Otherwise the pages
+    affected by each changed file are merged, sorted and returned with the
+    flag set to False. No changed files at all gives ``([], False)``.
+    """
+    changed = git_changed_files(base_ref)
+    if not changed:
+        return [], False
+
+    if any(_matches_global_pattern(name) for name in changed):
+        # A site-wide change replaces the per-file list with the root pages.
+        return sorted(ROOT_PAGES), True
+
+    pages = {html for name in changed for html in changed_file_to_html(name)}
+    return sorted(pages), False
+
+
+def _path_depth(html_path: str) -> int:
+    """Count the path segments of an HTML path; the root index page has depth 0.
+
+    Every ``.html`` occurrence is removed and surrounding slashes are trimmed
+    before counting, e.g. ``guide/guides.html`` -> 2.
+    """
+    trimmed = html_path.replace(".html", "").strip("/")
+    if trimmed in ("", "index"):
+        return 0
+    return sum(1 for segment in trimmed.split("/") if segment)
+
+
+def urls_from_sitemap(preview_base_url: str, max_depth: int) -> list[str]:
+    """Return the sorted HTML paths to audit for a sitemap depth.
+
+    Depth 0 always means the fixed ``ROOT_PAGES`` list and needs no network
+    access. For deeper levels the preview's ``sitemap.xml`` is downloaded and
+    every ``.html`` URL whose path depth is at most ``max_depth`` is kept.
+
+    Args:
+        preview_base_url: Base URL of the preview site.
+        max_depth: Maximum ``_path_depth`` of the pages to include.
+
+    Returns:
+        Sorted, de-duplicated site-relative HTML paths.
+
+    Raises:
+        requests.RequestException: If the sitemap cannot be downloaded
+            (including non-2xx responses).
+        xml.etree.ElementTree.ParseError: If the sitemap is not valid XML.
+    """
+    if max_depth == 0:
+        # The root pages are a fixed list: do not download (and possibly fail
+        # on) a sitemap whose contents would be discarded anyway.
+        return sorted(ROOT_PAGES)
+
+    sitemap_url = f"{preview_base_url.rstrip('/')}/sitemap.xml"
+    response = requests.get(sitemap_url, timeout=60)
+    response.raise_for_status()
+    root = ET.fromstring(response.content)
+    urls: set[str] = set()
+
+    for url_el in root.findall(".//sm:url", SITEMAP_NS):
+        loc = url_el.find("sm:loc", SITEMAP_NS)
+        if loc is None or not loc.text:
+            continue
+        path = urlparse(loc.text).path.lstrip("/")
+        if not path.endswith(".html"):
+            continue
+
+        # URLs containing a "pr_previews" segment carry a preview prefix:
+        # drop everything up to and including the three segments after it.
+        segments = path.split("/")
+        if "pr_previews" in segments:
+            pr_idx = segments.index("pr_previews")
+            if len(segments) > pr_idx + 4:
+                path = "/".join(segments[pr_idx + 4 :])
+
+        if _path_depth(path) <= max_depth:
+            urls.add(path)
+
+    return sorted(urls)
+
+
+def verify_urls(
+    preview_base_url: str,
+    html_paths: list[str],
+    installation_user: str | None = None,
+    installation_password: str | None = None,
+) -> list[str]:
+    """Keep only paths that return HTTP 200 on the preview.
+
+    Each path is probed with ``HEAD`` (following redirects); a ``GET`` is
+    tried when the server answers 405. Pages under ``installation/`` are
+    requested over HTTPS with HTTP basic auth when both credentials are
+    given. Progress and skipped pages are reported on stderr.
+
+    Args:
+        preview_base_url: Base URL of the preview site.
+        html_paths: Site-relative HTML paths to check.
+        installation_user: Basic-auth user for ``installation/`` pages.
+        installation_password: Basic-auth password for ``installation/`` pages.
+
+    Returns:
+        The reachable paths (leading slashes stripped), in input order.
+    """
+    base = preview_base_url.rstrip("/")
+    request_options = {
+        "allow_redirects": True,
+        "timeout": 30,
+        "headers": {"User-Agent": "Mozilla/5.0"},
+    }
+    ok: list[str] = []
+
+    for path in html_paths:
+        path = path.lstrip("/")
+        url = f"{base}/{path}"
+        auth = None
+        if path.startswith("installation/") and installation_user and installation_password:
+            # Hand the credentials to requests via `auth` instead of splicing
+            # them into the URL: characters such as "@", ":" or "/" would
+            # corrupt the URL, and the secret would travel inside a string
+            # that can end up in error messages.
+            parsed = urlparse(url)
+            url = f"https://{parsed.netloc}{parsed.path}"
+            auth = (installation_user, installation_password)
+
+        try:
+            status = requests.head(url, auth=auth, **request_options).status_code
+            if status == 405:
+                # HEAD not allowed by the server: retry with GET.
+                status = requests.get(url, auth=auth, **request_options).status_code
+        except requests.RequestException as exc:
+            print(f"WARN: Could not reach {path}: {exc}", file=sys.stderr)
+            continue
+
+        if status == 200:
+            ok.append(path)
+            print(f"OK: {path}", file=sys.stderr)
+        else:
+            print(f"WARN: Skipping {path} (HTTP {status})", file=sys.stderr)
+
+    return ok
+
+
+def write_url_list(preview_base_url: str, html_paths: list[str], out_path: Path) -> None:
+    """Write one absolute preview URL per line to ``out_path`` (an empty file when there are none)."""
+    root = preview_base_url.rstrip("/")
+    content = "".join(f"{root}/{page.lstrip('/')}\n" for page in html_paths)
+    out_path.write_text(content, encoding="utf-8")
+
+
+def main() -> int:
+    """Command-line entry point: write the list of preview URLs for Lighthouse.
+
+    ``--mode changed`` derives pages from the git diff against ``--base-ref``;
+    ``--mode depth`` derives them from the preview sitemap. Candidate pages
+    are then probed on the preview and only reachable ones are written to
+    ``--output``; a JSON summary goes to ``--metadata``.
+
+    Returns:
+        0 on success (including "nothing to audit"), 1 when none of the
+        candidate pages returned HTTP 200.
+    """
+    parser = argparse.ArgumentParser(description="Generate Lighthouse URL list")
+    parser.add_argument("--mode", choices=["changed", "depth"], required=True)
+    parser.add_argument("--base-ref", default="main")
+    parser.add_argument("--depth", type=int, default=0, choices=[0, 1, 2])
+    parser.add_argument("--preview-url", required=True)
+    parser.add_argument("--output", default="lhci-urls.txt")
+    parser.add_argument("--metadata", default="lighthouse-metadata.json")
+    parser.add_argument(
+        "--skip-file",
+        help="If set and no URLs, write this path so workflow can detect skip",
+    )
+    args = parser.parse_args()
+
+    metadata: dict = {
+        "mode": args.mode,
+        "depth": args.depth if args.mode == "depth" else None,
+        "global_fallback": False,
+        "skip": False,
+        "paths": [],
+    }
+    metadata_file = Path(args.metadata)
+
+    def save_metadata() -> None:
+        metadata_file.write_text(json.dumps(metadata, indent=2), encoding="utf-8")
+
+    if args.mode == "changed":
+        paths, metadata["global_fallback"] = urls_from_changed_files(args.base_ref)
+    else:
+        paths = urls_from_sitemap(args.preview_url, args.depth)
+
+    if not paths:
+        # Nothing to audit: record the skip and leave the URL list unwritten.
+        metadata["skip"] = True
+        save_metadata()
+        if args.skip_file:
+            Path(args.skip_file).write_text("skip\n", encoding="utf-8")
+        print("No pages to audit in this PR.", file=sys.stderr)
+        return 0
+
+    verified = verify_urls(
+        args.preview_url,
+        paths,
+        installation_user=os.environ.get("INSTALLATION_USER"),
+        installation_password=os.environ.get("INSTALLATION_PW"),
+    )
+    if not verified:
+        print("Error: No URLs returned HTTP 200 on the preview.", file=sys.stderr)
+        return 1
+
+    metadata["paths"] = verified
+    save_metadata()
+    write_url_list(args.preview_url, verified, Path(args.output))
+    print(f"Wrote {len(verified)} URL(s) to {args.output}", file=sys.stderr)
+    return 0
+
+
+# Script entry point: exit the process with main()'s return value as its status.
+if __name__ == "__main__":
+    sys.exit(main())
diff --git a/site/scripts/test_generate_chatbot_product_map.py b/site/scripts/test_generate_chatbot_product_map.py
new file mode 100644
index 0000000000..60e48dfb07
--- /dev/null
+++ b/site/scripts/test_generate_chatbot_product_map.py
@@ -0,0 +1,110 @@
+# Copyright © 2023-2026 ValidMind Inc. All rights reserved.
+# SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
+
+"""Unit tests for generate_chatbot_product_map.py"""
+
+import unittest
+from pathlib import Path
+
+import generate_chatbot_product_map as gen
+
+
+class TestGenerateChatbotProductMap(unittest.TestCase):
+    """Unit tests for the helpers in ``generate_chatbot_product_map``."""
+
+    # Documentation site root: this test file lives in site/scripts/.
+    SITE_DIR = Path(__file__).resolve().parents[1]
+
+    def test_resolve_doc_path_alias(self) -> None:
+        """A renamed doc path is mapped to its current location."""
+        self.assertEqual(
+            gen.resolve_doc_path(
+                "/guide/model-workflows/setting-up-model-workflows.html"
+            ),
+            "/guide/workflows/setting-up-workflows.html",
+        )
+
+    def test_parse_doc_refs_from_help_link(self) -> None:
+        """A ``helpLink`` template literal yields exactly one doc ref."""
+        text = (
+            "helpLink={`${CONFIG.VALIDMIND_DOCS_URL}"
+            "/guide/configuration/managing-users.html`}"
+        )
+        refs = gen.parse_doc_refs_from_text(text)
+        self.assertEqual(len(refs), 1)
+        self.assertEqual(refs[0].path, "/guide/configuration/managing-users.html")
+
+    def test_html_path_to_qmd(self) -> None:
+        """An HTML doc path resolves to its ``.qmd`` source in the site tree."""
+        qmd = gen.html_path_to_qmd(
+            self.SITE_DIR, "/guide/workflows/setting-up-workflows.html"
+        )
+        self.assertIsNotNone(qmd)
+        self.assertEqual(qmd.name, "setting-up-workflows.qmd")
+
+    def test_extract_headings(self) -> None:
+        """Headings of the workflows guide mention "workflows"."""
+        qmd = self.SITE_DIR / "guide/workflows/setting-up-workflows.qmd"
+        headings = gen.extract_headings(qmd)
+        self.assertTrue(any("workflows" in h.lower() for h in headings))
+
+    def test_is_user_facing_doc(self) -> None:
+        """``_source`` paths and underscore-prefixed segments are not user-facing."""
+        self.assertTrue(gen.is_user_facing_doc("/guide/workflows/manage-workflow-tasks.html"))
+        self.assertFalse(gen.is_user_facing_doc("/_source/release-notes/foo.html"))
+        self.assertFalse(gen.is_user_facing_doc("/guide/workflows/_partial.html"))
+
+    def test_collect_all_doc_qmd_paths_sorted(self) -> None:
+        """Collected doc paths come back sorted."""
+        paths = gen.collect_all_doc_qmd_paths(self.SITE_DIR)
+        self.assertEqual(paths, sorted(paths))
+
+    def test_suggest_related_docs_sorted_and_stable(self) -> None:
+        """Suggestions are identical across calls and ordered by path."""
+        all_paths = gen.collect_all_doc_qmd_paths(self.SITE_DIR)
+        route = gen.ProductRoute(
+            path="/settings/templates",
+            label="Templates",
+            group="Configuration",
+        )
+        first = gen.suggest_related_docs(route, all_paths)
+        second = gen.suggest_related_docs(route, all_paths)
+        self.assertEqual(first, second)
+        self.assertEqual([r.path for r in first], sorted(r.path for r in first))
+
+    def test_file_to_route_hint_settings_index(self) -> None:
+        """Settings index files map to ``/settings`` and ``/settings/<name>``."""
+        self.assertEqual(
+            gen.file_to_route_hint(Path("src/pages/Settings/index.tsx")),
+            "/settings",
+        )
+        self.assertEqual(
+            gen.file_to_route_hint(Path("src/pages/Settings/Workflows/index.tsx")),
+            "/settings/workflows",
+        )
+
+    def test_frontend_snapshot_roundtrip(self) -> None:
+        """A snapshot written to disk loads back into equivalent objects."""
+        import tempfile  # local import: only this test needs a scratch directory
+
+        payload = {
+            "version": 1,
+            "settings": [
+                {
+                    "path": "/settings/workflows",
+                    "label": "Workflows",
+                    "group": "Governance",
+                    "primary_docs": [
+                        {
+                            "path": "/guide/workflows/setting-up-workflows.html",
+                            "anchor": None,
+                        }
+                    ],
+                }
+            ],
+            "nav": [],
+            "file_links": {},
+        }
+        # Use a throwaway directory instead of the real site/llm folder, so a
+        # crashed or parallel run can never leave files in the source tree.
+        # The nested "llm" folder also exercises parent-directory creation.
+        with tempfile.TemporaryDirectory() as tmp:
+            snapshot_path = Path(tmp) / "llm" / ".test-snapshot.json"
+            gen.write_frontend_snapshot(snapshot_path, payload)
+            settings, nav, file_links = gen.load_frontend_snapshot(snapshot_path)
+            self.assertEqual(len(settings), 1)
+            self.assertEqual(settings[0].path, "/settings/workflows")
+            self.assertEqual(nav, [])
+            self.assertEqual(file_links, {})
+
+
+# Allow running this test module directly as a script.
+if __name__ == "__main__":
+    unittest.main()
diff --git a/site/scripts/test_lighthouse_urls.py b/site/scripts/test_lighthouse_urls.py
new file mode 100644
index 0000000000..8741af75e4
--- /dev/null
+++ b/site/scripts/test_lighthouse_urls.py
@@ -0,0 +1,102 @@
+#!/usr/bin/env python3
+"""Unit tests for lighthouse_urls.py"""
+
+import tempfile
+import unittest
+from pathlib import Path
+from unittest import mock
+
+from lighthouse_urls import (
+    ROOT_PAGES,
+    _matches_global_pattern,
+    asset_path_to_html,
+    changed_file_to_html,
+    qmd_path_to_html,
+    urls_from_changed_files,
+)
+
+
+class TestQmdMapping(unittest.TestCase):
+    def test_simple_qmd(self):
+        self.assertEqual(
+            qmd_path_to_html("site/guide/foo.qmd"),
+            "guide/foo.html",
+        )
+
+    def test_index_qmd(self):
+        self.assertEqual(
+            qmd_path_to_html("site/guide/foo/index.qmd"),
+            "guide/foo/index.html",
+        )
+
+    def test_root_index(self):
+        self.assertEqual(
+            qmd_path_to_html("site/index.qmd"),
+            "index.html",
+        )
+
+
+class TestGlobalPatterns(unittest.TestCase):
+    def test_quarto_yml(self):
+        self.assertTrue(_matches_global_pattern("site/_quarto.yml"))
+
+    def test_theme_scss(self):
+        self.assertTrue(_matches_global_pattern("site/theme.scss"))
+
+    def test_extensions(self):
+        self.assertTrue(_matches_global_pattern("site/_extensions/foo/bar.lua"))
+
+    def test_page_qmd_not_global(self):
+        self.assertFalse(_matches_global_pattern("site/guide/foo.qmd"))
+
+
+class TestChangedFileToHtml(unittest.TestCase):
+    def test_global_returns_root_pages(self):
+        result = changed_file_to_html("site/_quarto.yml")
+        self.assertEqual(result, ROOT_PAGES)
+
+    def test_asset_with_index_qmd(self):
+        import os
+
+        with tempfile.TemporaryDirectory() as tmp:
+            root = Path(tmp)
+            (root / "site" / "guide" / "foo").mkdir(parents=True)
+            (root / "site" / "guide" / "foo" / "index.qmd").write_text("---\n")
+            (root / "site" / "guide" / "foo" / "pic.png").write_bytes(b"")
+            prev = os.getcwd()
+            try:
+                os.chdir(tmp)
+                html = asset_path_to_html("site/guide/foo/pic.png")
+            finally:
+                os.chdir(prev)
+            self.assertEqual(html, "guide/foo/index.html")
+
+
+class TestUrlsFromChangedFiles(unittest.TestCase):
+    def test_empty_diff(self):
+        with mock.patch("lighthouse_urls.git_changed_files", return_value=[]):
+            paths, fallback = urls_from_changed_files("main")
+            self.assertEqual(paths, [])
+            self.assertFalse(fallback)
+
+    def test_single_qmd(self):
+        with mock.patch(
+            "lighthouse_urls.git_changed_files",
+            return_value=["site/developer/how-to/test-sandbox.qmd"],
+        ):
+            paths, fallback = urls_from_changed_files("main")
+            self.assertEqual(paths, ["developer/how-to/test-sandbox.html"])
+            self.assertFalse(fallback)
+
+    def test_global_fallback(self):
+        with mock.patch(
+            "lighthouse_urls.git_changed_files",
+            return_value=["site/_variables.yml", "site/guide/foo.qmd"],
+        ):
+            paths, fallback = urls_from_changed_files("main")
+            self.assertEqual(set(paths), set(ROOT_PAGES))
+            self.assertTrue(fallback)
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/site/support/_submit-feedback.qmd b/site/support/_submit-feedback.qmd
index 605b5f2ba8..8c8122e005 100644
--- a/site/support/_submit-feedback.qmd
+++ b/site/support/_submit-feedback.qmd
@@ -8,7 +8,7 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 Did you know you can submit feedback without leaving the {{< var validmind.platform >}}? 
 
-1. [Log in to ValidMind](/guide/access/log-in-to-validmind.qmd).
+1. [Log in to {{< var vm.product >}}](/guide/access/log-in-to-validmind.qmd).
 
 2. On any page within the {{< var vm.platform >}}, click on **Talk to us.**
 
diff --git a/site/support/support.qmd b/site/support/support.qmd
index aec916f877..ae75dc12e8 100644
--- a/site/support/support.qmd
+++ b/site/support/support.qmd
@@ -23,7 +23,7 @@ listing:
     grid-columns: 1
     contents:
       - path: https://support.validmind.com
-        title: "{{< fa cricle-question >}} {{< var vm.product >}} Help Center"
+        title: "{{< fa circle-question >}} {{< var vm.product >}} Help Center"
         subtitle: "https://{{< var support.center >}} {{< fa angle-right >}}"
         description: "Sign in with your {{< var vm.product >}} account and then click on **Submit a request**."
     fields: [title, subtitle, description]
diff --git a/site/support/troubleshooting.qmd b/site/support/troubleshooting.qmd
index 22427e52a6..443618c45e 100644
--- a/site/support/troubleshooting.qmd
+++ b/site/support/troubleshooting.qmd
@@ -64,9 +64,9 @@ or
 
 ### Fix
 
-Make sure that you are using the correct initialization credentials for the model you are trying to connect to. 
+Make sure that you are using the correct initialization credentials for the record (model) you are trying to connect to. 
 
-Follow the steps in [Install and initialize the {{< var validmind.developer >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd) for detailed instructions on how to integrate the {{< var vm.developer >}} and upload to the {{< var vm.platform >}}.
+Follow the steps in [Install and initialize the {{< var validmind.developer >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd) for detailed instructions on how to integrate the {{< var vm.developer >}} and upload to the {{< var vm.platform >}}.
 
 ## SSL verification errors when initializing the {{< var validmind.developer >}} {#ssl-verification-when-initializing-library} 
 
@@ -98,4 +98,4 @@ Contact your internal IT team. Provide details about your Python environment and
 
 [^2]: [Manage permissions](/guide/configuration/manage-permissions.qmd)
 
-[^3]: [Upgrade {{< var vm.product >}}](/developer/model-documentation/install-and-initialize-validmind-library.qmd#upgrade)
+[^3]: [Upgrade {{< var vm.product >}}](/developer/quickstart/install-and-initialize-validmind-library.qmd#upgrade)
diff --git a/site/tests/_metadata.yml b/site/tests/_metadata.yml
deleted file mode 100644
index 159dcf69a0..0000000000
--- a/site/tests/_metadata.yml
+++ /dev/null
@@ -1,14 +0,0 @@
-# Copyright © 2023-2026 ValidMind Inc. All rights reserved.
-# Refer to the LICENSE file in the root of this repository for details.
-# SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-
-format:
-  html:
-    grid:
-      sidebar-width: 450px
-      margin-width: 450px
-    page-layout: full
-    from: markdown-smart
-    css:
-      - /validmind/validmind.css
-      - /developer/developer.css
\ No newline at end of file
diff --git a/site/tests/data_validation/ACFandPACFPlot.md b/site/tests/data_validation/ACFandPACFPlot.md
deleted file mode 100644
index d649e985cb..0000000000
--- a/site/tests/data_validation/ACFandPACFPlot.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# ACFandPACFPlot
-
-Analyzes time series data using Autocorrelation Function (ACF) and Partial Autocorrelation Function (PACF) plots to
-reveal trends and correlations.
-
-### Purpose
-
-The ACF (Autocorrelation Function) and PACF (Partial Autocorrelation Function) plot test is employed to analyze
-time series data in machine learning models. It illuminates the correlation of the data over time by plotting the
-correlation of the series with its own lags (ACF), and the correlations after removing effects already accounted
-for by earlier lags (PACF). This information can identify trends, such as seasonality, degrees of autocorrelation,
-and inform the selection of order parameters for AutoRegressive Integrated Moving Average (ARIMA) models.
-
-### Test Mechanism
-
-The `ACFandPACFPlot` test accepts a dataset with a time-based index. It first confirms the index is of a datetime
-type, then handles any NaN values. The test subsequently generates ACF and PACF plots for each column in the
-dataset, producing a subplot for each. If the dataset doesn't include key columns, an error is returned.
-
-### Signs of High Risk
-
-- Sudden drops in the correlation at a specific lag might signal a model at high risk.
-- Consistent high correlation across multiple lags could also indicate non-stationarity in the data, which may
-suggest that a model estimated on this data won't generalize well to future, unknown data.
-
-### Strengths
-
-- ACF and PACF plots offer clear graphical representations of the correlations in time series data.
-- These plots are effective at revealing important data characteristics such as seasonality, trends, and
-correlation patterns.
-- The insights from these plots aid in better model configuration, particularly in the selection of ARIMA model
-parameters.
-
-### Limitations
-
-- ACF and PACF plots are exclusively for time series data and hence, can't be applied to all ML models.
-- These plots require large, consistent datasets as gaps could lead to misleading results.
-- The plots can only represent linear correlations and fail to capture any non-linear relationships within the data.
-- The plots might be difficult for non-experts to interpret and should not replace more advanced analyses.
\ No newline at end of file
diff --git a/site/tests/data_validation/ADF.md b/site/tests/data_validation/ADF.md
deleted file mode 100644
index 7dc8863c7c..0000000000
--- a/site/tests/data_validation/ADF.md
+++ /dev/null
@@ -1,36 +0,0 @@
-# ADF
-
-Assesses the stationarity of a time series dataset using the Augmented Dickey-Fuller (ADF) test.
-
-### Purpose
-
-The Augmented Dickey-Fuller (ADF) test metric is used to determine the order of integration, i.e., the stationarity
-of a given time series dataset. The stationary property of data is pivotal in many machine learning models as it
-impacts the reliability and effectiveness of predictions and forecasts.
-
-### Test Mechanism
-
-The ADF test is executed using the `adfuller` function from the `statsmodels` library on each feature of the
-dataset. Multiple outputs are generated for each run, including the ADF test statistic and p-value, count of lags
-used, the number of observations considered in the test, critical values at various confidence levels, and the
-information criterion. These results are stored for each feature for subsequent analysis.
-
-### Signs of High Risk
-
-- An inflated ADF statistic and high p-value (generally above 0.05) indicate a high risk to the model's performance
-due to the presence of a unit root indicating non-stationarity.
-- Non-stationarity might result in untrustworthy or insufficient forecasts.
-
-### Strengths
-
-- The ADF test is robust to sophisticated correlations within the data, making it suitable for settings where data
-displays complex stochastic behavior.
-- It provides explicit outputs like test statistics, critical values, and information criterion, enhancing
-understanding and transparency in the model validation process.
-
-### Limitations
-
-- The ADF test might demonstrate low statistical power, making it challenging to differentiate between a unit root
-and near-unit-root processes, potentially causing false negatives.
-- It assumes the data follows an autoregressive process, which might not always be the case.
-- The test struggles with time series data that have structural breaks.
\ No newline at end of file
diff --git a/site/tests/data_validation/AutoAR.md b/site/tests/data_validation/AutoAR.md
deleted file mode 100644
index 3b6f45019e..0000000000
--- a/site/tests/data_validation/AutoAR.md
+++ /dev/null
@@ -1,43 +0,0 @@
-# AutoAR
-
-Automatically identifies the optimal Autoregressive (AR) order for a time series using BIC and AIC criteria.
-
-### Purpose
-
-The AutoAR test is intended to automatically identify the Autoregressive (AR) order of a time series by utilizing
-the Bayesian Information Criterion (BIC) and Akaike Information Criterion (AIC). AR order is crucial in forecasting
-tasks as it dictates the quantity of prior terms in the sequence to use for predicting the current term. The
-objective is to select the most fitting AR model that encapsulates the trend and seasonality in the time series
-data.
-
-### Test Mechanism
-
-The test mechanism operates by iterating through a possible range of AR orders up to a defined maximum. An AR model
-is fitted for each order, and the corresponding BIC and AIC are computed. BIC and AIC statistical measures are
-designed to penalize models for complexity, preferring simpler models that fit the data proficiently. To verify the
-stationarity of the time series, the Augmented Dickey-Fuller test is executed. The AR order, BIC, and AIC findings
-are compiled into a dataframe for effortless comparison. Then, the AR order with the smallest BIC is established as
-the desirable order for each variable.
-
-### Signs of High Risk
-
-- An augmented Dickey Fuller test p-value > 0.05, indicating the time series isn't stationary, may lead to
-inaccurate results.
-- Problems with the model fitting procedure, such as computational or convergence issues.
-- Continuous selection of the maximum specified AR order may suggest an insufficient set limit.
-
-### Strengths
-
-- The test independently pinpoints the optimal AR order, thereby reducing potential human bias.
-- It strikes a balance between model simplicity and goodness-of-fit to avoid overfitting.
-- Has the capability to account for stationarity in a time series, an essential aspect for dependable AR modeling.
-- The results are aggregated into a comprehensive table, enabling an easy interpretation.
-
-### Limitations
-
-- The tests need a stationary time series input.
-- They presume a linear relationship between the series and its lags.
-- The search for the best model is constrained by the maximum AR order supplied in the parameters. Therefore, a low
-max_ar_order could result in subpar outcomes.
-- AIC and BIC may not always agree on the selection of the best model. This potentially requires the user to juggle
-interpretational choices.
\ No newline at end of file
diff --git a/site/tests/data_validation/AutoMA.md b/site/tests/data_validation/AutoMA.md
deleted file mode 100644
index 29fc90bccc..0000000000
--- a/site/tests/data_validation/AutoMA.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# AutoMA
-
-Automatically selects the optimal Moving Average (MA) order for each variable in a time series dataset based on
-minimal BIC and AIC values.
-
-### Purpose
-
-The `AutoMA` metric serves an essential role of automated decision-making for selecting the optimal Moving Average
-(MA) order for every variable in a given time series dataset. The selection is dependent on the minimalization of
-BIC (Bayesian Information Criterion) and AIC (Akaike Information Criterion); these are established statistical
-tools used for model selection. Furthermore, prior to the commencement of the model fitting process, the algorithm
-conducts a stationarity test (Augmented Dickey-Fuller test) on each series.
-
-### Test Mechanism
-
-Starting off, the `AutoMA` algorithm checks whether the `max_ma_order` parameter has been provided. It consequently
-loops through all variables in the dataset, carrying out the Dickey-Fuller test for stationarity. For each
-stationary variable, it fits an ARIMA model for orders running from 0 to `max_ma_order`. The result is a list
-showcasing the BIC and AIC values of the ARIMA models based on different orders. The MA order, which yields the
-smallest BIC, is chosen as the 'best MA order' for every single variable. The final results include a table
-summarizing the auto MA analysis and another table listing the best MA order for each variable.
-
-### Signs of High Risk
-
-- When a series is non-stationary (p-value>0.05 in the Dickey-Fuller test), the produced result could be inaccurate.
-- Any error that arises in the process of fitting the ARIMA models, especially with a higher MA order, can
-potentially indicate risks and might need further investigation.
-
-### Strengths
-
-- The metric facilitates automation in the process of selecting the MA order for time series forecasting. This
-significantly saves time and reduces efforts conventionally necessary for manual hyperparameter tuning.
-- The use of both BIC and AIC enhances the likelihood of selecting the most suitable model.
-- The metric ascertains the stationarity of the series prior to model fitting, thus ensuring that the underlying
-assumptions of the MA model are fulfilled.
-
-### Limitations
-
-- If the time series fails to be stationary, the metric may yield inaccurate results. Consequently, it necessitates
-pre-processing steps to stabilize the series before fitting the ARIMA model.
-- The metric adopts a rudimentary model selection process based on BIC and doesn't consider other potential model
-selection strategies. Depending on the specific dataset, other strategies could be more appropriate.
-- The 'max_ma_order' parameter must be manually input which doesn't always guarantee optimal performance,
-especially when configured too low.
-- The computation time increases with the rise in `max_ma_order`, hence, the metric may become computationally
-costly for larger values.
\ No newline at end of file
diff --git a/site/tests/data_validation/AutoStationarity.md b/site/tests/data_validation/AutoStationarity.md
deleted file mode 100644
index 7094888928..0000000000
--- a/site/tests/data_validation/AutoStationarity.md
+++ /dev/null
@@ -1,44 +0,0 @@
-# AutoStationarity
-
-Automates Augmented Dickey-Fuller test to assess stationarity across multiple time series in a DataFrame.
-
-### Purpose
-
-The AutoStationarity metric is intended to automatically detect and evaluate the stationary nature of each time
-series in a DataFrame. It incorporates the Augmented Dickey-Fuller (ADF) test, a statistical approach used to
-assess stationarity. Stationarity is a fundamental property suggesting that statistic features like mean and
-variance remain unchanged over time. This is necessary for many time-series models.
-
-### Test Mechanism
-
-The mechanism for the AutoStationarity test involves applying the Augmented Dicky-Fuller test to each time series
-within the given dataframe to assess if they are stationary. Every series in the dataframe is looped, using the ADF
-test up to a defined maximum order (configurable and by default set to 5). The p-value resulting from the ADF test
-is compared against a predetermined threshold (also configurable and by default set to 0.05). The time series is
-deemed stationary at its current differencing order if the p-value is less than the threshold.
-
-### Signs of High Risk
-
-- A significant number of series not achieving stationarity even at the maximum order of differencing can indicate
-high risk or potential failure in the model.
-- This could suggest the series may not be appropriately modeled by a stationary process, hence other modeling
-approaches might be required.
-
-### Strengths
-
-- The key strength in this metric lies in the automation of the ADF test, enabling mass stationarity analysis
-across various time series and boosting the efficiency and credibility of the analysis.
-- The utilization of the ADF test, a widely accepted method for testing stationarity, lends authenticity to the
-results derived.
-- The introduction of the max order and threshold parameters give users the autonomy to determine their preferred
-levels of stringency in the tests.
-
-### Limitations
-
-- The Augmented Dickey-Fuller test and the stationarity test are not without their limitations. These tests are
-premised on the assumption that the series can be modeled by an autoregressive process, which may not always hold
-true.
-- The stationarity check is highly sensitive to the choice of threshold for the significance level; an extremely
-high or low threshold could lead to incorrect results regarding the stationarity properties.
-- There's also a risk of over-differencing if the maximum order is set too high, which could induce unnecessary
-cycles.
\ No newline at end of file
diff --git a/site/tests/data_validation/BivariateScatterPlots.md b/site/tests/data_validation/BivariateScatterPlots.md
deleted file mode 100644
index b945b1421d..0000000000
--- a/site/tests/data_validation/BivariateScatterPlots.md
+++ /dev/null
@@ -1,38 +0,0 @@
-# BivariateScatterPlots
-
-Generates bivariate scatterplots to visually inspect relationships between pairs of numerical predictor variables
-in machine learning classification tasks.
-
-### Purpose
-
-This function is intended for visual inspection and monitoring of relationships between pairs of numerical
-variables in a machine learning model targeting classification tasks. It helps in understanding how predictor
-variables (features) interact with each other, which can inform feature selection, model-building strategies, and
-identify potential biases or irregularities in the data.
-
-### Test Mechanism
-
-The function creates scatter plots for each pair of numerical features in the dataset. It first filters out
-non-numerical and binary features, ensuring the plots focus on meaningful numerical relationships. The resulting
-scatterplots are color-coded uniformly to avoid visual distraction, and the function returns a tuple of Plotly
-figure objects, each representing a scatter plot for a pair of features.
-
-### Signs of High Risk
-
-- Visual patterns suggesting non-linear relationships, multicollinearity, clustering, or outlier points in the
-scatter plots.
-- Such issues could affect the assumptions and performance of certain models, especially those assuming linearity,
-like logistic regression.
-
-### Strengths
-
-- Scatterplots provide an intuitive and visual tool to explore relationships between two variables.
-- They are useful for identifying outliers, variable associations, and trends, including non-linear patterns.
-- Supports visualization of binary or multi-class classification datasets, focusing on numerical features.
-
-### Limitations
-
-- Scatterplots are limited to bivariate analysis, showing relationships between only two variables at a time.
-- Not ideal for very large datasets where overlapping points can reduce the clarity of the visualization.
-- Scatterplots are exploratory tools and do not provide quantitative measures of model quality or performance.
-- Interpretation is subjective and relies on the domain knowledge and judgment of the viewer.
\ No newline at end of file
diff --git a/site/tests/data_validation/BoxPierce.md b/site/tests/data_validation/BoxPierce.md
deleted file mode 100644
index da0c787efd..0000000000
--- a/site/tests/data_validation/BoxPierce.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# BoxPierce
-
-Detects autocorrelation in time-series data through the Box-Pierce test to validate model performance.
-
-### Purpose
-
-The Box-Pierce test is utilized to detect the presence of autocorrelation in a time-series dataset.
-Autocorrelation, or serial correlation, refers to the degree of similarity between observations based on the
-temporal spacing between them. This test is essential for affirming the quality of a time-series model by ensuring
-that the error terms in the model are random and do not adhere to a specific pattern.
-
-### Test Mechanism
-
-The implementation of the Box-Pierce test involves calculating a test statistic along with a corresponding p-value
-derived from the dataset features. These quantities are used to test the null hypothesis that posits the data to be
-independently distributed. This is achieved by iterating over every feature column in the time-series data and
-applying the `acorr_ljungbox` function of the statsmodels library. The function yields the Box-Pierce test
-statistic as well as the respective p-value, all of which are cached as test results.
-
-### Signs of High Risk
-
-- A low p-value, typically under 0.05 as per statistical convention, throws the null hypothesis of independence
-into question. This implies that the dataset potentially houses autocorrelations, thus indicating a high-risk
-scenario concerning model performance.
-- Large Box-Pierce test statistic values may indicate the presence of autocorrelation.
-
-### Strengths
-
-- Detects patterns in data that are supposed to be random, thereby ensuring no underlying autocorrelation.
-- Can be computed efficiently given its low computational complexity.
-- Can be widely applied to most regression problems, making it very versatile.
-
-### Limitations
-
-- Assumes homoscedasticity (constant variance) and normality of residuals, which may not always be the case in
-real-world datasets.
-- May exhibit reduced power for detecting complex autocorrelation schemes such as higher-order or negative
-correlations.
-- It only provides a general indication of the existence of autocorrelation, without providing specific insights
-into the nature or patterns of the detected autocorrelation.
-- In the presence of trends or seasonal patterns, the Box-Pierce test may yield misleading results.
-- Applicability is limited to time-series data, which limits its overall utility.
\ No newline at end of file
diff --git a/site/tests/data_validation/ChiSquaredFeaturesTable.md b/site/tests/data_validation/ChiSquaredFeaturesTable.md
deleted file mode 100644
index 9ed5ef0d0f..0000000000
--- a/site/tests/data_validation/ChiSquaredFeaturesTable.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# ChiSquaredFeaturesTable
-
-Assesses the statistical association between categorical features and a target variable using the Chi-Squared test.
-
-### Purpose
-
-The `ChiSquaredFeaturesTable` function is designed to evaluate the relationship between categorical features and a
-target variable in a dataset. It performs a Chi-Squared test of independence for each categorical feature to
-determine whether a statistically significant association exists with the target variable. This is particularly
-useful in Model Risk Management for understanding the relevance of features and identifying potential biases in a
-classification model.
-
-### Test Mechanism
-
-The function creates a contingency table for each categorical feature and the target variable, then applies the
-Chi-Squared test to compute the Chi-squared statistic and the p-value. The results for each feature include the
-variable name, Chi-squared statistic, p-value, p-value threshold, and a pass/fail status based on whether the
-p-value is below the specified threshold. The output is a DataFrame summarizing these results, sorted by p-value to
-highlight the most statistically significant associations.
-
-### Signs of High Risk
-
-- High p-values (greater than the set threshold) indicate a lack of significant association between a feature and
-the target variable, resulting in a 'Fail' status.
-- Features with a 'Fail' status might not be relevant for the model, which could negatively impact model
-performance.
-
-### Strengths
-
-- Provides a clear, statistical assessment of the relationship between categorical features and the target variable.
-- Produces an easily interpretable summary with a 'Pass/Fail' outcome for each feature, helping in feature
-selection.
-- The p-value threshold is adjustable, allowing for flexibility in statistical rigor.
-
-### Limitations
-
-- Assumes the dataset is tabular and consists of categorical variables, which may not be suitable for all datasets.
-- The test is designed for classification tasks and is not applicable to regression problems.
-- As with all hypothesis tests, the Chi-Squared test can only detect associations, not causal relationships.
-- The choice of p-value threshold can affect the interpretation of feature relevance, and different thresholds may
-lead to different conclusions.
\ No newline at end of file
diff --git a/site/tests/data_validation/ClassImbalance.md b/site/tests/data_validation/ClassImbalance.md
deleted file mode 100644
index da6352b387..0000000000
--- a/site/tests/data_validation/ClassImbalance.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# ClassImbalance
-
-Evaluates and quantifies class distribution imbalance in a dataset used by a machine learning model.
-
-### Purpose
-
-The Class Imbalance test is designed to evaluate the distribution of target classes in a dataset that's utilized by
-a machine learning model. Specifically, it aims to ensure that the classes aren't overly skewed, which could lead
-to bias in the model's predictions. It's crucial to have a balanced training dataset to avoid creating a model
-that's biased with high accuracy for the majority class and low accuracy for the minority class.
-
-### Test Mechanism
-
-This Class Imbalance test operates by calculating the frequency (expressed as a percentage) of each class in the
-target column of the dataset. It then checks whether each class appears in at least a set minimum percentage of the
-total records. This minimum percentage is a modifiable parameter, but the default value is set to 10%.
-
-### Signs of High Risk
-
-- Any class that represents less than the pre-set minimum percentage threshold is marked as high risk, implying a
-potential class imbalance.
-- The function provides a pass/fail outcome for each class based on this criterion.
-- Fundamentally, if any class fails this test, it's highly likely that the dataset possesses imbalanced class
-distribution.
-
-### Strengths
-
-- The test can spot under-represented classes that could affect the efficiency of a machine learning model.
-- The calculation is straightforward and swift.
-- The test is highly informative because it not only spots imbalance, but it also quantifies the degree of
-imbalance.
-- The adjustable threshold enables flexibility and adaptation to differing use-cases or domain-specific needs.
-- The test creates a visually insightful plot showing the classes and their corresponding proportions, enhancing
-interpretability and comprehension of the data.
-
-### Limitations
-
-- The test might struggle to perform well or provide vital insights for datasets with a high number of classes. In
-such cases, the imbalance could be inevitable due to the inherent class distribution.
-- Sensitivity to the threshold value might result in faulty detection of imbalance if the threshold is set
-excessively high.
-- Regardless of the percentage threshold, it doesn't account for varying costs or impacts of misclassifying
-different classes, which might fluctuate based on specific applications or domains.
-- While it can identify imbalances in class distribution, it doesn't provide direct methods to address or correct
-these imbalances.
-- The test is only applicable for classification operations and unsuitable for regression or clustering tasks.
\ No newline at end of file
diff --git a/site/tests/data_validation/DatasetDescription.md b/site/tests/data_validation/DatasetDescription.md
deleted file mode 100644
index 0534eadba5..0000000000
--- a/site/tests/data_validation/DatasetDescription.md
+++ /dev/null
@@ -1,50 +0,0 @@
-# DatasetDescription
-
-Provides comprehensive analysis and statistical summaries of each column in a machine learning model's dataset.
-
-### Purpose
-
-The test depicted in the script is meant to run a comprehensive analysis on a Machine Learning model's datasets.
-The test or metric is implemented to obtain a complete summary of the columns in the dataset, including vital
-statistics of each column such as count, distinct values, missing values, histograms for numerical, categorical,
-boolean, and text columns. This summary gives a comprehensive overview of the dataset to better understand the
-characteristics of the data that the model is trained on or evaluates.
-
-### Test Mechanism
-
-The DatasetDescription class accomplishes the purpose as follows: firstly, the test method "run" infers the data
-type of each column in the dataset and stores the details (id, column type). For each column, the
-"describe_column" method is invoked to collect statistical information about the column, including count,
-missing value count and its proportion to the total, unique value count, and its proportion to the total. Depending
-on the data type of a column, histograms are generated that reflect the distribution of data within the column.
-Numerical columns use the "get_numerical_histograms" method to calculate histogram distribution, whereas for
-categorical, boolean and text columns, a histogram is computed with frequencies of each unique value in the
-datasets. For unsupported types, an error is raised. Lastly, a summary table is built to aggregate all the
-statistical insights and histograms of the columns in a dataset.
-
-### Signs of High Risk
-
-- High ratio of missing values to total values in one or more columns which may impact the quality of the
-predictions.
-- Unsupported data types in dataset columns.
-- Large number of unique values in the dataset's columns which might make it harder for the model to establish
-patterns.
-- Extreme skewness or irregular distribution of data as reflected in the histograms.
-
-### Strengths
-
-- Provides a detailed analysis of the dataset with versatile summaries like count, unique values, histograms, etc.
-- Flexibility in handling different types of data: numerical, categorical, boolean, and text.
-- Useful in detecting problems in the dataset like missing values, unsupported data types, irregular data
-distribution, etc.
-- The summary gives a comprehensive understanding of dataset features allowing developers to make informed
-decisions.
-
-### Limitations
-
-- The computation can be expensive from a resource standpoint, particularly for large datasets with numerous columns.
-- The histograms use an arbitrary number of bins which may not be the optimal number of bins for specific data
-distribution.
-- Unsupported data types for columns will raise an error which may limit evaluating the dataset.
-- Columns with all null or missing values are not included in histogram computation.
-- This test only validates the quality of the dataset but doesn't address the model's performance directly.
\ No newline at end of file
diff --git a/site/tests/data_validation/DatasetSplit.md b/site/tests/data_validation/DatasetSplit.md
deleted file mode 100644
index 5a5eb5c582..0000000000
--- a/site/tests/data_validation/DatasetSplit.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# DatasetSplit
-
-Evaluates and visualizes the distribution proportions among training, testing, and validation datasets of an ML
-model.
-
-### Purpose
-
-The DatasetSplit test is designed to evaluate and visualize the distribution of data among training, testing, and
-validation datasets, if available, within a given machine learning model. The main purpose is to assess whether the
-model's datasets are split appropriately, as an imbalanced split might affect the model's ability to learn from the
-data and generalize to unseen data.
-
-### Test Mechanism
-
-The DatasetSplit test first calculates the total size of all available datasets in the model. Then, for each
-individual dataset, the methodology involves determining the size of the dataset and its proportion relative to the
-total size. The results are then conveniently summarized in a table that shows dataset names, sizes, and
-proportions. Absolute size and proportion of the total dataset size are displayed for each individual dataset.
-
-### Signs of High Risk
-
-- A very small training dataset, which may result in the model not learning enough from the data.
-- A very large training dataset and a small test dataset, which may lead to model overfitting and poor
-generalization to unseen data.
-- A small or non-existent validation dataset, which might complicate the model's performance assessment.
-
-### Strengths
-
-- The DatasetSplit test provides a clear, understandable visualization of dataset split proportions, which can
-highlight any potential imbalance in dataset splits quickly.
-- It covers a wide range of task types including classification, regression, and text-related tasks.
-- The metric is not tied to any specific data type and is applicable to tabular data, time series data, or text
-data.
-
-### Limitations
-
-- The DatasetSplit test does not provide any insight into the quality or diversity of the data within each split,
-just the size and proportion.
-- The test does not give any recommendations or adjustments for imbalanced datasets.
-- Potential lack of compatibility with more complex modes of data splitting (for example, stratified or time-based
-splits) could limit the applicability of this test.
\ No newline at end of file
diff --git a/site/tests/data_validation/DescriptiveStatistics.md b/site/tests/data_validation/DescriptiveStatistics.md
deleted file mode 100644
index edc99ca670..0000000000
--- a/site/tests/data_validation/DescriptiveStatistics.md
+++ /dev/null
@@ -1,45 +0,0 @@
-# DescriptiveStatistics
-
-Performs a detailed descriptive statistical analysis of both numerical and categorical data within a model's
-dataset.
-
-### Purpose
-
-The purpose of the Descriptive Statistics metric is to provide a comprehensive summary of both numerical and
-categorical data within a dataset. This involves statistics such as count, mean, standard deviation, minimum and
-maximum values for numerical data. For categorical data, it calculates the count, number of unique values, most
-common value and its frequency, and the proportion of the most frequent value relative to the total. The goal is to
-visualize the overall distribution of the variables in the dataset, aiding in understanding the model's behavior
-and predicting its performance.
-
-### Test Mechanism
-
-The testing mechanism utilizes two in-built functions of pandas dataframes: `describe()` for numerical fields and
-`value_counts()` for categorical fields. The `describe()` function pulls out several summary statistics, while
-`value_counts()` accounts for unique values. The resulting data is formatted into two distinct tables, one for
-numerical and another for categorical variable summaries. These tables provide a clear summary of the main
-characteristics of the variables, which can be instrumental in assessing the model's performance.
-
-### Signs of High Risk
-
-- Skewed data or significant outliers can represent high risk. For numerical data, this may be reflected via a
-significant difference between the mean and median (50th percentile).
-- For categorical data, a lack of diversity (low count of unique values), or overdominance of a single category
-(high frequency of the top value) can indicate high risk.
-
-### Strengths
-
-- Provides a comprehensive summary of the dataset, shedding light on the distribution and characteristics of the
-variables under consideration.
-- It is a versatile and robust method, applicable to both numerical and categorical data.
-- Helps highlight crucial anomalies such as outliers, extreme skewness, or lack of diversity, which are vital in
-understanding model behavior during testing and validation.
-
-### Limitations
-
-- While this metric offers a high-level overview of the data, it may fail to detect subtle correlations or complex
-patterns.
-- Does not offer any insights on the relationship between variables.
-- Alone, descriptive statistics cannot be used to infer properties about future unseen data.
-- Should be used in conjunction with other statistical tests to provide a comprehensive understanding of the
-model's data.
\ No newline at end of file
diff --git a/site/tests/data_validation/DickeyFullerGLS.md b/site/tests/data_validation/DickeyFullerGLS.md
deleted file mode 100644
index 52d4ad61e4..0000000000
--- a/site/tests/data_validation/DickeyFullerGLS.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# DickeyFullerGLS
-
-Assesses stationarity in time series data using the Dickey-Fuller GLS test to determine the order of integration.
-
-### Purpose
-
-The Dickey-Fuller GLS (DFGLS) test is utilized to determine the order of integration in time series data. For
-machine learning models dealing with time series and forecasting, this metric evaluates the existence of a unit
-root, thereby checking whether a time series is non-stationary. This analysis is a crucial initial step when
-dealing with time series data.
-
-### Test Mechanism
-
-This code implements the Dickey-Fuller GLS unit root test on each attribute of the dataset. This process involves
-iterating through every column of the dataset and applying the DFGLS test to assess the presence of a unit root.
-The resulting information, including the test statistic ('stat'), the p-value ('pvalue'), the quantity of lagged
-differences utilized in the regression ('usedlag'), and the number of observations ('nobs'), is subsequently stored.
-
-### Signs of High Risk
-
-- A high p-value for the DFGLS test represents a high risk. Specifically, a p-value above a typical threshold of
-0.05 suggests that the time series data is quite likely to be non-stationary, thus presenting a high risk for
-generating unreliable forecasts.
-
-### Strengths
-
-- The Dickey-Fuller GLS test is a potent tool for checking the stationarity of time series data.
-- It helps to verify the assumptions of the models before the actual construction of the machine learning models
-proceeds.
-- The results produced by this metric offer a clear insight into whether the data is appropriate for specific
-machine learning models, especially those demanding the stationarity of time series data.
-
-### Limitations
-
-- Despite its benefits, the DFGLS test does present some drawbacks. It can potentially lead to inaccurate
-conclusions if the time series data incorporates a structural break.
-- If the time series tends to follow a trend while still being stationary, the test might misinterpret it,
-necessitating further detrending.
-- The test also presents challenges when dealing with shorter time series data or volatile data, not producing
-reliable results in these cases.
\ No newline at end of file
diff --git a/site/tests/data_validation/Duplicates.md b/site/tests/data_validation/Duplicates.md
deleted file mode 100644
index e590e437ca..0000000000
--- a/site/tests/data_validation/Duplicates.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# Duplicates
-
-Tests dataset for duplicate entries, ensuring model reliability via data quality verification.
-
-### Purpose
-
-The 'Duplicates' test is designed to check for duplicate rows within the dataset provided to the model. It serves
-as a measure of data quality, ensuring that the model isn't merely memorizing duplicate entries or being swayed by
-redundant information. This is an important step in the pre-processing of data for both classification and
-regression tasks.
-
-### Test Mechanism
-
-This test operates by checking each row for duplicates in the dataset. If a text column is specified in the
-dataset, the test is conducted on this column; if not, the test is run on all feature columns. The number and
-percentage of duplicates are calculated and returned in a DataFrame. Additionally, a test is passed if the total
-count of duplicates falls below a specified minimum threshold.
-
-### Signs of High Risk
-
-- A high number of duplicate rows in the dataset, which can lead to overfitting where the model performs well on
-the training data but poorly on unseen data.
-- A high percentage of duplicate rows in the dataset, indicating potential problems with data collection or
-processing.
-
-### Strengths
-
-- Assists in improving the reliability of the model's training process by ensuring the training data is not
-contaminated with duplicate entries, which can distort statistical analyses.
-- Provides both absolute numbers and percentage values of duplicate rows, giving a thorough overview of data
-quality.
-- Highly customizable as it allows for setting a user-defined minimum threshold to determine if the test has been
-passed.
-
-### Limitations
-
-- Does not distinguish between benign duplicates (i.e., coincidental identical entries in different rows) and
-problematic duplicates originating from data collection or processing errors.
-- The test becomes more computationally intensive as the size of the dataset increases, which might not be suitable
-for very large datasets.
-- Can only check for exact duplicates and may miss semantically similar information packaged differently.
\ No newline at end of file
diff --git a/site/tests/data_validation/EngleGrangerCoint.md b/site/tests/data_validation/EngleGrangerCoint.md
deleted file mode 100644
index 3f9c85e35a..0000000000
--- a/site/tests/data_validation/EngleGrangerCoint.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# EngleGrangerCoint
-
-Assesses the degree of co-movement between pairs of time series data using the Engle-Granger cointegration test.
-
-### Purpose
-
-The intent of this Engle-Granger cointegration test is to explore and quantify the degree of co-movement between
-pairs of time series variables in a dataset. This is particularly useful in enhancing the accuracy of predictive
-regressions whenever the underlying variables are co-integrated, i.e., they move together over time.
-
-### Test Mechanism
-
-The test first drops any missing (NA) values from the input dataset and then iterates over each pair of variables
-to apply the Engle-Granger cointegration test. The test generates a 'p' value, which is then compared against a
-pre-specified threshold (0.05 by default). The pair is labeled as 'Cointegrated' if the 'p' value is less than or
-equal to the threshold or 'Not cointegrated' otherwise. A summary table is returned by the metric showing
-cointegration results for each variable pair.
-
-### Signs of High Risk
-
-- A significant number of hypothesized cointegrated variables do not pass the test.
-- A considerable number of 'p' values are close to the threshold, indicating minor data fluctuations can switch the
-decision between 'Cointegrated' and 'Not cointegrated'.
-
-### Strengths
-
-- Provides an effective way to analyze relationships between time series, particularly in contexts where it's
-essential to check if variables move together in a statistically significant manner.
-- Useful in various domains, especially finance or economics, where predictive models often hinge on understanding
-how different variables move together over time.
-
-### Limitations
-
-- Assumes that the time series are integrated of the same order, which isn't always true in multivariate time
-series datasets.
-- The presence of non-stationary characteristics in the series or structural breaks can result in falsely positive
-or negative cointegration results.
-- May not perform well for small sample sizes due to lack of statistical power and should be supplemented with
-other predictive indicators for a more robust model evaluation.
\ No newline at end of file
diff --git a/site/tests/data_validation/FeatureTargetCorrelationPlot.md b/site/tests/data_validation/FeatureTargetCorrelationPlot.md
deleted file mode 100644
index 80ce4088db..0000000000
--- a/site/tests/data_validation/FeatureTargetCorrelationPlot.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# FeatureTargetCorrelationPlot
-
-Visualizes the correlation between input features and the model's target output in a color-coded horizontal bar
-plot.
-
-### Purpose
-
-This test is designed to graphically illustrate the correlations between distinct input features and the target
-output of a Machine Learning model. Understanding how each feature influences the model's predictions is crucial—a
-higher correlation indicates a stronger influence of the feature on the target variable. This correlation study is
-especially advantageous during feature selection and for comprehending the model's operation.
-
-### Test Mechanism
-
-This FeatureTargetCorrelationPlot test computes and presents the correlations between the features and the target
-variable using a specific dataset. These correlations are calculated and are then graphically represented in a
-horizontal bar plot, color-coded based on the strength of the correlation. A hovering template can also be utilized
-for informative tooltips. It is possible to specify the features to be analyzed and adjust the graph's height
-according to need.
-
-### Signs of High Risk
-
-- There are no strong correlations (either positive or negative) between features and the target variable. This
-could suggest high risk as the supplied features do not appear to significantly impact the prediction output.
-- The presence of duplicated correlation values might hint at redundancy in the feature set.
-
-### Strengths
-
-- Provides visual assistance to interpreting correlations more effectively.
-- Gives a clear and simple overview of how each feature affects the model's target variable.
-- Beneficial for feature selection and grasping the model's prediction nature.
-- Precise correlation values for each feature are offered by the hover template, contributing to a granular-level
-comprehension.
-
-### Limitations
-
-- The test only accepts numerical data, meaning variables of other types need to be prepared beforehand.
-- The plot assumes all correlations to be linear, thus non-linear relationships might not be captured effectively.
-- Not apt for models that employ complex feature interactions, like Decision Trees or Neural Networks, as the test
-may not accurately reflect their importance.
\ No newline at end of file
diff --git a/site/tests/data_validation/HighCardinality.md b/site/tests/data_validation/HighCardinality.md
deleted file mode 100644
index 6871bc336b..0000000000
--- a/site/tests/data_validation/HighCardinality.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# HighCardinality
-
-Assesses the number of unique values in categorical columns to detect high cardinality and potential overfitting.
-
-### Purpose
-
-The “High Cardinality” test is used to evaluate the number of unique values present in the categorical columns of a
-dataset. In this context, high cardinality implies the presence of a large number of unique, non-repetitive values
-in the dataset.
-
-### Test Mechanism
-
-The test first infers the dataset's type and then calculates an initial numeric threshold based on the test
-parameters. It only considers columns classified as "Categorical". For each of these columns, the number of
-distinct values (n_distinct) and the percentage of distinct values (p_distinct) are calculated. The test will pass
-if n_distinct is less than the calculated numeric threshold. Lastly, the results, which include details such as
-column name, number of distinct values, and pass/fail status, are compiled into a table.
-
-### Signs of High Risk
-
-- A large number of distinct values (high cardinality) in one or more categorical columns implies a high risk.
-- A column failing the test (n_distinct >= num_threshold) is another indicator of high risk.
-
-### Strengths
-
-- The High Cardinality test is effective in early detection of potential overfitting and unwanted noise.
-- It aids in identifying potential outliers and inconsistencies, thereby improving data quality.
-- The test can be applied to both classification and regression task types, demonstrating its versatility.
-
-### Limitations
-
-- The test is restricted to only "Categorical" data types and is thus not suitable for numerical or continuous
-features, limiting its scope.
-- The test does not consider the relevance or importance of unique values in categorical features, potentially
-causing it to overlook critical data points.
-- The threshold (both number and percent) used for the test is static and may not be optimal for diverse datasets
-and varied applications. Further mechanisms to adjust and refine this threshold could enhance its effectiveness.
\ No newline at end of file
diff --git a/site/tests/data_validation/HighPearsonCorrelation.md b/site/tests/data_validation/HighPearsonCorrelation.md
deleted file mode 100644
index 2c029e8fca..0000000000
--- a/site/tests/data_validation/HighPearsonCorrelation.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# HighPearsonCorrelation
-
-Identifies highly correlated feature pairs in a dataset suggesting feature redundancy or multicollinearity.
-
-### Purpose
-
-The High Pearson Correlation test measures the linear relationship between features in a dataset, with the main
-goal of identifying high correlations that might indicate feature redundancy or multicollinearity. Identification
-of such issues allows developers and risk management teams to properly deal with potential impacts on the machine
-learning model's performance and interpretability.
-
-### Test Mechanism
-
-The test works by generating pairwise Pearson correlations for all features in the dataset, then sorting and
-eliminating duplicate and self-correlations. It assigns a Pass or Fail based on whether the absolute value of the
-correlation coefficient surpasses a pre-set threshold (defaulted at 0.3). It lastly returns the top n strongest
-correlations regardless of passing or failing status (where n is 10 by default but can be configured by passing the
-`top_n_correlations` parameter).
-
-### Signs of High Risk
-
-- A high risk indication would be the presence of correlation coefficients exceeding the threshold.
-- If the features share a strong linear relationship, this could lead to potential multicollinearity and model
-overfitting.
-- Redundancy of variables can undermine the interpretability of the model due to uncertainty over the authenticity
-of each individual variable's predictive power.
-
-### Strengths
-
-- Provides a quick and simple means of identifying relationships between feature pairs.
-- Generates a transparent output that displays pairs of correlated variables, the Pearson correlation coefficient,
-and a Pass or Fail status for each.
-- Aids in early identification of potential multicollinearity issues that may disrupt model training.
-
-### Limitations
-
-- Can only delineate linear relationships, failing to shed light on nonlinear relationships or dependencies.
-- Sensitive to outliers where a few outliers could notably affect the correlation coefficient.
-- Limited to identifying redundancy only within feature pairs; may fail to spot more complex relationships among
-three or more variables.
\ No newline at end of file
diff --git a/site/tests/data_validation/IQROutliersBarPlot.md b/site/tests/data_validation/IQROutliersBarPlot.md
deleted file mode 100644
index f81bbde730..0000000000
--- a/site/tests/data_validation/IQROutliersBarPlot.md
+++ /dev/null
@@ -1,48 +0,0 @@
-# IQROutliersBarPlot
-
-Visualizes outlier distribution across percentiles in numerical data using the Interquartile Range (IQR) method.
-
-### Purpose
-
-The InterQuartile Range Outliers Bar Plot (IQROutliersBarPlot) metric aims to visually analyze and evaluate the
-extent of outliers in numeric variables based on percentiles. Its primary purpose is to clarify the dataset's
-distribution, flag possible abnormalities in it, and gauge potential risks associated with processing potentially
-skewed data, which can affect the machine learning model's predictive prowess.
-
-### Test Mechanism
-
-The examination invokes a series of steps:
-
-1. For every numeric feature in the dataset, the 25th percentile (Q1) and 75th percentile (Q3) are calculated
-before deriving the Interquartile Range (IQR), the difference between Q1 and Q3.
-2. Subsequently, the metric calculates the lower and upper thresholds by subtracting `threshold` times IQR from
-Q1 and adding `threshold` times IQR to Q3, respectively. The default `threshold` is set at 1.5.
-3. Any value in the feature that falls below the lower threshold or exceeds the upper threshold is labeled as an
-outlier.
-4. The number of outliers is tallied for different percentiles, such as [0-25], [25-50], [50-75], and [75-100].
-5. These counts are employed to construct a bar plot for the feature, showcasing the distribution of outliers
-across different percentiles.
-
-### Signs of High Risk
-
-- A prevalence of outliers in the data, potentially skewing its distribution.
-- Outliers dominating higher percentiles (75-100) which implies the presence of extreme values, capable of severely
-influencing the model's performance.
-- Certain features harboring most of their values as outliers, which signifies that these features might not
-contribute positively to the model's forecasting ability.
-
-### Strengths
-
-- Effectively identifies outliers in the data through visual means, facilitating easier comprehension and offering
-insights into the outliers' possible impact on the model.
-- Provides flexibility by accommodating all numeric features or a chosen subset.
-- Task-agnostic in nature; it is viable for both classification and regression tasks.
-- Can handle large datasets as its operation does not hinge on computationally heavy operations.
-
-### Limitations
-
-- Its application is limited to numerical variables and does not extend to categorical ones.
-- Only reveals the presence and distribution of outliers and does not provide insights into how these outliers
-might affect the model's predictive performance.
-- The assumption that data is unimodal and symmetric may not always hold true. In cases with non-normal
-distributions, the results can be misleading.
\ No newline at end of file
diff --git a/site/tests/data_validation/IQROutliersTable.md b/site/tests/data_validation/IQROutliersTable.md
deleted file mode 100644
index 25ffac0411..0000000000
--- a/site/tests/data_validation/IQROutliersTable.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# IQROutliersTable
-
-Determines and summarizes outliers in numerical features using the Interquartile Range method.
-
-### Purpose
-
-The "Interquartile Range Outliers Table" (IQROutliersTable) metric is designed to identify and summarize outliers
-within numerical features of a dataset using the Interquartile Range (IQR) method. This exercise is crucial in the
-pre-processing of data because outliers can substantially distort statistical analysis and impact the performance
-of machine learning models.
-
-### Test Mechanism
-
-The IQR, which is the range separating the first quartile (25th percentile) from the third quartile (75th
-percentile), is calculated for each numerical feature within the dataset. An outlier is defined as a data point
-falling below "Q1 - 1.5 * IQR" or above "Q3 + 1.5 * IQR". The test computes the number of outliers and
-their summary statistics (minimum, 25th percentile, median, 75th percentile, and maximum values) for each numerical
-feature. If no specific features are chosen, the test applies to all numerical features in the dataset. The default
-outlier threshold is set to 1.5 but can be customized by the user.
-
-### Signs of High Risk
-
-- A large number of outliers in multiple features.
-- Outliers significantly distanced from the mean value of variables.
-- Extremely high or low outlier values indicative of data entry errors or other data quality issues.
-
-### Strengths
-
-- Provides a comprehensive summary of outliers for each numerical feature, helping pinpoint features with potential
-quality issues.
-- The IQR method is robust to extremely high or low outlier values as it is based on quartile calculations.
-- Can be customized to work on selected features and set thresholds for outliers.
-
-### Limitations
-
-- Might cause false positives if the variable deviates from a normal or near-normal distribution, especially for
-skewed distributions.
-- Does not provide interpretation or recommendations for addressing outliers, relying on further analysis by users
-or data scientists.
-- Only applicable to numerical features, not categorical data.
-- Default thresholds may not be optimal for data with heavy pre-processing, manipulation, or inherently high
-kurtosis (heavy tails).
\ No newline at end of file
diff --git a/site/tests/data_validation/IsolationForestOutliers.md b/site/tests/data_validation/IsolationForestOutliers.md
deleted file mode 100644
index 3e8691a750..0000000000
--- a/site/tests/data_validation/IsolationForestOutliers.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# IsolationForestOutliers
-
-Detects outliers in a dataset using the Isolation Forest algorithm and visualizes results through scatter plots.
-
-### Purpose
-
-The IsolationForestOutliers test is designed to identify anomalies or outliers in the model's dataset using the
-isolation forest algorithm. This algorithm assumes that anomalous data points can be isolated more quickly due to
-their distinctive properties. By creating isolation trees and identifying instances with shorter average path
-lengths, the test is able to pick out data points that differ from the majority.
-
-### Test Mechanism
-
-The test uses the isolation forest algorithm, which builds an ensemble of isolation trees by randomly selecting
-features and splitting the data based on random thresholds. It isolates anomalies rather than focusing on normal
-data points. For each pair of variables, a scatter plot is generated which distinguishes the identified outliers
-from the inliers. The results of the test can be visualized using these scatter plots, illustrating the distinction
-between outliers and inliers.
-
-### Signs of High Risk
-
-- The presence of high contamination, indicating a large number of anomalies
-- Inability to detect clusters of anomalies that are close in the feature space
-- Misclassifying normal instances as anomalies
-- Failure to detect actual anomalies
-
-### Strengths
-
-- Ability to handle large, high-dimensional datasets
-- Efficiency in isolating anomalies instead of normal instances
-- Insensitivity to the underlying distribution of data
-- Ability to recognize anomalies even when they are not separated from the main data cloud through identifying
-distinctive properties
-- Visually presents the test results for better understanding and interpretability
-
-### Limitations
-
-- Difficult to detect anomalies that are close to each other or prevalent in datasets
-- Dependency on the contamination parameter which may need fine-tuning to be effective
-- Potential failure in detecting collective anomalies if they behave similarly to normal data
-- Potential lack of precision in identifying which features contribute most to the anomalous behavior
\ No newline at end of file
diff --git a/site/tests/data_validation/JarqueBera.md b/site/tests/data_validation/JarqueBera.md
deleted file mode 100644
index 26ae5cdd2f..0000000000
--- a/site/tests/data_validation/JarqueBera.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# JarqueBera
-
-Assesses normality of dataset features in an ML model using the Jarque-Bera test.
-
-### Purpose
-
-The purpose of the Jarque-Bera test as implemented in this metric is to determine if the features in the dataset of
-a given Machine Learning model follow a normal distribution. This is crucial for understanding the distribution and
-behavior of the model's features, as numerous statistical methods assume normal distribution of the data.
-
-### Test Mechanism
-
-The test mechanism involves computing the Jarque-Bera statistic, p-value, skew, and kurtosis for each feature in
-the dataset. It utilizes the 'jarque_bera' function from the 'statsmodels' library in Python, storing the results
-in a dictionary. The test evaluates the skewness and kurtosis to ascertain whether the dataset follows a normal
-distribution. A significant p-value (typically less than 0.05) implies that the data does not follow a normal
-distribution.
-
-### Signs of High Risk
-
-- A high Jarque-Bera statistic and a low p-value (usually less than 0.05) indicate high-risk conditions.
-- Such results suggest the data significantly deviates from a normal distribution. If a machine learning model
-expects feature data to be normally distributed, these findings imply that it may not function as intended.
-
-### Strengths
-
-- Provides insights into the shape of the data distribution, helping determine whether a given set of data follows
-a normal distribution.
-- Particularly useful for risk assessment for models that assume a normal distribution of data.
-- By measuring skewness and kurtosis, it provides additional insights into the nature and magnitude of a
-distribution's deviation.
-
-### Limitations
-
-- Only checks for normality in the data distribution. It cannot provide insights into other types of distributions.
-- Datasets that aren't normally distributed but follow some other distribution might lead to inaccurate risk
-assessments.
-- Highly sensitive to large sample sizes, often rejecting the null hypothesis (that data is normally distributed)
-even for minor deviations in larger datasets.
\ No newline at end of file
diff --git a/site/tests/data_validation/KPSS.md b/site/tests/data_validation/KPSS.md
deleted file mode 100644
index f741b3011f..0000000000
--- a/site/tests/data_validation/KPSS.md
+++ /dev/null
@@ -1,38 +0,0 @@
-# KPSS
-
-Assesses the stationarity of time-series data in a machine learning model using the KPSS unit root test.
-
-### Purpose
-
-The KPSS (Kwiatkowski-Phillips-Schmidt-Shin) unit root test is utilized to ensure the stationarity of data within a
-machine learning model. It specifically works on time-series data to establish the order of integration, which is
-essential for accurate forecasting. A fundamental requirement for any time series model is that the series should
-be stationary.
-
-### Test Mechanism
-
-This test calculates the KPSS score for each feature in the dataset. The KPSS score includes a statistic, a
-p-value, a used lag, and critical values. The core principle behind the KPSS test is to evaluate the hypothesis
-that an observable time series is stationary around a deterministic trend. If the computed statistic exceeds the
-critical value, the null hypothesis (that the series is stationary) is rejected, indicating that the series is
-non-stationary.
-
-### Signs of High Risk
-
-- High KPSS score, particularly if the calculated statistic is higher than the critical value.
-- Rejection of the null hypothesis, indicating that the series is recognized as non-stationary, can severely affect
-the model's forecasting capability.
-
-### Strengths
-
-- Directly measures the stationarity of a series, fulfilling a key prerequisite for many time-series models.
-- The underlying logic of the test is intuitive and simple, making it easy to understand and accessible for both
-developers and risk management teams.
-
-### Limitations
-
-- Assumes the absence of a unit root in the series and doesn't differentiate between series that are stationary and
-those that are borderline stationary.
-- The test may have restricted power against certain alternatives.
-- The reliability of the test is contingent on the number of lags selected, which introduces potential bias in the
-measurement.
\ No newline at end of file
diff --git a/site/tests/data_validation/LJungBox.md b/site/tests/data_validation/LJungBox.md
deleted file mode 100644
index d12312abf4..0000000000
--- a/site/tests/data_validation/LJungBox.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# LJungBox
-
-Assesses autocorrelations in dataset features by performing a Ljung-Box test on each feature.
-
-### Purpose
-
-The Ljung-Box test is a type of statistical test utilized to ascertain whether there are autocorrelations within a
-given dataset that differ significantly from zero. In the context of a machine learning model, this test is
-primarily used to evaluate data utilized in regression tasks, especially those involving time series and
-forecasting.
-
-### Test Mechanism
-
-The test operates by iterating over each feature within the dataset and applying the `acorr_ljungbox`
-function from the `statsmodels.stats.diagnostic` library. This function calculates the Ljung-Box statistic and
-p-value for each feature. These results are then stored in a pandas DataFrame where the columns are the feature names,
-statistic, and p-value respectively. Generally, a lower p-value indicates a higher likelihood of significant
-autocorrelations within the feature.
-
-### Signs of High Risk
-
-- High Ljung-Box statistic values or low p-values.
-- Presence of significant autocorrelations in the respective features.
-- Potential for negative impact on model performance or bias if autocorrelations are not properly handled.
-
-### Strengths
-
-- Powerful tool for detecting autocorrelations within datasets, especially in time series data.
-- Provides quantitative measures (statistic and p-value) for precise evaluation.
-- Helps avoid issues related to autoregressive residuals and other challenges in regression models.
-
-### Limitations
-
-- Cannot detect all types of non-linearity or complex interrelationships among variables.
-- Testing individual features may not fully encapsulate the dynamics of the data if features interact with each other.
-- Designed more for traditional statistical models and may not be fully compatible with certain types of complex
-machine learning models.
\ No newline at end of file
diff --git a/site/tests/data_validation/LaggedCorrelationHeatmap.md b/site/tests/data_validation/LaggedCorrelationHeatmap.md
deleted file mode 100644
index e38d2bf5e6..0000000000
--- a/site/tests/data_validation/LaggedCorrelationHeatmap.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# LaggedCorrelationHeatmap
-
-Assesses and visualizes correlation between target variable and lagged independent variables in a time-series
-dataset.
-
-### Purpose
-
-The LaggedCorrelationHeatmap metric is utilized to appraise and illustrate the correlation between the target
-variable and delayed copies (lags) of independent variables in a time-series dataset. It assists in revealing
-relationships in time-series data where the influence of an independent variable on the dependent variable is not
-immediate but occurs after a period (lags).
-
-### Test Mechanism
-
-To execute this test, Python's Pandas library pairs with Plotly to perform computations and present the
-visualization in the form of a heatmap. The test begins by extracting the target variable and corresponding
-independent variables from the dataset. Then, generation of lags of independent variables takes place, followed by
-the calculation of correlation between these lagged variables and the target variable. The outcome is a correlation
-matrix that gets recorded and illustrated as a heatmap, where different color intensities represent the strength of
-the correlation, making patterns easier to identify.
-
-### Signs of High Risk
-
-- Insignificant correlations across the heatmap, indicating a lack of noteworthy relationships between variables.
-- Correlations that break intuition or previous understanding, suggesting potential issues with the dataset or the
-model.
-
-### Strengths
-
-- This metric serves as an exceptional tool for exploring and visualizing time-dependent relationships between
-features and the target variable in a time-series dataset.
-- It aids in identifying delayed effects that might go unnoticed with other correlation measures.
-- The heatmap offers an intuitive visual representation of time-dependent correlations and influences.
-
-### Limitations
-
-- The metric presumes linear relationships between variables, potentially ignoring non-linear relationships.
-- The correlation considered is linear; therefore, intricate non-linear interactions might be overlooked.
-- The metric is only applicable for time-series data, limiting its utility outside of this context.
-- The number of lags chosen can significantly influence the results; too many lags can render the heatmap difficult
-to interpret, while too few might overlook delayed effects.
-- This metric does not take into account any causal relationships, but merely demonstrates correlation.
\ No newline at end of file
diff --git a/site/tests/data_validation/MissingValues.md b/site/tests/data_validation/MissingValues.md
deleted file mode 100644
index 75a78e0f6c..0000000000
--- a/site/tests/data_validation/MissingValues.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# MissingValues
-
-Evaluates dataset quality by ensuring missing value percentage across all features does not exceed a set threshold.
-
-### Purpose
-
-The Missing Values test is designed to evaluate the quality of a dataset by measuring the number of missing values
-across all features. The objective is to ensure that the ratio of missing data to total data is less than a
-predefined threshold (as a percentage), defaulting to 1.0, in order to maintain the data quality necessary for
-reliable predictive strength in a machine learning model.
-
-### Test Mechanism
-
-The mechanism for this test involves iterating through each column of the dataset, counting missing values
-(represented as NaNs), and calculating the percentage they represent against the total number of rows. The test
-then checks if the missing value percentage is less than or equal to the predefined `min_percentage_threshold`. The results are
-shown in a table summarizing each column, the number of missing values, the percentage of missing values in each
-column, and a Pass/Fail status based on the threshold comparison.
-
-### Signs of High Risk
-
-- When the missing value percentage in any column exceeds the `min_percentage_threshold` value.
-- Presence of missing values across many columns, leading to multiple instances of failing the threshold.
-
-### Strengths
-
-- Quick and granular identification of missing data across each feature in the dataset.
-- Provides an effective and straightforward means of maintaining data quality, essential for constructing efficient
-machine learning models.
-
-### Limitations
-
-- Does not suggest the root causes of the missing values or recommend ways to impute or handle them.
-- May overlook features with significant missing data but still less than the `min_percentage_threshold`, potentially
-impacting the model.
-- Does not account for data encoded as values like "-999" or "None," which might not technically classify as
-missing but could bear similar implications.
\ No newline at end of file
diff --git a/site/tests/data_validation/MissingValuesBarPlot.md b/site/tests/data_validation/MissingValuesBarPlot.md
deleted file mode 100644
index eeb95dfdc4..0000000000
--- a/site/tests/data_validation/MissingValuesBarPlot.md
+++ /dev/null
@@ -1,44 +0,0 @@
-# MissingValuesBarPlot
-
-Assesses the percentage and distribution of missing values in the dataset via a bar plot, with emphasis on
-identifying high-risk columns based on a user-defined threshold.
-
-### Purpose
-
-The 'MissingValuesBarPlot' metric provides a color-coded visual representation of the percentage of missing values
-for each column in an ML model's dataset. The primary purpose of this metric is to easily identify and quantify
-missing data, which are essential steps in data preprocessing. The presence of missing data can potentially skew
-the model's predictions and decrease its accuracy. Additionally, this metric uses a pre-set threshold to categorize
-various columns into ones that contain missing data above the threshold (high risk) and below the threshold (less
-risky).
-
-### Test Mechanism
-
-The test mechanism involves scanning each column in the input dataset and calculating the percentage of missing
-values. It then compares each column's missing data percentage with the predefined threshold, categorizing columns
-with missing data above the threshold as high-risk. The test generates a bar plot in which columns with missing
-data are represented on the y-axis and their corresponding missing data percentages are displayed on the x-axis.
-The color of each bar reflects the missing data percentage in relation to the threshold: grey for values below the
-threshold and light coral for those exceeding it. The user-defined threshold is represented by a red dashed line on
-the plot.
-
-### Signs of High Risk
-
-- Columns with higher percentages of missing values beyond the threshold are high-risk. These are visually
-represented by light coral bars on the bar plot.
-
-### Strengths
-
-- Helps in quickly identifying and quantifying missing data across all columns of the dataset.
-- Facilitates pattern recognition through visual representation.
-- Enables customization of the level of risk tolerance via a user-defined threshold.
-- Supports both classification and regression tasks, showing its versatility.
-
-### Limitations
-
-- It only considers the quantity of missing values, not differentiating between different types of missingness
-(Missing completely at random - MCAR, Missing at random - MAR, Not Missing at random - NMAR).
-- It doesn't offer insights into potential approaches for handling missing entries, such as various imputation
-strategies.
-- The metric does not consider possible impacts of the missing data on the model's accuracy or precision.
-- Interpretation of the findings and the next steps might require an expert understanding of the field.
\ No newline at end of file
diff --git a/site/tests/data_validation/MutualInformation.md b/site/tests/data_validation/MutualInformation.md
deleted file mode 100644
index 4b03511652..0000000000
--- a/site/tests/data_validation/MutualInformation.md
+++ /dev/null
@@ -1,50 +0,0 @@
-# MutualInformation
-
-Calculates mutual information scores between features and target variable to evaluate feature relevance.
-
-### Purpose
-
-The Mutual Information test quantifies the predictive power of each feature by measuring its statistical
-dependency with the target variable. This helps identify relevant features for model training and
-detect potentially redundant or irrelevant variables, supporting feature selection decisions and model
-interpretability.
-
-### Test Mechanism
-
-The test employs sklearn's mutual_info_classif/mutual_info_regression functions to compute mutual
-information between each feature and the target. It produces a normalized score (0 to 1) for each
-feature, where higher scores indicate stronger relationships. Results are presented in both tabular
-format and visualized through a bar plot with a configurable threshold line.
-
-### Signs of High Risk
-
-- Many features showing very low mutual information scores
-- Key business features exhibiting unexpectedly low scores
-- All features showing similar, low information content
-- Large discrepancy between business importance and MI scores
-- Highly skewed distribution of MI scores
-- Critical features below the minimum threshold
-- Unexpected zero or near-zero scores for known important features
-- Inconsistent scores across different data samples
-
-### Strengths
-
-- Captures non-linear relationships between features and target
-- Scale-invariant measurement of feature relevance
-- Works for both classification and regression tasks
-- Provides interpretable scores (0 to 1 scale)
-- Supports automated feature selection
-- No assumptions about data distribution
-- Handles numerical and categorical features
-- Computationally efficient for most datasets
-
-### Limitations
-
-- Requires sufficient data for reliable estimates
-- May be computationally intensive for very large datasets
-- Cannot detect redundant features (pairwise relationships)
-- Sensitive to feature discretization for continuous variables
-- Does not account for feature interactions
-- May underestimate importance of rare but crucial events
-- Cannot handle missing values directly
-- May be affected by extreme class imbalance
\ No newline at end of file
diff --git a/site/tests/data_validation/PearsonCorrelationMatrix.md b/site/tests/data_validation/PearsonCorrelationMatrix.md
deleted file mode 100644
index 9f83e71b1e..0000000000
--- a/site/tests/data_validation/PearsonCorrelationMatrix.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# PearsonCorrelationMatrix
-
-Evaluates linear dependency between numerical variables in a dataset via a Pearson Correlation coefficient heat map.
-
-### Purpose
-
-This test is intended to evaluate the extent of linear dependency between all pairs of numerical variables in the
-given dataset. It provides the Pearson Correlation coefficient, which reveals any high correlations present. The
-purpose of doing this is to identify potential redundancy, as variables that are highly correlated can often be
-removed to reduce the dimensionality of the dataset without significantly impacting the model's performance.
-
-### Test Mechanism
-
-This metric test generates a correlation matrix for all numerical variables in the dataset using the Pearson
-correlation formula. A heat map is subsequently created to visualize this matrix effectively. The color of each
-point on the heat map corresponds to the magnitude and direction (positive or negative) of the correlation, with a
-range from -1 (perfect negative correlation) to 1 (perfect positive correlation). Any correlation coefficients
-higher than 0.7 (in absolute terms) are indicated in white in the heat map, suggesting a high degree of correlation.
-
-### Signs of High Risk
-
-- A large number of variables in the dataset showing a high degree of correlation (coefficients approaching ±1).
-This indicates redundancy within the dataset, suggesting that some variables may not be contributing new
-information to the model.
-- Potential risk of overfitting.
-
-### Strengths
-
-- Detects and quantifies the linearity of relationships between variables, aiding in identifying redundant
-variables to simplify models and potentially improve performance.
-- The heatmap visualization provides an easy-to-understand overview of correlations, beneficial for users not
-comfortable with numerical matrices.
-
-### Limitations
-
-- Limited to detecting linear relationships, potentially missing non-linear relationships, which can limit
-opportunities for dimensionality reduction.
-- Measures only the degree of linear relationship, not the strength of one variable's effect on another.
-- The 0.7 correlation threshold is arbitrary and might exclude valid dependencies with lower coefficients.
\ No newline at end of file
diff --git a/site/tests/data_validation/PhillipsPerronArch.md b/site/tests/data_validation/PhillipsPerronArch.md
deleted file mode 100644
index 043128c6ec..0000000000
--- a/site/tests/data_validation/PhillipsPerronArch.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# PhillipsPerronArch
-
-Assesses the stationarity of time series data in each feature of the ML model using the Phillips-Perron test.
-
-### Purpose
-
-The Phillips-Perron (PP) test is used to determine the stationarity of time series data for each feature in a
-dataset, which is crucial for forecasting tasks. It tests the null hypothesis that a time series is unit-root
-non-stationary. This is vital for understanding the stochastic behavior of the data and ensuring the robustness and
-validity of predictions generated by regression analysis models.
-
-### Test Mechanism
-
-The PP test is conducted for each feature in the dataset as follows:
-- A data frame is created from the dataset.
-- For each column, the Phillips-Perron method calculates the test statistic, p-value, lags used, and number of
-observations.
-- The results are then stored for each feature, providing a metric that indicates the stationarity of the time
-series data.
-
-### Signs of High Risk
-
-- A high p-value, indicating that the series has a unit root and is non-stationary.
-- Test statistic values exceeding critical values, suggesting non-stationarity.
-- High 'usedlag' value, pointing towards autocorrelation issues that may degrade model performance.
-
-### Strengths
-
-- Resilience against heteroskedasticity in the error term.
-- Effective for long time series data.
-- Helps in determining whether the time series is stationary, aiding in the selection of suitable forecasting
-models.
-
-### Limitations
-
-- Applicable only within a univariate time series framework.
-- Relies on asymptotic theory, which may reduce the test’s power for small sample sizes.
-- Non-stationary time series must be converted to stationary series through differencing, potentially leading to
-loss of important data points.
\ No newline at end of file
diff --git a/site/tests/data_validation/ProtectedClassesCombination.md b/site/tests/data_validation/ProtectedClassesCombination.md
deleted file mode 100644
index 89cf20f286..0000000000
--- a/site/tests/data_validation/ProtectedClassesCombination.md
+++ /dev/null
@@ -1,34 +0,0 @@
-# ProtectedClassesCombination
-
-Visualizes combinations of protected classes and their corresponding error metric differences.
-
-### Purpose
-
-This test aims to provide insights into how different combinations of protected classes affect various error metrics,
-particularly the false negative rate (FNR) and false positive rate (FPR). By visualizing these combinations,
-it helps identify potential biases or disparities in model performance across different intersectional groups.
-
-### Test Mechanism
-
-The test performs the following steps:
-1. Combines the specified protected class columns to create a single multi-class category.
-2. Calculates error metrics (FNR, FPR, etc.) for each combination of protected classes.
-3. Generates visualizations showing the distribution of these metrics across all class combinations.
-
-### Signs of High Risk
-
-- Large disparities in FNR or FPR across different protected class combinations.
-- Consistent patterns of higher error rates for specific combinations of protected attributes.
-- Unexpected or unexplainable variations in error metrics between similar group combinations.
-
-### Strengths
-
-- Provides a comprehensive view of intersectional fairness across multiple protected attributes.
-- Allows for easy identification of potentially problematic combinations of protected classes.
-- Visualizations make it easier to spot patterns or outliers in model performance across groups.
-
-### Limitations
-
-- May become complex and difficult to interpret with a large number of protected classes or combinations.
-- Does not provide statistical significance of observed differences.
-- Visualization alone may not capture all nuances of intersectional fairness.
\ No newline at end of file
diff --git a/site/tests/data_validation/ProtectedClassesDescription.md b/site/tests/data_validation/ProtectedClassesDescription.md
deleted file mode 100644
index 31a0c672a0..0000000000
--- a/site/tests/data_validation/ProtectedClassesDescription.md
+++ /dev/null
@@ -1,43 +0,0 @@
-# ProtectedClassesDescription
-
-Visualizes the distribution of protected classes in the dataset relative to the target variable
-and provides descriptive statistics.
-
-### Purpose
-
-The ProtectedClassesDescription test aims to identify potential biases or significant differences in the
-distribution of target outcomes across different protected classes. This visualization and statistical summary
-help in understanding the relationship between protected attributes and the target variable, which is crucial
-for assessing fairness in machine learning models.
-
-### Test Mechanism
-
-The function creates interactive stacked bar charts for each specified protected class using Plotly.
-Additionally, it generates a single table of descriptive statistics for all protected classes, including:
-- Protected class and category
-- Count and percentage of each category within the protected class
-- Mean, median, and mode of the target variable for each category
-- Standard deviation of the target variable for each category
-- Minimum and maximum values of the target variable for each category
-
-### Signs of High Risk
-
-- Significant imbalances in the distribution of target outcomes across different categories of a protected class.
-- Large disparities in mean, median, or mode of the target variable across categories.
-- Underrepresentation or overrepresentation of certain groups within protected classes.
-- High standard deviations in certain categories, indicating potential volatility or outliers.
-
-### Strengths
-
-- Provides both visual and statistical representation of potential biases in the dataset.
-- Allows for easy identification of imbalances in target variable distribution across protected classes.
-- Interactive plots enable detailed exploration of the data.
-- Consolidated statistical summary provides quantitative measures to complement visual analysis.
-- Applicable to both classification and regression tasks.
-
-### Limitations
-
-- Does not provide advanced statistical measures of bias or fairness.
-- May become cluttered if there are many categories within a protected class or many unique target values.
-- Interpretation may require domain expertise to understand the implications of observed disparities.
-- Does not account for intersectionality or complex interactions between multiple protected attributes.
\ No newline at end of file
diff --git a/site/tests/data_validation/ProtectedClassesDisparity.md b/site/tests/data_validation/ProtectedClassesDisparity.md
deleted file mode 100644
index c3b4bdf185..0000000000
--- a/site/tests/data_validation/ProtectedClassesDisparity.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# ProtectedClassesDisparity
-
-Investigates disparities in model performance across different protected class segments.
-
-### Purpose
-
-This test aims to identify and quantify potential biases in model outcomes by comparing various performance metrics
-across different segments of protected classes. It helps in assessing whether the model produces discriminatory
-outcomes for certain groups, which is crucial for ensuring fairness in machine learning models.
-
-### Test Mechanism
-
-The test performs the following steps:
-1. Calculates performance metrics (e.g., false negative rate, false positive rate, true positive rate) for each segment
-of the specified protected classes.
-2. Computes disparity ratios by comparing these metrics between different segments and a reference group.
-3. Generates visualizations showing the disparities and their relation to a user-defined disparity tolerance threshold.
-4. Produces a comprehensive table with various disparity metrics for detailed analysis.
-
-### Signs of High Risk
-
-- Disparity ratios exceeding the specified disparity tolerance threshold.
-- Consistent patterns of higher error rates or lower performance for specific protected class segments.
-- Statistically significant differences in performance metrics across segments.
-
-### Strengths
-
-- Provides a comprehensive view of model fairness across multiple protected attributes and metrics.
-- Allows for easy identification of problematic disparities through visual and tabular representations.
-- Customizable disparity tolerance threshold to align with specific use-case requirements.
-- Applicable to various performance metrics, offering a multi-faceted analysis of model fairness.
-
-### Limitations
-
-- Relies on a predefined reference group for each protected class, which may not always be the most appropriate choice.
-- Does not account for intersectionality between different protected attributes.
-- The interpretation of results may require domain expertise to understand the implications of observed disparities.
\ No newline at end of file
diff --git a/site/tests/data_validation/ProtectedClassesThresholdOptimizer.md b/site/tests/data_validation/ProtectedClassesThresholdOptimizer.md
deleted file mode 100644
index fed7dd0c91..0000000000
--- a/site/tests/data_validation/ProtectedClassesThresholdOptimizer.md
+++ /dev/null
@@ -1,36 +0,0 @@
-# ProtectedClassesThresholdOptimizer
-
-Obtains a classifier by applying group-specific thresholds to the provided estimator.
-
-### Purpose
-
-This test aims to optimize the fairness of a machine learning model by applying different
-classification thresholds for different protected groups. It helps in mitigating bias and
-achieving more equitable outcomes across different demographic groups.
-
-### Test Mechanism
-
-The test uses Fairlearn's ThresholdOptimizer to:
-1. Fit an optimizer on the training data, considering protected classes.
-2. Apply optimized thresholds to make predictions on the test data.
-3. Calculate and report various fairness metrics.
-4. Visualize the optimized thresholds.
-
-### Signs of High Risk
-
-- Large disparities in fairness metrics (e.g., Demographic Parity Ratio, Equalized Odds Ratio)
-across different protected groups.
-- Significant differences in False Positive Rates (FPR) or True Positive Rates (TPR) between groups.
-- Thresholds that vary widely across different protected groups.
-
-### Strengths
-
-- Provides a post-processing method to improve model fairness without modifying the original model.
-- Allows for balancing multiple fairness criteria simultaneously.
-- Offers visual insights into the threshold optimization process.
-
-### Limitations
-
-- May lead to a decrease in overall model performance while improving fairness.
-- Requires access to protected attribute information at prediction time.
-- The effectiveness can vary depending on the chosen fairness constraint and objective.
\ No newline at end of file
diff --git a/site/tests/data_validation/RollingStatsPlot.md b/site/tests/data_validation/RollingStatsPlot.md
deleted file mode 100644
index a4eb2ecca0..0000000000
--- a/site/tests/data_validation/RollingStatsPlot.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# RollingStatsPlot
-
-Evaluates the stationarity of time series data by plotting its rolling mean and standard deviation over a specified
-window.
-
-### Purpose
-
-The `RollingStatsPlot` metric is employed to gauge the stationarity of time series data in a given dataset. This
-metric specifically evaluates the rolling mean and rolling standard deviation of the dataset over a pre-specified
-window size. The rolling mean provides an understanding of the average trend in the data, while the rolling
-standard deviation gauges the volatility of the data within the window. It is critical in preparing time series
-data for modeling as it reveals key insights into data behavior across time.
-
-### Test Mechanism
-
-This mechanism is comprised of two steps. Initially, the rolling mean and standard deviation for each of the
-dataset's columns are calculated over a window size, which can be user-specified or by default set to 12 data
-points. Then, the calculated rolling mean and standard deviation are visualized via separate plots, illustrating
-the trends and volatility in the dataset. A straightforward check is conducted to ensure the existence of columns
-in the dataset, and to verify that the given dataset has been indexed by its date and time—a necessary prerequisite
-for time series analysis.
-
-### Signs of High Risk
-
-- The presence of non-stationary patterns in either the rolling mean or the rolling standard deviation plots, which
-could indicate trends or seasonality in the data that may affect the performance of time series models.
-- Missing columns in the dataset, which would prevent this metric from executing correctly.
-- The detection of NaN values in the dataset, which may need to be addressed before the metric can proceed
-successfully.
-
-### Strengths
-
-- Offers visualizations of trending behavior and volatility within the data, facilitating a broader understanding
-of the dataset's inherent characteristics.
-- Checks the dataset's integrity, such as the existence of all required columns and the availability of a
-datetime index.
-- Adjusts to accommodate various window sizes, thus allowing accurate analysis of data with differing temporal
-granularities.
-- Considers each column of the data individually, thereby accommodating multi-feature datasets.
-
-### Limitations
-
-- For all columns, a fixed-size window is utilized. This may not accurately capture patterns in datasets where
-different features may require different optimal window sizes.
-- Requires the dataset to be indexed by date and time, hence it may not be usable for datasets without a timestamp
-index.
-- Primarily serves for data visualization as it does not facilitate any quantitative measures for stationarity,
-such as through statistical tests. Therefore, the interpretation is subjective and depends heavily on modeler
-discretion.
\ No newline at end of file
diff --git a/site/tests/data_validation/RunsTest.md b/site/tests/data_validation/RunsTest.md
deleted file mode 100644
index 74ebcbfcb3..0000000000
--- a/site/tests/data_validation/RunsTest.md
+++ /dev/null
@@ -1,43 +0,0 @@
-# RunsTest
-
-Executes the Runs Test on an ML model to detect non-random patterns in the output data sequence.
-
-### Purpose
-
-The Runs Test is a statistical procedure used to determine whether the sequence of data extracted from the ML model
-behaves randomly or not. Specifically, it analyzes runs, sequences of consecutive positives or negatives, in the
-data to check if there are more or fewer runs than expected under the assumption of randomness. This can be an
-indication of some pattern, trend, or cycle in the model's output which may need attention.
-
-### Test Mechanism
-
-The testing mechanism applies the Runs Test from the statsmodels module on each column of the training dataset. For
-every feature in the dataset, a Runs Test is executed, whose output includes a Runs Statistic and P-value. A low
-P-value suggests that data arrangement in the feature is not likely to be random. The results are stored in a
-dictionary where the keys are the feature names, and the values are another dictionary storing the test statistic
-and the P-value for each feature.
-
-### Signs of High Risk
-
-- High risk is indicated when the P-value is close to zero.
-- If the P-value is less than a predefined significance level (like 0.05), it suggests that the runs (series of
-positive or negative values) in the model's output are not random and are longer or shorter than what is expected
-under a random scenario.
-- This would mean there's a high risk of non-random distribution of errors or model outcomes, suggesting potential
-issues with the model.
-
-### Strengths
-
-- Straightforward and fast for detecting non-random patterns in data sequence.
-- Validates assumptions of randomness, which is valuable for checking error distributions in regression models,
-trendless time series data, and ensuring a classifier doesn't favor one class over another.
-- Can be applied to both classification and regression tasks, making it versatile.
-
-### Limitations
-
-- Assumes that the data is independently and identically distributed (i.i.d.), which might not be the case for many
-real-world datasets.
-- The conclusion drawn from the low P-value indicating non-randomness does not provide information about the type
-or the source of the detected pattern.
-- Sensitive to extreme values (outliers), and overly large or small run sequences can influence the results.
-- Does not provide model performance evaluation; it is used to detect patterns in the sequence of outputs only.
\ No newline at end of file
diff --git a/site/tests/data_validation/ScatterPlot.md b/site/tests/data_validation/ScatterPlot.md
deleted file mode 100644
index 44ce8fdedc..0000000000
--- a/site/tests/data_validation/ScatterPlot.md
+++ /dev/null
@@ -1,44 +0,0 @@
-# ScatterPlot
-
-Assesses visual relationships, patterns, and outliers among features in a dataset through scatter plot matrices.
-
-### Purpose
-
-The ScatterPlot test aims to visually analyze a given dataset by constructing a scatter plot matrix of its
-numerical features. The primary goal is to uncover relationships, patterns, and outliers across different features
-to provide both quantitative and qualitative insights into multidimensional relationships within the dataset. This
-visual assessment aids in understanding the efficacy of the chosen features for model training and their
-suitability.
-
-### Test Mechanism
-
-Using the Seaborn library, the ScatterPlot function creates the scatter plot matrix. The process involves
-retrieving all numerical columns from the dataset and generating a scatter matrix for these columns. The resulting
-scatter plot provides visual representations of feature relationships. The function also adjusts axis labels for
-readability and returns the final plot as a Matplotlib Figure object for further analysis and visualization.
-
-### Signs of High Risk
-
-- The emergence of non-linear or random patterns across different feature pairs, suggesting complex relationships
-unsuitable for linear assumptions.
-- Lack of clear patterns or clusters, indicating weak or non-existent correlations among features, which could
-challenge certain model types.
-- Presence of outliers, as visual outliers can adversely influence the model's performance.
-
-### Strengths
-
-- Provides insight into the multidimensional relationships among multiple features.
-- Assists in identifying trends, correlations, and outliers that could affect model performance.
-- Validates assumptions made during model creation, such as linearity.
-- Versatile for application in both regression and classification tasks.
-- Using Seaborn facilitates an intuitive and detailed visual exploration of data.
-
-### Limitations
-
-- Scatter plot matrices may become cluttered and hard to decipher as the number of features increases.
-- Primarily reveals pairwise relationships and may fail to illuminate complex interactions involving three or more
-features.
-- Being a visual tool, precision in quantitative analysis might be compromised.
-- Outliers not clearly visible in plots can be missed, affecting model performance.
-- Assumes that the dataset can fit into the computer's memory, which might not be valid for extremely large
-datasets.
\ No newline at end of file
diff --git a/site/tests/data_validation/ScoreBandDefaultRates.md b/site/tests/data_validation/ScoreBandDefaultRates.md
deleted file mode 100644
index dbb5f68144..0000000000
--- a/site/tests/data_validation/ScoreBandDefaultRates.md
+++ /dev/null
@@ -1,50 +0,0 @@
-# ScoreBandDefaultRates
-
-Analyzes default rates and population distribution across credit score bands.
-
-### Purpose
-
-The Score Band Default Rates test evaluates the discriminatory power of credit scores by analyzing
-default rates across different score bands. This helps validate score effectiveness, supports
-policy decisions, and provides insights into portfolio risk distribution.
-
-### Test Mechanism
-
-The test segments the score distribution into bands and calculates key metrics for each band:
-1. Population count and percentage in each band
-2. Default rate within each band
-3. Cumulative statistics across bands
-The results show how well the scores separate good and bad accounts.
-
-### Signs of High Risk
-
-- Non-monotonic default rates across score bands
-- Insufficient population in critical score bands
-- Unexpected default rates for score ranges
-- High concentration in specific score bands
-- Similar default rates across adjacent bands
-- Unstable default rates in key decision bands
-- Extreme population skewness
-- Poor risk separation between bands
-
-### Strengths
-
-- Clear view of score effectiveness
-- Supports policy threshold decisions
-- Easy to interpret and communicate
-- Directly links to business decisions
-- Shows risk segmentation power
-- Identifies potential score issues
-- Helps validate scoring model
-- Supports portfolio monitoring
-
-### Limitations
-
-- Sensitive to band definition choices
-- May mask within-band variations
-- Requires sufficient data in each band
-- Cannot capture non-linear patterns
-- Point-in-time analysis only
-- No temporal trend information
-- Assumes band boundaries are appropriate
-- May oversimplify risk patterns
\ No newline at end of file
diff --git a/site/tests/data_validation/SeasonalDecompose.md b/site/tests/data_validation/SeasonalDecompose.md
deleted file mode 100644
index 00e4d92c6b..0000000000
--- a/site/tests/data_validation/SeasonalDecompose.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# SeasonalDecompose
-
-Assesses patterns and seasonality in a time series dataset by decomposing its features into foundational components.
-
-### Purpose
-
-The Seasonal Decompose test aims to decompose the features of a time series dataset into their fundamental
-components: observed, trend, seasonal, and residuals. By applying classical seasonal decomposition based on moving
-averages, the test identifies underlying patterns, predominantly seasonality, in the dataset's features.
-This aids in developing a more comprehensive understanding of the dataset, which in turn facilitates more effective
-model validation.
-
-### Test Mechanism
-
-The testing process leverages the `seasonal_decompose` function from the `statsmodels.tsa.seasonal` library to
-evaluate each feature in the dataset. It isolates each feature into four components—observed, trend, seasonal, and
-residuals—and generates six subplot graphs per feature for visual interpretation. Prior to decomposition, the test
-scrutinizes and removes any non-finite values, ensuring the reliability of the analysis.
-
-### Signs of High Risk
-
-- **Non-Finiteness**: Datasets with a high number of non-finite values may be flagged as high risk since these
-values are omitted before conducting the seasonal decomposition.
-- **Frequent Warnings**: Chronic failure to infer the frequency for a scrutinized feature indicates high risk.
-- **High Seasonality**: A significant seasonal component could potentially render forecasts unreliable due to
-overwhelming seasonal variation.
-
-### Strengths
-
-- **Seasonality Detection**: Accurately discerns hidden seasonality patterns in dataset features.
-- **Visualization**: Facilitates interpretation and comprehension through graphical representations.
-- **Unrestricted Usage**: Not confined to any specific regression model, promoting wide-ranging applicability.
-
-### Limitations
-
-- **Dependence on Assumptions**: Assumes that dataset features are periodically distributed. Features with no
-inferable frequency are excluded from the test.
-- **Handling Non-Finite Values**: Disregards non-finite values during analysis, potentially resulting in an
-incomplete understanding of the dataset.
-- **Unreliability with Noisy Datasets**: Produces unreliable results when used with datasets that contain heavy
-noise.
\ No newline at end of file
diff --git a/site/tests/data_validation/ShapiroWilk.md b/site/tests/data_validation/ShapiroWilk.md
deleted file mode 100644
index 33dc50092b..0000000000
--- a/site/tests/data_validation/ShapiroWilk.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# ShapiroWilk
-
-Evaluates feature-wise normality of training data using the Shapiro-Wilk test.
-
-### Purpose
-
-The Shapiro-Wilk test is utilized to investigate whether a particular dataset conforms to a normal
-distribution. This analysis is crucial in machine learning modeling because the normality of the data can
-profoundly impact the performance of the model. This metric is especially useful in evaluating various features of
-the dataset in both classification and regression tasks.
-
-### Test Mechanism
-
-The Shapiro-Wilk test is conducted on each feature column of the training dataset to determine whether its values
-follow a normal distribution. The test produces a statistic and a p-value, with the p-value
-used to decide whether to reject the null hypothesis, which is that the tested data is normally distributed.
-
-### Signs of High Risk
-
-- A p-value that falls below 0.05 signifies a high risk as it leads to rejecting the null hypothesis, indicating
-that the data does not adhere to the normal distribution.
-- For machine learning models built on the presumption of data normality, such an outcome could result in subpar
-performance or incorrect predictions.
-
-### Strengths
-
-- The Shapiro-Wilk test is esteemed for its level of accuracy, thereby making it particularly well-suited to
-datasets of small to moderate sizes.
-- It proves its versatility through its efficient functioning in both classification and regression tasks.
-- By separately testing each feature column, the Shapiro-Wilk test can raise an alarm if a specific feature does
-not conform to normality.
-
-### Limitations
-
-- The Shapiro-Wilk test's sensitivity can be a disadvantage as it often rejects the null hypothesis (i.e., data is
-normally distributed), even for minor deviations, especially in large datasets. This may lead to unwarranted 'false
-alarms' of high risk by deeming the data as not normally distributed even if it approximates normal distribution.
-- Exceptional care must be taken in managing missing data or outliers prior to testing as these can greatly skew
-the results.
-- Lastly, the Shapiro-Wilk test is not optimally suited for processing data with pronounced skewness or kurtosis.
\ No newline at end of file
diff --git a/site/tests/data_validation/Skewness.md b/site/tests/data_validation/Skewness.md
deleted file mode 100644
index 4a2e592893..0000000000
--- a/site/tests/data_validation/Skewness.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# Skewness
-
-Evaluates the skewness of numerical data in a dataset to check against a defined threshold, aiming to ensure data
-quality and optimize model performance.
-
-### Purpose
-
-The purpose of the Skewness test is to measure the asymmetry in the distribution of data within a predictive
-machine learning model. Specifically, it evaluates the divergence of said distribution from a normal distribution.
-Understanding the level of skewness helps identify data quality issues, which are crucial for optimizing the
-performance of traditional machine learning models in both classification and regression settings.
-
-### Test Mechanism
-
-This test calculates the skewness of numerical columns in the dataset, focusing specifically on numerical data
-types. The calculated skewness value is then compared against a predetermined maximum threshold, which is set by
-default to 1. If the skewness value is less than this maximum threshold, the test passes; otherwise, it fails. The
-test results, along with the skewness values and column names, are then recorded for further analysis.
-
-### Signs of High Risk
-
-- Substantial skewness levels that significantly exceed the maximum threshold.
-- Persistent skewness in the data, indicating potential issues with the foundational assumptions of the machine
-learning model.
-- Subpar model performance, erroneous predictions, or biased inferences due to skewed data distributions.
-
-### Strengths
-
-- Fast and efficient identification of unequal data distributions within a machine learning model.
-- Adjustable maximum threshold parameter, allowing for customization based on user needs.
-- Provides a clear quantitative measure to mitigate model risks related to data skewness.
-
-### Limitations
-
-- Only evaluates numeric columns, potentially missing skewness or bias in non-numeric data.
-- Assumes that data should follow a normal distribution, which may not always be applicable to real-world data.
-- Subjective threshold for risk grading, requiring expert input and recurrent iterations for refinement.
\ No newline at end of file
diff --git a/site/tests/data_validation/SpreadPlot.md b/site/tests/data_validation/SpreadPlot.md
deleted file mode 100644
index 8e35c2a090..0000000000
--- a/site/tests/data_validation/SpreadPlot.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# SpreadPlot
-
-Assesses potential correlations between pairs of time series variables through visualization to enhance
-understanding of their relationships.
-
-### Purpose
-
-The SpreadPlot test aims to graphically illustrate and analyze the relationships between pairs of time series
-variables within a given dataset. This visualization helps in identifying and assessing potential time
-series correlations, such as cointegration, between the variables.
-
-### Test Mechanism
-
-The SpreadPlot test computes and represents the spread between each pair of time series variables in the dataset.
-Specifically, the difference between two variables is calculated and presented as a line graph. This process is
-iterated for each unique pair of variables in the dataset, allowing for comprehensive visualization of their
-relationships.
-
-### Signs of High Risk
-
-- Large fluctuations in the spread over a given timespan.
-- Unexpected patterns or trends that may signal potential risks in the underlying correlations between the
-variables.
-- Presence of significant missing data or extreme outlier values, which could potentially skew the spread and
-indicate high risk.
-
-### Strengths
-
-- Allows for thorough visual examination and interpretation of the correlations between time-series pairs.
-- Aids in revealing complex relationships like cointegration.
-- Enhances interpretability by visualizing the relationships, thereby helping in spotting outliers and trends.
-- Capable of handling numerous variable pairs from the dataset through a versatile and adaptable process.
-
-### Limitations
-
-- Primarily serves as a visualization tool and does not offer quantitative measurements or statistics to
-objectively determine relationships.
-- Heavily relies on the quality and granularity of the data—missing data or outliers can notably disturb the
-interpretation of relationships.
-- Can become inefficient or difficult to interpret with a high number of variables due to the profuse number of
-plots.
-- Might not completely capture intricate non-linear relationships between the variables.
\ No newline at end of file
diff --git a/site/tests/data_validation/TabularCategoricalBarPlots.md b/site/tests/data_validation/TabularCategoricalBarPlots.md
deleted file mode 100644
index 480f5c13df..0000000000
--- a/site/tests/data_validation/TabularCategoricalBarPlots.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# TabularCategoricalBarPlots
-
-Generates and visualizes bar plots for each category in categorical features to evaluate the dataset's composition.
-
-### Purpose
-
-The purpose of this metric is to visually analyze categorical data using bar plots. It is intended to evaluate the
-dataset's composition by displaying the counts of each category in each categorical feature.
-
-### Test Mechanism
-
-The provided dataset is first checked to determine if it contains any categorical variables. If no categorical
-columns are found, the tool raises a ValueError. For each categorical variable in the dataset, a separate bar plot
-is generated. The number of occurrences for each category is calculated and displayed on the plot. If a dataset
-contains multiple categorical columns, multiple bar plots are produced.
-
-### Signs of High Risk
-
-- High risk could occur if the categorical variables exhibit an extreme imbalance, with categories having very few
-instances possibly being underrepresented in the model, which could affect the model's performance and its ability
-to generalize.
-- Another sign of risk is if there are too many categories in a single variable, which could lead to overfitting
-and make the model complex.
-
-### Strengths
-
-- Provides a visual and intuitively understandable representation of categorical data.
-- Aids in the analysis of variable distributions.
-- Helps in easily identifying imbalances or rare categories that could affect the model's performance.
-
-### Limitations
-
-- This method only works with categorical data and won't apply to numerical variables.
-- It does not provide informative value when there are too many categories, as the bar chart could become cluttered
-and hard to interpret.
-- Offers no insights into the model's performance or precision, but rather provides a descriptive analysis of the
-input.
\ No newline at end of file
diff --git a/site/tests/data_validation/TabularDateTimeHistograms.md b/site/tests/data_validation/TabularDateTimeHistograms.md
deleted file mode 100644
index 23966ed0d5..0000000000
--- a/site/tests/data_validation/TabularDateTimeHistograms.md
+++ /dev/null
@@ -1,43 +0,0 @@
-# TabularDateTimeHistograms
-
-Generates histograms to provide graphical insight into the distribution of time intervals in a model's datetime
-data.
-
-### Purpose
-
-The `TabularDateTimeHistograms` metric is designed to provide graphical insight into the distribution of time
-intervals in a machine learning model's datetime data. By plotting histograms of differences between consecutive
-date entries in all datetime variables, it enables an examination of the underlying pattern of time series data and
-identification of anomalies.
-
-### Test Mechanism
-
-This test operates by first identifying all datetime columns and extracting them from the dataset. For each
-datetime column, it next computes the differences (in days) between consecutive dates, excluding zero values, and
-visualizes these differences in a histogram. The Plotly library's histogram function is used to generate
-histograms, which are labeled appropriately and provide a graphical representation of the frequency of different
-day intervals in the dataset.
-
-### Signs of High Risk
-
-- If no datetime columns are detected in the dataset, this would lead to a ValueError. Hence, the absence of
-datetime columns signifies a high risk.
-- A severely skewed or irregular distribution depicted in the histogram may indicate possible complications with
-the data, such as faulty timestamps or abnormalities.
-
-### Strengths
-
-- The metric offers a visual overview of time interval frequencies within the dataset, supporting the recognition
-of inherent patterns.
-- Histogram plots can aid in the detection of potential outliers and data anomalies, contributing to an assessment
-of data quality.
-- The metric is versatile, compatible with a range of task types, including classification and regression, and can
-work with multiple datetime variables if present.
-
-### Limitations
-
-- A major weakness of this metric is its dependence on the visual examination of data, as it does not provide a
-measurable evaluation of the model.
-- The metric might overlook complex or multi-dimensional trends in the data.
-- The test is only applicable to datasets containing datetime columns and will fail if such columns are unavailable.
-- The interpretation of the histograms relies heavily on the domain expertise and experience of the reviewer.
\ No newline at end of file
diff --git a/site/tests/data_validation/TabularDescriptionTables.md b/site/tests/data_validation/TabularDescriptionTables.md
deleted file mode 100644
index 37234bfa0d..0000000000
--- a/site/tests/data_validation/TabularDescriptionTables.md
+++ /dev/null
@@ -1,48 +0,0 @@
-# TabularDescriptionTables
-
-Summarizes key descriptive statistics for numerical, categorical, and datetime variables in a dataset.
-
-### Purpose
-
-The main purpose of this metric is to gather and present the descriptive statistics of numerical, categorical, and
-datetime variables present in a dataset. The attributes it measures include the count, mean, minimum and maximum
-values, percentage of missing values, data types of fields, and unique values for categorical fields, among others.
-
-### Test Mechanism
-
-The test first segregates the variables in the dataset according to their data types (numerical, categorical, or
-datetime). Then, it compiles summary statistics for each type of variable. The specifics of these statistics vary
-depending on the type of variable:
-
-- For numerical variables, the metric extracts descriptors like count, mean, minimum and maximum values, count of
-missing values, and data types.
-- For categorical variables, it counts the number of unique values, displays unique values, counts missing values,
-and identifies data types.
-- For datetime variables, it counts the number of unique values, identifies the earliest and latest dates, counts
-missing values, and identifies data types.
-
-### Signs of High Risk
-
-- Large numbers of missing values in the descriptive statistics results could hint at high risk or failure, indicating
-potential data collection, integrity, and quality issues.
-- Detection of inappropriate distributions for numerical variables, like having negative values for variables that
-are always supposed to be positive.
-- Identifying inappropriate data types, like a continuous variable being encoded as a categorical type.
-
-### Strengths
-
-- Provides a comprehensive overview of the dataset.
-- Gives a snapshot into the essence of the numerical, categorical, and datetime fields.
-- Identifies potential data quality issues such as missing values or inconsistencies crucial for building credible
-machine learning models.
-- The metadata, including the data type and missing value information, is vital for anyone, including data
-scientists, working with the dataset before the modeling process.
-
-### Limitations
-
-- It does not perform any deeper statistical analysis or tests on the data.
-- It does not handle issues such as outliers, or relationships between variables.
-- It offers no insights into potential correlations or possible interactions between variables.
-- It does not investigate the potential impact of missing values on the performance of the machine learning models.
-- It does not explore potential transformation requirements that may be necessary to enhance the performance of the
-chosen algorithm.
\ No newline at end of file
diff --git a/site/tests/data_validation/TabularNumericalHistograms.md b/site/tests/data_validation/TabularNumericalHistograms.md
deleted file mode 100644
index 8ffd27735f..0000000000
--- a/site/tests/data_validation/TabularNumericalHistograms.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# TabularNumericalHistograms
-
-Generates histograms for each numerical feature in a dataset to provide visual insights into data distribution and
-detect potential issues.
-
-### Purpose
-
-The purpose of this test is to provide visual analysis of numerical data through the generation of histograms for
-each numerical feature in the dataset. Histograms aid in the exploratory analysis of data, offering insight into
-the distribution of the data, skewness, presence of outliers, and central tendencies. It helps in understanding if
-the inputs to the model are normally distributed, which is a common assumption in many machine learning algorithms.
-
-### Test Mechanism
-
-This test scans the provided dataset and extracts all the numerical columns. For each numerical column, it
-constructs a histogram using plotly, with 50 bins. The histograms offer a robust visual aid,
-making it easy to identify and understand numerical data distribution patterns.
-
-### Signs of High Risk
-
-- A high degree of skewness
-- Unexpected data distributions
-- Existence of extreme outliers in the histograms
-
-These may indicate issues with the data that the model is receiving. If data for a numerical feature is expected to
-follow a certain distribution (like a normal distribution) but does not, it could lead to sub-par performance by
-the model. As such these instances should be treated as high-risk indicators.
-
-### Strengths
-
-- Provides a simple, easy-to-interpret visualization of how data for each numerical attribute is distributed.
-- Helps detect skewed values and outliers that could potentially harm the AI model's performance.
-- Can be applied to large datasets and multiple numerical variables conveniently.
-
-### Limitations
-
-- Only works with numerical data, thus ignoring non-numerical or categorical data.
-- Does not analyze relationships between different features, only the individual feature distributions.
-- Is a univariate analysis and may miss patterns or anomalies that only appear when considering multiple variables
-together.
-- Does not provide any insight into how these features affect the output of the model; it is purely an input
-analysis tool.
\ No newline at end of file
diff --git a/site/tests/data_validation/TargetRateBarPlots.md b/site/tests/data_validation/TargetRateBarPlots.md
deleted file mode 100644
index 649cda5254..0000000000
--- a/site/tests/data_validation/TargetRateBarPlots.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# TargetRateBarPlots
-
-Generates bar plots visualizing the default rates of categorical features for a classification machine learning
-model.
-
-### Purpose
-
-This test, implemented as a metric, is designed to provide an intuitive, graphical summary of the decision-making
-patterns exhibited by a categorical classification machine learning model. The model's performance is evaluated
-using bar plots depicting the ratio of target rates—meaning the proportion of positive classes—for different
-categorical inputs. This allows for an easy, at-a-glance understanding of the model's accuracy.
-
-### Test Mechanism
-
-The test involves creating a pair of bar plots for each categorical feature in the dataset. The first plot depicts
-the frequency of each category in the dataset, with each category visually distinguished by its unique color. The
-second plot shows the mean target rate of each category (sourced from the "default_column"). Plotly, a Python
-library, is used to generate these plots, with distinct plots created for each feature. If no specific columns are
-selected, the test will generate plots for each categorical column in the dataset.
-
-### Signs of High Risk
-
-- Inconsistent or non-binary values in the "default_column" could complicate or render impossible the calculation
-of average target rates.
-- Particularly low or high target rates for a specific category might suggest that the model is misclassifying
-instances of that category.
-
-### Strengths
-
-- This test offers a visually interpretable breakdown of the model's decisions, providing an easy way to spot
-irregularities, inconsistencies, or patterns.
-- Its flexibility allows for the inspection of one or multiple columns, as needed.
-
-### Limitations
-
-- The readability of the bar plots drops as the number of distinct categories increases in the dataset, which can
-make them harder to understand and less useful.
\ No newline at end of file
diff --git a/site/tests/data_validation/TimeSeriesDescription.md b/site/tests/data_validation/TimeSeriesDescription.md
deleted file mode 100644
index 7a5e826e8e..0000000000
--- a/site/tests/data_validation/TimeSeriesDescription.md
+++ /dev/null
@@ -1,34 +0,0 @@
-# TimeSeriesDescription
-
-Generates a detailed analysis for the provided time series dataset, summarizing key statistics to identify trends,
-patterns, and data quality issues.
-
-### Purpose
-
-The TimeSeriesDescription function aims to analyze an individual time series by providing a summary of key
-statistics. This helps in understanding trends, patterns, and data quality issues within the time series.
-
-### Test Mechanism
-
-The function extracts the time series data and provides a summary of key statistics. The dataset is expected to
-have a datetime index. The function checks this and raises an error if the index is not in datetime format. For
-each variable (column) in the dataset, appropriate statistics including start date, end date, frequency, number of
-missing values, count, min, and max values are calculated.
-
-### Signs of High Risk
-
-- If the index of the dataset is not in datetime format, it could lead to errors in time-series analysis.
-- Inconsistent or missing data within the dataset might affect the analysis of trends and patterns.
-
-### Strengths
-
-- Provides a comprehensive summary of key statistics for each variable, helping to identify data quality issues
-such as missing values.
-- Helps in understanding the distribution and range of the data by including min and max values.
-
-### Limitations
-
-- Assumes that the dataset is provided as a DataFrameDataset object with a .df attribute to access the pandas
-DataFrame.
-- Only analyzes datasets with a datetime index and will raise an error for other types of indices.
-- Does not handle large datasets efficiently; performance may degrade with very large datasets.
\ No newline at end of file
diff --git a/site/tests/data_validation/TimeSeriesDescriptiveStatistics.md b/site/tests/data_validation/TimeSeriesDescriptiveStatistics.md
deleted file mode 100644
index 73fa7ce2b7..0000000000
--- a/site/tests/data_validation/TimeSeriesDescriptiveStatistics.md
+++ /dev/null
@@ -1,32 +0,0 @@
-# TimeSeriesDescriptiveStatistics
-
-Evaluates the descriptive statistics of a time series dataset to identify trends, patterns, and data quality issues.
-
-### Purpose
-
-The purpose of the TimeSeriesDescriptiveStatistics function is to analyze an individual time series by providing a
-summary of key descriptive statistics. This analysis helps in understanding trends, patterns, and data quality
-issues within the time series dataset.
-
-### Test Mechanism
-
-The function extracts the time series data and provides a summary of key descriptive statistics. The dataset is
-expected to have a datetime index, and the function will check this and raise an error if the index is not in a
-datetime format. For each variable (column) in the dataset, appropriate statistics, including start date, end date,
-min, mean, max, skewness, kurtosis, and count, are calculated.
-
-### Signs of High Risk
-
-- If the index of the dataset is not in datetime format, it could lead to errors in time-series analysis.
-- Inconsistent or missing data within the dataset might affect the analysis of trends and patterns.
-
-### Strengths
-
-- Provides a comprehensive summary of key descriptive statistics for each variable.
-- Helps identify data quality issues and understand the distribution of the data.
-
-### Limitations
-
-- Assumes the dataset is provided as a DataFrameDataset object with a .df attribute to access the pandas DataFrame.
-- Only analyzes datasets with a datetime index and will raise an error for other types of indices.
-- Does not handle large datasets efficiently, and performance may degrade with very large datasets.
\ No newline at end of file
diff --git a/site/tests/data_validation/TimeSeriesFrequency.md b/site/tests/data_validation/TimeSeriesFrequency.md
deleted file mode 100644
index e51e6c6c58..0000000000
--- a/site/tests/data_validation/TimeSeriesFrequency.md
+++ /dev/null
@@ -1,44 +0,0 @@
-# TimeSeriesFrequency
-
-Evaluates consistency of time series data frequency and generates a frequency plot.
-
-### Purpose
-
-The purpose of the TimeSeriesFrequency test is to evaluate the consistency in the frequency of data points in a
-time-series dataset. This test inspects the intervals or duration between each data point to determine if a fixed
-pattern (such as daily, weekly, or monthly) exists. The identification of such patterns is crucial to time-series
-analysis as any irregularities could lead to erroneous results and hinder the model's capacity for identifying
-trends and patterns.
-
-### Test Mechanism
-
-Initially, the test checks if the dataframe index is in datetime format. Subsequently, it utilizes the pandas
-`infer_freq` method to identify the frequency of each data series within the dataframe. The `infer_freq` method
-attempts to establish the frequency of a time series and returns both the frequency string and a dictionary
-relating these strings to their respective labels. The test compares the frequencies of all datasets. If they share
-a common frequency, the test passes, but it fails if they do not. Additionally, Plotly is used to create a
-frequency plot, offering a visual depiction of the time differences between consecutive entries in the dataframe
-index.
-
-### Signs of High Risk
-
-- The test fails, indicating multiple unique frequencies within the dataset. This failure could suggest irregular
-intervals between observations, potentially interrupting pattern recognition or trend analysis.
-- The presence of missing or null frequencies could be an indication of inconsistencies in data or gaps within the
-data collection process.
-
-### Strengths
-
-- This test uses a systematic approach to checking the consistency of data frequency within a time-series dataset.
-- It increases the model's reliability by asserting the consistency of observations over time, an essential factor
-in time-series analysis.
-- The test generates a visual plot, providing an intuitive representation of the dataset's frequency distribution,
-which caters to visual learners and aids in interpretation and explanation.
-
-### Limitations
-
-- This test is only applicable to time-series datasets and hence not suitable for other types of datasets.
-- The `infer_freq` method might not always correctly infer frequency when faced with missing or irregular data
-points.
-- Depending on context or the model under development, mixed frequencies might sometimes be acceptable, but this
-test considers them a failing condition.
\ No newline at end of file
diff --git a/site/tests/data_validation/TimeSeriesHistogram.md b/site/tests/data_validation/TimeSeriesHistogram.md
deleted file mode 100644
index 0ee45e1ebd..0000000000
--- a/site/tests/data_validation/TimeSeriesHistogram.md
+++ /dev/null
@@ -1,38 +0,0 @@
-# TimeSeriesHistogram
-
-Visualizes distribution of time-series data using histograms and Kernel Density Estimation (KDE) lines.
-
-### Purpose
-
-The TimeSeriesHistogram test aims to perform a histogram analysis on time-series data to assess the distribution of
-values within a dataset over time. This test is useful for regression tasks and can be applied to various types of
-data, such as internet traffic, stock prices, and weather data, providing insights into the probability
-distribution, skewness, and kurtosis of the dataset.
-
-### Test Mechanism
-
-This test operates on a specific column within the dataset that must have a datetime type index. For each column in
-the dataset, a histogram is created using Plotly's histplot function. If the dataset includes more than one
-time-series, a distinct histogram is plotted for each series. Additionally, a Kernel Density Estimate (KDE) line is
-drawn for each histogram, visualizing the data's underlying probability distribution. The x and y-axis labels are
-hidden to focus solely on the data distribution.
-
-### Signs of High Risk
-
-- The dataset lacks a column with a datetime type index.
-- The specified columns do not exist within the dataset.
-- High skewness or kurtosis in the data distribution, indicating potential bias.
-- Presence of significant outliers in the data distribution.
-
-### Strengths
-
-- Serves as a visual diagnostic tool for understanding data behavior and distribution trends.
-- Effective for analyzing both single and multiple time-series data.
-- KDE line provides a smooth estimate of the overall trend in data distribution.
-
-### Limitations
-
-- Provides a high-level view without specific numeric measures such as skewness or kurtosis.
-- The histogram loses some detail due to binning of data values.
-- Cannot handle non-numeric data columns.
-- Histogram shape may be sensitive to the number of bins used.
\ No newline at end of file
diff --git a/site/tests/data_validation/TimeSeriesLinePlot.md b/site/tests/data_validation/TimeSeriesLinePlot.md
deleted file mode 100644
index 5d1007d8ed..0000000000
--- a/site/tests/data_validation/TimeSeriesLinePlot.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# TimeSeriesLinePlot
-
-Generates and analyzes time-series data through line plots, revealing trends, patterns, and anomalies over time.
-
-### Purpose
-
-The TimeSeriesLinePlot metric is designed to generate and analyze time series data through the creation of line
-plots. This assists in the initial inspection of the data by providing a visual representation of patterns, trends,
-seasonality, irregularity, and anomalies that may be present in the dataset over a period of time.
-
-### Test Mechanism
-
-The mechanism for this Python class involves extracting the column names from the provided dataset and subsequently
-generating line plots for each column using the Plotly Python library. For every column in the dataset, a
-time-series line plot is created where the values are plotted against the dataset's datetime index. It is important
-to note that indexes that are not of datetime type will result in a ValueError.
-
-### Signs of High Risk
-
-- Presence of time-series data that does not have datetime indices.
-- Provided columns do not exist in the provided dataset.
-- The detection of anomalous patterns or irregularities in the time-series plots, indicating potential high model
-instability or probable predictive error.
-
-### Strengths
-
-- The visual representation of complex time series data, which simplifies understanding and helps in recognizing
-temporal trends, patterns, and anomalies.
-- The adaptability of the metric, which allows it to effectively work with multiple time series within the same
-dataset.
-- Enables the identification of anomalies and irregular patterns through visual inspection, assisting in spotting
-potential data or model performance problems.
-
-### Limitations
-
-- The effectiveness of the metric is heavily reliant on the quality and patterns of the provided time series data.
-- Exclusively a visual tool, it lacks the capability to provide quantitative measurements, making it less effective
-for comparing and ranking multiple models or when specific numerical diagnostics are needed.
-- The metric necessitates that the time-specific data has been transformed into a datetime index, with the data
-formatted correctly.
-- The metric has an inherent limitation in that it cannot extract deeper statistical insights from the time series
-data, which can limit its efficacy with complex data structures and phenomena.
\ No newline at end of file
diff --git a/site/tests/data_validation/TimeSeriesMissingValues.md b/site/tests/data_validation/TimeSeriesMissingValues.md
deleted file mode 100644
index f61c82db2d..0000000000
--- a/site/tests/data_validation/TimeSeriesMissingValues.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# TimeSeriesMissingValues
-
-Validates time-series data quality by confirming the count of missing values is below a certain threshold.
-
-### Purpose
-
-This test is designed to validate the quality of a historical time-series dataset by verifying that the number of
-missing values is below a specified threshold. As time-series models greatly depend on the continuity and
-temporality of data points, missing values could compromise the model's performance. Consequently, this test aims
-to ensure data quality and readiness for the machine learning model, safeguarding its predictive capacity.
-
-### Test Mechanism
-
-The test method commences by validating if the dataset has a datetime index; if not, an error is raised. It
-establishes a lower limit threshold for missing values and performs a missing values check on each column of the
-dataset. An object for the test result is created stating whether the number of missing values is within the
-specified threshold. Additionally, the test calculates the percentage of missing values alongside the raw count.
-
-### Signs of High Risk
-
-- The number of missing values in any column of the dataset surpasses the threshold, marking a failure and a
-high-risk scenario. The reasons could range from incomplete data collection and faulty sensors to data
-preprocessing errors.
-
-### Strengths
-
-- Effectively identifies missing values which could adversely affect the model’s performance.
-- Applicable and customizable through the threshold parameter across different data sets.
-- Goes beyond raw numbers by calculating the percentage of missing values, offering a more relative understanding
-of data scarcity.
-
-### Limitations
-
-- Although it identifies missing values, the test does not provide solutions to handle them.
-- The test demands that the dataset should have a datetime index, hence limiting its use only to time series
-analysis.
-- The test's sensitivity to the 'min_threshold' parameter may raise false alarms if set too strictly or may
-overlook problematic data if set too loosely.
-- Solely focuses on the 'missingness' of the data and might fall short in addressing other aspects of data quality.
\ No newline at end of file
diff --git a/site/tests/data_validation/TimeSeriesOutliers.md b/site/tests/data_validation/TimeSeriesOutliers.md
deleted file mode 100644
index 4a36c9da4f..0000000000
--- a/site/tests/data_validation/TimeSeriesOutliers.md
+++ /dev/null
@@ -1,43 +0,0 @@
-# TimeSeriesOutliers
-
-Identifies and visualizes outliers in time-series data using the z-score method.
-
-### Purpose
-
-This test is designed to identify outliers in time-series data using the z-score method. It's vital for ensuring
-data quality before modeling, as outliers can skew predictive models and significantly impact their overall
-performance.
-
-### Test Mechanism
-
-The test processes a given dataset which must have datetime indexing, checks if a 'zscore_threshold' parameter has
-been supplied, and identifies columns with numeric data types. After finding numeric columns, the test then
-applies the z-score method to each numeric column, identifying outliers based on the threshold provided. Each
-outlier is listed together with its variable name, z-score, timestamp, and relative threshold in a dictionary and
-converted to a DataFrame for convenient output. Additionally, it produces visual plots for each time series
-illustrating outliers in the context of the broader dataset. The 'zscore_threshold' parameter sets the limit beyond
-which a data point will be labeled as an outlier. The default threshold is set at 3, indicating that any data point
-that falls more than 3 standard deviations away from the mean will be marked as an outlier.
-
-### Signs of High Risk
-
-- Many or substantial outliers are present within the dataset, indicating significant anomalies.
-- Data points with z-scores higher than the set threshold.
-- Potential impact on the performance of machine learning models if outliers are not properly addressed.
-
-### Strengths
-
-- The z-score method is a popular and robust method for identifying outliers in a dataset.
-- Simplifies time series maintenance by requiring a datetime index.
-- Identifies outliers for each numeric feature individually.
-- Provides an elaborate report showing variables, dates, z-scores, and pass/fail tests.
-- Offers visual inspection for detected outliers through plots.
-
-### Limitations
-
-- The test only identifies outliers in numeric columns, not in categorical variables.
-- The utility and accuracy of z-scores can be limited if the data doesn't follow a normal distribution.
-- The method relies on a subjective z-score threshold for deciding what constitutes an outlier, which might not
-always be suitable depending on the dataset and use case.
-- It does not address possible ways to handle identified outliers in the data.
-- The requirement for a datetime index could limit its application.
\ No newline at end of file
diff --git a/site/tests/data_validation/TooManyZeroValues.md b/site/tests/data_validation/TooManyZeroValues.md
deleted file mode 100644
index c5d45043c2..0000000000
--- a/site/tests/data_validation/TooManyZeroValues.md
+++ /dev/null
@@ -1,51 +0,0 @@
-# TooManyZeroValues
-
-Identifies numerical columns in a dataset that contain an excessive number of zero values, defined by a threshold
-percentage.
-
-### Purpose
-
-The 'TooManyZeroValues' test is utilized to identify numerical columns in the dataset that may present a quantity
-of zero values considered excessive. The aim is to detect situations where these may indicate data sparsity or a
-lack of variation, limiting their effectiveness within a machine learning model. The definition of 'too many' is
-quantified as a percentage of total values, with a default set to 0.03%.
-
-### Test Mechanism
-
-This test is conducted by looping through each column in the dataset and categorizing those that pertain to
-numerical data. On identifying a numerical column, the function computes the total quantity of zero values and
-their ratio to the total row count. Should the proportion exceed a pre-set threshold parameter, set by default at
-0.03%, the column is considered to have failed the test. The results for each column are summarized and
-reported, indicating the count and percentage of zero values for each numerical column, alongside a status
-indicating whether the column has passed or failed the test.
-
-### Signs of High Risk
-
-- Numerical columns showing a high ratio of zero values when compared to the total count of rows (exceeding the
-predetermined threshold).
-- Columns characterized by zero values across the board suggest a complete lack of data variation, signifying high
-risk.
-
-### Strengths
-
-- Assists in highlighting columns featuring an excess of zero values that could otherwise go unnoticed within a
-large dataset.
-- Provides the flexibility to alter the threshold that determines when the quantity of zero values becomes 'too
-many', thus catering to specific needs of a particular analysis or model.
-- Offers feedback in the form of both counts and percentages of zero values, which allows a closer inspection of
-the distribution and proportion of zeros within a column.
-- Targets specifically numerical data, thereby avoiding inappropriate application to non-numerical columns and
-mitigating the risk of false test failures.
-
-### Limitations
-
-- Is exclusively designed to check for zero values and doesn’t assess the potential impact of other values that
-could affect the dataset, such as extremely high or low figures, missing values, or outliers.
-- Lacks the ability to detect a repetitive pattern of zeros, which could be significant in time-series or
-longitudinal data.
-- Zero values can actually be meaningful in some contexts; therefore, tagging them as 'too many' could potentially
-misinterpret the data to some extent.
-- This test does not take into consideration the context of the dataset, and fails to recognize that within certain
-columns, a high number of zero values could be quite normal and not necessarily an indicator of poor data quality.
-- Cannot evaluate non-numerical or categorical columns, which might bring with them different types of concerns or
-issues.
\ No newline at end of file
diff --git a/site/tests/data_validation/UniqueRows.md b/site/tests/data_validation/UniqueRows.md
deleted file mode 100644
index 97b91643ee..0000000000
--- a/site/tests/data_validation/UniqueRows.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# UniqueRows
-
-Verifies the diversity of the dataset by ensuring that the count of unique rows exceeds a prescribed threshold.
-
-### Purpose
-
-The UniqueRows test is designed to gauge the quality of the data supplied to the machine learning model by
-verifying that the count of distinct rows in the dataset exceeds a specific threshold, thereby ensuring a varied
-collection of data. Diversity in data is essential for training an unbiased and robust model that excels when faced
-with novel data.
-
-### Test Mechanism
-
-The testing process starts with calculating the total number of rows in the dataset. Subsequently, the count of
-unique rows is determined for each column in the dataset. If the percentage of unique rows (calculated as the ratio
-of unique rows to the overall row count) is less than the prescribed minimum percentage threshold given as a
-function parameter, the test fails. The results are cached and a final pass or fail verdict is given based on
-whether all columns have successfully passed the test.
-
-### Signs of High Risk
-
-- A lack of diversity in data columns, demonstrated by a count of unique rows that falls short of the preset
-minimum percentage threshold, is indicative of high risk.
-- This lack of variety in the data signals potential issues with data quality, possibly leading to overfitting in
-the model and issues with generalization, thus posing a significant risk.
-
-### Strengths
-
-- The UniqueRows test is efficient in evaluating the data's diversity across each column in the dataset.
-- This test provides a quick, systematic method to assess data quality based on uniqueness, which can be pivotal in
-developing effective and unbiased machine learning models.
-
-### Limitations
-
-- A limitation of the UniqueRows test is its assumption that the data's quality is directly proportionate to its
-uniqueness, which may not always hold true. There might be contexts where certain non-unique rows are essential and
-should not be overlooked.
-- The test does not consider the relative 'importance' of each column in predicting the output, treating all
-columns equally.
-- This test may not be suitable or useful for categorical variables, where the count of unique categories is
-inherently limited.
\ No newline at end of file
diff --git a/site/tests/data_validation/WOEBinPlots.md b/site/tests/data_validation/WOEBinPlots.md
deleted file mode 100644
index b9a9082d8d..0000000000
--- a/site/tests/data_validation/WOEBinPlots.md
+++ /dev/null
@@ -1,47 +0,0 @@
-# WOEBinPlots
-
-Generates visualizations of Weight of Evidence (WoE) and Information Value (IV) for understanding predictive power
-of categorical variables in a data set.
-
-### Purpose
-
-This test is designed to visualize the Weight of Evidence (WoE) and Information Value (IV) for categorical
-variables in a provided dataset. By showcasing the data distribution across different categories of each feature,
-it aids in understanding each variable's predictive power in the context of a classification-based machine learning
-model. Commonly used in credit scoring models, WoE and IV are robust statistical methods for evaluating a
-variable's predictive power.
-
-### Test Mechanism
-
-The test implementation follows defined steps. Initially, it selects non-numeric columns from the dataset and
-changes them to string type, paving the way for accurate binning. It then performs an automated WoE binning
-operation on these selected features, effectively categorizing the potential values of a variable into distinct
-bins. After the binning process, the function generates two separate visualizations (a scatter chart for WoE values
-and a bar chart for IV) for each variable. These visual presentations are formed according to the spread of each
-metric across various categories of each feature.
-
-### Signs of High Risk
-
-- Errors occurring during the binning process.
-- Challenges in converting non-numeric columns into string data type.
-- Imbalance in the distribution of WoE and IV, with certain bins overtaking others conspicuously. This could
-denote that the model is disproportionately dependent on certain variables or categories for predictions, an
-indication of potential risks to its robustness and generalizability.
-
-### Strengths
-
-- Provides a detailed visual representation of the relationship between feature categories and the target variable.
-This grants an intuitive understanding of each feature's contribution to the model.
-- Allows for easy identification of features with high impact, facilitating feature selection and enhancing
-comprehension of the model's decision logic.
-- WoE conversions are monotonic, upholding the rank ordering of the original data points, which simplifies analysis.
-
-### Limitations
-
-- The method is largely reliant on the binning process, and an inappropriate binning threshold or bin number choice
-might result in a misrepresentation of the variable's distribution.
-- While excellent for categorical data, the encoding of continuous variables into categorical can sometimes lead to
-information loss.
-- Extreme or outlier values can dramatically affect the computation of WoE and IV, skewing results.
-- The method requires a sufficient number of events per bin to generate a reliable information value and weight of
-evidence.
\ No newline at end of file
diff --git a/site/tests/data_validation/WOEBinTable.md b/site/tests/data_validation/WOEBinTable.md
deleted file mode 100644
index e43529107f..0000000000
--- a/site/tests/data_validation/WOEBinTable.md
+++ /dev/null
@@ -1,38 +0,0 @@
-# WOEBinTable
-
-Assesses the Weight of Evidence (WoE) and Information Value (IV) of each feature to evaluate its predictive power
-in a binary classification model.
-
-### Purpose
-
-The Weight of Evidence (WoE) and Information Value (IV) test is designed to evaluate the predictive power of each
-feature in a machine learning model. This test generates binned groups of values from each feature, computes the
-WoE and IV for each bin, and provides insights into the relationship between each feature and the target variable,
-illustrating their contribution to the model's predictive capabilities.
-
-### Test Mechanism
-
-The test uses the `scorecardpy.woebin` method to perform automatic binning of the dataset based on WoE. The method
-accepts a list of break points for binning numeric variables through the parameter `breaks_adj`. If no breaks are
-provided, it uses default binning. The bins are then used to calculate the WoE and IV values, effectively creating
-a dataframe that includes the bin boundaries, WoE, and IV values for each feature. A target variable is required
-in the dataset to perform this analysis.
-
-### Signs of High Risk
-
-- High IV values, indicating variables with excessive predictive power which might lead to overfitting.
-- Errors during the binning process, potentially due to inappropriate data types or poorly defined bins.
-
-### Strengths
-
-- Highly effective for feature selection in binary classification problems, as it quantifies the predictive
-information within each feature concerning the binary outcome.
-- The WoE transformation creates a monotonic relationship between the target and independent variables.
-
-### Limitations
-
-- Primarily designed for binary classification tasks, making it less applicable or reliable for multi-class
-classification or regression tasks.
-- Potential difficulties if the dataset has many features, non-binnable features, or non-numeric features.
-- The metric does not help in distinguishing whether the observed predictive factor is due to data randomness or a
-true phenomenon.
\ No newline at end of file
diff --git a/site/tests/data_validation/ZivotAndrewsArch.md b/site/tests/data_validation/ZivotAndrewsArch.md
deleted file mode 100644
index 177a8d349d..0000000000
--- a/site/tests/data_validation/ZivotAndrewsArch.md
+++ /dev/null
@@ -1,38 +0,0 @@
-# ZivotAndrewsArch
-
-Evaluates the order of integration and stationarity of time series data using the Zivot-Andrews unit root test.
-
-### Purpose
-
-The Zivot-Andrews Arch metric is used to evaluate the order of integration for time series data in a machine
-learning model. It's designed to test for stationarity, a crucial aspect of time series analysis in which the
-behavior of the data does not depend on time. Stationarity means that the statistical properties such as mean,
-variance, and autocorrelation are constant over time.
-
-### Test Mechanism
-
-The Zivot-Andrews unit root test is performed on each feature in the dataset using the `ZivotAndrews` function from
-the `arch.unitroot` module. This function returns several metrics for each feature, including the statistical
-value, p-value (probability value), the number of lags used, and the number of observations. The p-value is used to
-decide on the null hypothesis (the time series has a unit root and is non-stationary) based on a chosen level of
-significance.
-
-### Signs of High Risk
-
-- A high p-value suggests high risk, indicating insufficient evidence to reject the null hypothesis, implying that
-the time series has a unit root and is non-stationary.
-- Non-stationary time series data can lead to misleading statistics and unreliable machine learning models.
-
-### Strengths
-
-- Dynamically tests for stationarity against structural breaks in time series data, offering robust evaluation of
-stationarity in features.
-- Especially beneficial with financial, economic, or other time-series data where data observations lack a
-consistent pattern and structural breaks may occur.
-
-### Limitations
-
-- Assumes data is derived from a single-equation, autoregressive model, making it less appropriate for multivariate
-time series data or data not aligning with this model.
-- May not account for unexpected shocks or changes in the series trend, both of which can significantly impact data
-stationarity.
\ No newline at end of file
diff --git a/site/tests/data_validation/nlp/CommonWords.md b/site/tests/data_validation/nlp/CommonWords.md
deleted file mode 100644
index 90aad0ee94..0000000000
--- a/site/tests/data_validation/nlp/CommonWords.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# CommonWords
-
-Assesses the most frequent non-stopwords in a text column for identifying prevalent language patterns.
-
-### Purpose
-
-The CommonWords metric is used to identify and visualize the most prevalent words within a specified text column of
-a dataset. This provides insights into the prevalent language patterns and vocabulary, especially useful in Natural
-Language Processing (NLP) tasks such as text classification and text summarization.
-
-### Test Mechanism
-
-The test methodology involves splitting the specified text column's entries into words, collating them into a
-corpus, and then counting the frequency of each word using the Counter. The forty most frequently occurring
-non-stopwords are then visualized in an interactive bar chart using Plotly, where the x-axis represents the words,
-and the y-axis indicates their frequency of occurrence.
-
-### Signs of High Risk
-
-- A lack of distinct words within the list, or the most common words being stopwords.
-- Frequent occurrence of irrelevant or inappropriate words could point out a poorly curated or noisy dataset.
-- An error returned due to the absence of a valid Dataset object, indicating high risk as the metric cannot be
-effectively implemented without it.
-
-### Strengths
-
-- The metric provides clear insights into the language features – specifically word frequency – of unstructured
-text data.
-- It can reveal prominent vocabulary and language patterns, which prove vital for feature extraction in NLP tasks.
-- The interactive visualization helps in quickly capturing the patterns and understanding the data intuitively.
-
-### Limitations
-
-- The test disregards semantic or context-related information as it solely focuses on word frequency.
-- It intentionally ignores stopwords, which might carry necessary significance in certain scenarios.
-- The applicability is limited to English-language text data as English stopwords are used for filtering, so the
-test cannot account for data in other languages.
-- The metric requires a valid Dataset object, indicating a dependency condition that limits its broader
-applicability.
\ No newline at end of file
diff --git a/site/tests/data_validation/nlp/Hashtags.md b/site/tests/data_validation/nlp/Hashtags.md
deleted file mode 100644
index 885439c504..0000000000
--- a/site/tests/data_validation/nlp/Hashtags.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# Hashtags
-
-Assesses hashtag frequency in a text column, highlighting usage trends and potential dataset bias or spam.
-
-### Purpose
-
-The Hashtags test is designed to measure the frequency of hashtags used within a given text column in a dataset. It
-is particularly useful for natural language processing tasks such as text classification and text summarization.
-The goal is to identify common trends and patterns in the use of hashtags, which can serve as critical indicators
-or features within a machine learning model.
-
-### Test Mechanism
-
-The test implements a regular expression (regex) to extract all hashtags from the specified text column. For each
-hashtag found, it makes a tally of its occurrences. It then outputs a list of the top N hashtags (default is 25,
-but customizable), sorted by their counts in descending order. The results are also visualized in a bar plot, with
-frequency counts on the y-axis and the corresponding hashtags on the x-axis.
-
-### Signs of High Risk
-
-- A low diversity in the usage of hashtags, as indicated by a few hashtags being used disproportionately more than
-others.
-- Repeated usage of one or few hashtags can be indicative of spam or a biased dataset.
-- If there are no or extremely few hashtags found in the dataset, it perhaps signifies that the text data does not
-contain structured social media data.
-
-### Strengths
-
-- Provides a concise visual representation of the frequency of hashtags, which can be critical for understanding
-trends about a particular topic in text data.
-- Instrumental in tasks specifically related to social media text analytics, such as opinion analysis and trend
-discovery.
-- Adaptable, allowing the flexibility to determine the number of top hashtags to be analyzed.
-
-### Limitations
-
-- Assumes the presence of hashtags and therefore may not be applicable for text datasets that do not contain
-hashtags (e.g., formal documents, scientific literature).
-- Language-specific limitations of hashtag formulations are not taken into account.
-- Does not account for typographical errors, variations, or synonyms in hashtags.
-- Does not provide context or sentiment associated with the hashtags, so the information provided may have limited
-utility on its own.
\ No newline at end of file
diff --git a/site/tests/data_validation/nlp/LanguageDetection.md b/site/tests/data_validation/nlp/LanguageDetection.md
deleted file mode 100644
index 96ce990df3..0000000000
--- a/site/tests/data_validation/nlp/LanguageDetection.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# LanguageDetection
-
-Assesses the diversity of languages in a textual dataset by detecting and visualizing the distribution of languages.
-
-### Purpose
-
-The Language Detection test aims to identify and visualize the distribution of languages present within a textual
-dataset. This test helps in understanding the diversity of languages in the data, which is crucial for developing
-and validating multilingual models.
-
-### Test Mechanism
-
-This test operates by:
-
-- Checking if the dataset has a specified text column.
-- Using a language detection library to determine the language of each text entry in the dataset.
-- Generating a histogram plot of the language distribution, with language codes on the x-axis and their frequencies
-on the y-axis.
-
-If the text column is not specified, a ValueError is raised to ensure proper dataset configuration.
-
-### Signs of High Risk
-
-- A high proportion of entries returning "Unknown" language codes.
-- Detection of unexpectedly diverse or incorrect language codes, indicating potential data quality issues.
-- Significant imbalance in language distribution, which might indicate potential biases in the dataset.
-
-### Strengths
-
-- Provides a visual representation of language diversity within the dataset.
-- Helps identify data quality issues related to incorrect or unknown language detection.
-- Useful for ensuring that multilingual models have adequate and appropriate representation from various languages.
-
-### Limitations
-
-- Dependency on the accuracy of the language detection library, which may not be perfect.
-- Languages with similar structures or limited text length may be incorrectly classified.
-- The test returns "Unknown" for entries where language detection fails, which might mask underlying issues with
-certain languages or text formats.
\ No newline at end of file
diff --git a/site/tests/data_validation/nlp/Mentions.md b/site/tests/data_validation/nlp/Mentions.md
deleted file mode 100644
index ef900a086f..0000000000
--- a/site/tests/data_validation/nlp/Mentions.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# Mentions
-
-Calculates and visualizes frequencies of '@' prefixed mentions in a text-based dataset for NLP model analysis.
-
-### Purpose
-
-The "Mentions" test is designed to gauge the quality of data in a Natural Language Processing (NLP) or text-focused
-Machine Learning model. The primary objective is to identify and calculate the frequency of 'mentions' within a
-chosen text column of a dataset. A 'mention' in this context refers to individual text elements that are prefixed
-by '@'. The output of this test reveals the most frequently mentioned entities or usernames, which can be integral
-for applications such as social media analyses or customer sentiment analyses.
-
-### Test Mechanism
-
-The test first verifies the existence of a text column in the provided dataset. It then employs a regular
-expression pattern to extract mentions from the text. Subsequently, the frequency of each unique mention is
-calculated. The test selects the most frequent mentions based on default or user-defined parameters, the default
-being the top 25, for representation. This process of thresholding forms the core of the test. A treemap plot
-visualizes the test results, where the size of each rectangle corresponds to the frequency of a particular mention.
-
-### Signs of High Risk
-
-- The lack of a valid text column in the dataset, which would result in the failure of the test execution.
-- The absence of any mentions within the text data, indicating that there might not be any text associated with
-'@'. This situation could point toward sparse or poor-quality data, thereby hampering the model's generalization or
-learning capabilities.
-
-### Strengths
-
-- The test is specifically optimized for text-based datasets which gives it distinct power in the context of NLP.
-- It enables quick identification and visually appealing representation of the predominant elements or mentions.
-- It can provide crucial insights about the most frequently mentioned entities or usernames.
-
-### Limitations
-
-- The test only recognizes mentions that are prefixed by '@', hence useful textual aspects not preceded by '@'
-might be ignored.
-- This test isn't suited for datasets devoid of textual data.
-- It does not provide insights on less frequently occurring data or outliers, which means potentially significant
-patterns could be overlooked.
\ No newline at end of file
diff --git a/site/tests/data_validation/nlp/PolarityAndSubjectivity.md b/site/tests/data_validation/nlp/PolarityAndSubjectivity.md
deleted file mode 100644
index 02d97a2a77..0000000000
--- a/site/tests/data_validation/nlp/PolarityAndSubjectivity.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# PolarityAndSubjectivity
-
-Analyzes the polarity and subjectivity of text data within a given dataset to visualize the sentiment distribution.
-
-### Purpose
-
-The Polarity and Subjectivity test is designed to evaluate the sentiment expressed in textual data. By analyzing
-these aspects, it helps to identify the emotional tone and subjectivity of the dataset, which could be crucial in
-understanding customer feedback, social media sentiments, or other text-related data.
-
-### Test Mechanism
-
-This test uses TextBlob to compute the polarity and subjectivity scores of textual data in a given dataset. The
-mechanism includes:
-
-- Iterating through each text entry in the specified column of the dataset.
-- Applying the TextBlob library to compute the polarity (ranging from -1 for negative sentiment to +1 for positive
-sentiment) and subjectivity (ranging from 0 for objective to 1 for subjective) for each entry.
-- Creating a scatter plot using Plotly to visualize the relationship between polarity and subjectivity.
-
-### Signs of High Risk
-
-- High concentration of negative polarity values indicating prevalent negative sentiments.
-- High subjectivity scores suggesting the text data is largely opinion-based rather than factual.
-- Disproportionate clusters of extreme scores (e.g., many points near -1 or +1 polarity).
-
-### Strengths
-
-- Quantifies sentiment and subjectivity which can provide actionable insights.
-- Visualizes sentiment distribution, aiding in easy interpretation.
-- Utilizes well-established TextBlob library for sentiment analysis.
-
-### Limitations
-
-- Polarity and subjectivity calculations may oversimplify nuanced text sentiments.
-- Reliance on TextBlob which may not be accurate for all domains or contexts.
-- Visualization could become cluttered with very large datasets, making interpretation difficult.
\ No newline at end of file
diff --git a/site/tests/data_validation/nlp/Punctuations.md b/site/tests/data_validation/nlp/Punctuations.md
deleted file mode 100644
index ce04812e10..0000000000
--- a/site/tests/data_validation/nlp/Punctuations.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# Punctuations
-
-Analyzes and visualizes the frequency distribution of punctuation usage in a given text dataset.
-
-### Purpose
-
-The Punctuations Metric's primary purpose is to analyze the frequency of punctuation usage within a given text
-dataset. This is often used in Natural Language Processing tasks, such as text classification and text
-summarization.
-
-### Test Mechanism
-
-The test begins by verifying that the input "dataset" is of the type VMDataset. The count_mode parameter must be
-either "token" (counts punctuation marks as individual tokens) or "word" (counts punctuation marks within words).
-Following that, a corpus is created from the dataset by splitting its text on spaces. Each unique punctuation
-character in the text corpus is then tallied. The frequency distribution of each punctuation symbol is visualized
-as a bar graph, with these results being stored as Figures and associated with the main Punctuations object.
-
-### Signs of High Risk
-
-- Excessive or unusual frequency of specific punctuation marks, potentially denoting dubious quality, data
-corruption, or skewed data.
-
-### Strengths
-
-- Provides valuable insights into the distribution of punctuation usage in a text dataset.
-- Important in validating the quality, consistency, and nature of the data.
-- Can provide hints about the style or tonality of the text corpus, such as informal and emotional context
-indicated by frequent exclamation marks.
-
-### Limitations
-
-- Focuses solely on punctuation usage, potentially missing other important textual characteristics.
-- General cultural or tonality assumptions based on punctuation distribution can be misleading, as these vary
-across different languages and contexts.
-- Less effective with languages that use non-standard or different punctuation.
-- Visualization may lack interpretability when there are many unique punctuation marks in the dataset.
\ No newline at end of file
diff --git a/site/tests/data_validation/nlp/Sentiment.md b/site/tests/data_validation/nlp/Sentiment.md
deleted file mode 100644
index 26f3bd8348..0000000000
--- a/site/tests/data_validation/nlp/Sentiment.md
+++ /dev/null
@@ -1,33 +0,0 @@
-# Sentiment
-
-Analyzes the sentiment of text data within a dataset using the VADER sentiment analysis tool.
-
-### Purpose
-
-The Sentiment test evaluates the overall sentiment of text data within a dataset. By analyzing sentiment scores, it
-aims to ensure that the model is interpreting text data accurately and is not biased towards a particular sentiment.
-
-### Test Mechanism
-
-This test uses the VADER (Valence Aware Dictionary and sEntiment Reasoner) SentimentIntensityAnalyzer. It processes
-each text entry in a specified column of the dataset to calculate the compound sentiment score, which represents
-the overall sentiment polarity. The distribution of these sentiment scores is then visualized using a KDE (Kernel
-Density Estimation) plot, highlighting any skewness or concentration in sentiment.
-
-### Signs of High Risk
-
-- Extreme polarity in sentiment scores, indicating potential bias.
-- Unusual concentration of sentiment scores in a specific range.
-- Significant deviation from expected sentiment distribution for the given text data.
-
-### Strengths
-
-- Provides a clear visual representation of sentiment distribution.
-- Uses a well-established sentiment analysis tool (VADER).
-- Can handle a wide range of text data, making it flexible for various applications.
-
-### Limitations
-
-- May not capture nuanced or context-specific sentiments.
-- Relies heavily on the accuracy of the VADER sentiment analysis tool.
-- Visualization alone may not provide comprehensive insights into underlying causes of sentiment distribution.
\ No newline at end of file
diff --git a/site/tests/data_validation/nlp/StopWords.md b/site/tests/data_validation/nlp/StopWords.md
deleted file mode 100644
index dee3a240ef..0000000000
--- a/site/tests/data_validation/nlp/StopWords.md
+++ /dev/null
@@ -1,47 +0,0 @@
-# StopWords
-
-Evaluates and visualizes the frequency of English stop words in a text dataset against a defined threshold.
-
-### Purpose
-
-The StopWords threshold test is a tool designed for assessing the quality of text data in an ML model. It focuses
-on the identification and analysis of "stop words" in a given dataset. Stop words are frequent, common, yet
-semantically insignificant words (for example: "the", "and", "is") in a language. This test evaluates the
-proportion of stop words to the total word count in the dataset, in essence, scrutinizing the frequency of stop
-word usage. The core objective is to highlight the prevalent stop words based on their usage frequency, which can
-be instrumental in cleaning the data from noise and improving ML model performance.
-
-### Test Mechanism
-
-The StopWords test initiates on receiving an input of a 'VMDataset' object. Absence of such an object will trigger
-an error. The methodology involves inspection of the text column of the VMDataset to create a 'corpus' (a
-collection of written texts). Leveraging the Natural Language Toolkit's (NLTK) stop word repository, the test
-screens the corpus for any stop words and documents their frequency. It further calculates the percentage usage of
-each stop word compared to the total word count in the corpus. This percentage is evaluated against a predefined
-'min_percent_threshold'. If this threshold is breached, the test returns a failed output. Top prevailing stop words
-along with their usage percentages are returned, facilitated by a bar chart visualization of these stop words and
-their frequency.
-
-### Signs of High Risk
-
-- A percentage of any stop words exceeding the predefined 'min_percent_threshold'.
-- High frequency of stop words in the dataset which may adversely affect the application's analytical performance
-due to noise creation.
-
-### Strengths
-
-- The ability to scrutinize and quantify the usage of stop words.
-- Provides insights into potential noise in the text data due to stop words.
-- Directly aids in enhancing model training efficiency.
-- Includes a bar chart visualization feature to easily interpret and act upon the stop words frequency
-information.
-
-### Limitations
-
-- The test only supports English stop words, making it less effective with datasets of other languages.
-- The 'min_percent_threshold' parameter may require fine-tuning for different datasets, impacting the overall
-effectiveness of the test.
-- Contextual use of the stop words within the dataset is not considered, potentially overlooking their significance
-in certain contexts.
-- The test focuses specifically on the frequency of stop words, not providing direct measures of model performance
-or predictive accuracy.
\ No newline at end of file
diff --git a/site/tests/data_validation/nlp/TextDescription.md b/site/tests/data_validation/nlp/TextDescription.md
deleted file mode 100644
index d61f8c4dd4..0000000000
--- a/site/tests/data_validation/nlp/TextDescription.md
+++ /dev/null
@@ -1,43 +0,0 @@
-# TextDescription
-
-Conducts comprehensive textual analysis on a dataset using NLTK to evaluate various parameters and generate
-visualizations.
-
-### Purpose
-
-The TextDescription test aims to conduct a thorough textual analysis of a dataset using the NLTK (Natural Language
-Toolkit) library. It evaluates various metrics such as total words, total sentences, average sentence length, total
-paragraphs, total unique words, most common words, total punctuations, and lexical diversity. The goal is to
-understand the nature of the text and anticipate challenges machine learning models might face in text processing,
-language understanding, or summarization tasks.
-
-### Test Mechanism
-
-The test works by:
-
-- Parsing the dataset and tokenizing the text into words, sentences, and paragraphs using NLTK.
-- Removing stopwords and unwanted tokens.
-- Calculating parameters like total words, total sentences, average sentence length, total paragraphs, total unique
-words, total punctuations, and lexical diversity.
-- Generating scatter plots to visualize correlations between various metrics (e.g., Total Words vs Total Sentences).
-
-### Signs of High Risk
-
-- Anomalies or increased complexity in lexical diversity.
-- Longer sentences and paragraphs.
-- High uniqueness of words.
-- Large number of unwanted tokens.
-- Missing or erroneous visualizations.
-
-### Strengths
-
-- Essential for pre-processing text data in machine learning models.
-- Provides a comprehensive breakdown of text data, aiding in understanding its complexity.
-- Generates visualizations to help comprehend text structure and complexity.
-
-### Limitations
-
-- Highly dependent on the NLTK library, limiting the test to supported languages.
-- Limited customization for removing undesirable tokens and stop words.
-- Does not consider semantic or grammatical complexities.
-- Assumes well-structured documents, which may result in inaccuracies with poorly formatted text.
\ No newline at end of file
diff --git a/site/tests/data_validation/nlp/Toxicity.md b/site/tests/data_validation/nlp/Toxicity.md
deleted file mode 100644
index 053f015dba..0000000000
--- a/site/tests/data_validation/nlp/Toxicity.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# Toxicity
-
-Assesses the toxicity of text data within a dataset to visualize the distribution of toxicity scores.
-
-### Purpose
-
-The Toxicity test aims to evaluate the level of toxic content present in a text dataset by leveraging a pre-trained
-toxicity model. It helps in identifying potentially harmful or offensive language that may negatively impact users
-or stakeholders.
-
-### Test Mechanism
-
-This test uses a pre-trained toxicity evaluation model and applies it to each text entry in the specified column of
-a dataset’s dataframe. The procedure involves:
-
-- Loading a pre-trained toxicity model.
-- Extracting the text from the specified column in the dataset.
-- Computing toxicity scores for each text entry.
-- Generating a KDE (Kernel Density Estimate) plot to visualize the distribution of these toxicity scores.
-
-### Signs of High Risk
-
-- High concentration of high toxicity scores in the KDE plot.
-- A significant proportion of text entries with toxicity scores above a predefined threshold.
-- Wide distribution of toxicity scores, indicating inconsistency in content quality.
-
-### Strengths
-
-- Provides a visual representation of toxicity distribution, making it easier to identify outliers.
-- Uses a robust pre-trained model for toxicity evaluation.
-- Can process large text datasets efficiently.
-
-### Limitations
-
-- Depends on the accuracy and bias of the pre-trained toxicity model.
-- Does not provide context-specific insights, which may be necessary for nuanced understanding.
-- May not capture all forms of subtle or indirect toxic language.
\ No newline at end of file
diff --git a/site/tests/model_validation/BertScore.md b/site/tests/model_validation/BertScore.md
deleted file mode 100644
index 88da9fd625..0000000000
--- a/site/tests/model_validation/BertScore.md
+++ /dev/null
@@ -1,47 +0,0 @@
-# BertScore
-
-Assesses the quality of machine-generated text using BERTScore metrics and visualizes results through histograms
-and bar charts, alongside compiling a comprehensive table of descriptive statistics.
-
-### Purpose
-
-This function is designed to assess the quality of text generated by machine learning models using BERTScore
-metrics. BERTScore evaluates text generation models' performance by calculating precision, recall, and F1 score
-based on BERT contextual embeddings.
-
-### Test Mechanism
-
-The function starts by extracting the true and predicted values from the provided dataset and model. It then
-initializes the BERTScore evaluator. For each pair of true and predicted texts, the function calculates the
-BERTScore metrics and compiles them into a dataframe. Histograms and bar charts are generated for each BERTScore
-metric (Precision, Recall, and F1 Score) to visualize their distribution. Additionally, a table of descriptive
-statistics (mean, median, standard deviation, minimum, and maximum) is compiled for each metric, providing a
-comprehensive summary of the model's performance. The test uses the `evaluation_model` param to specify the
-huggingface model to use for evaluation. `microsoft/deberta-xlarge-mnli` is the best-performing model but is
-very large and may be slow without a GPU. `microsoft/deberta-large-mnli` is a smaller model that is faster to
-run and `distilbert-base-uncased` is much lighter and can run on a CPU but is less accurate.
-
-### Signs of High Risk
-
-- Consistently low scores across BERTScore metrics could indicate poor quality in the generated text, suggesting
-that the model fails to capture the essential content of the reference texts.
-- Low precision scores might suggest that the generated text contains a lot of redundant or irrelevant information.
-- Low recall scores may indicate that important information from the reference text is being omitted.
-- An imbalanced performance between precision and recall, reflected by a low F1 Score, could signal issues in the
-model's ability to balance informativeness and conciseness.
-
-### Strengths
-
-- Provides a multifaceted evaluation of text quality through different BERTScore metrics, offering a detailed view
-of model performance.
-- Visual representations (histograms and bar charts) make it easier to interpret the distribution and trends of the
-scores.
-- Descriptive statistics offer a concise summary of the model's strengths and weaknesses in generating text.
-
-### Limitations
-
-- BERTScore relies on the contextual embeddings from BERT models, which may not fully capture all nuances of text
-similarity.
-- The evaluation relies on the availability of high-quality reference texts, which may not always be obtainable.
-- While useful for comparison, BERTScore metrics alone do not provide a complete assessment of a model's
-performance and should be supplemented with other metrics and qualitative analysis.
\ No newline at end of file
diff --git a/site/tests/model_validation/BleuScore.md b/site/tests/model_validation/BleuScore.md
deleted file mode 100644
index a4b7d0b717..0000000000
--- a/site/tests/model_validation/BleuScore.md
+++ /dev/null
@@ -1,44 +0,0 @@
-# BleuScore
-
-Evaluates the quality of machine-generated text using BLEU metrics and visualizes the results through histograms
-and bar charts, alongside compiling a comprehensive table of descriptive statistics for BLEU scores.
-
-### Purpose
-
-This function is designed to assess the quality of text generated by machine learning models using the BLEU metric.
-BLEU, which stands for Bilingual Evaluation Understudy, is a metric used to evaluate the overlap of n-grams between
-the machine-generated text and reference texts. This evaluation is crucial for tasks such as text summarization,
-machine translation, and text generation, where the goal is to produce text that accurately reflects the content
-and meaning of human-crafted references.
-
-### Test Mechanism
-
-The function starts by extracting the true and predicted values from the provided dataset and model. It then
-initializes the BLEU evaluator. For each pair of true and predicted texts, the function calculates the BLEU scores
-and compiles them into a dataframe. Histograms and bar charts are generated for the BLEU scores to visualize their
-distribution. Additionally, a table of descriptive statistics (mean, median, standard deviation, minimum, and
-maximum) is compiled for the BLEU scores, providing a comprehensive summary of the model's performance.
-
-### Signs of High Risk
-
-- Consistently low BLEU scores could indicate poor quality in the generated text, suggesting that the model fails
-to capture the essential content of the reference texts.
-- Low precision scores might suggest that the generated text contains a lot of redundant or irrelevant information.
-- Low recall scores may indicate that important information from the reference text is being omitted.
-- An imbalanced performance between precision and recall, reflected by a low BLEU score, could signal issues in the
-model's ability to balance informativeness and conciseness.
-
-### Strengths
-
-- Provides a straightforward and widely-used evaluation of text quality through BLEU scores.
-- Visual representations (histograms and bar charts) make it easier to interpret the distribution and trends of the
-scores.
-- Descriptive statistics offer a concise summary of the model's strengths and weaknesses in generating text.
-
-### Limitations
-
-- BLEU metrics primarily focus on n-gram overlap and may not fully capture semantic coherence, fluency, or
-grammatical quality of the text.
-- The evaluation relies on the availability of high-quality reference texts, which may not always be obtainable.
-- While useful for comparison, BLEU scores alone do not provide a complete assessment of a model's performance and
-should be supplemented with other metrics and qualitative analysis.
\ No newline at end of file
diff --git a/site/tests/model_validation/ClusterSizeDistribution.md b/site/tests/model_validation/ClusterSizeDistribution.md
deleted file mode 100644
index 1435f258a3..0000000000
--- a/site/tests/model_validation/ClusterSizeDistribution.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# ClusterSizeDistribution
-
-Assesses the performance of clustering models by comparing the distribution of cluster sizes in model predictions
-with the actual data.
-
-### Purpose
-
-The Cluster Size Distribution test aims to assess the performance of clustering models by comparing the
-distribution of cluster sizes in the model's predictions with the actual data. This comparison helps determine if
-the clustering model's output aligns well with the true cluster distribution, providing insights into the model's
-accuracy and performance.
-
-### Test Mechanism
-
-The test mechanism involves the following steps:
-- Run the clustering model on the provided dataset to obtain predictions.
-- Convert both the actual and predicted outputs into pandas dataframes.
-- Use pandas built-in functions to derive the cluster size distributions from these dataframes.
-- Construct two histograms: one for the actual cluster size distribution and one for the predicted distribution.
-- Plot the histograms side-by-side for visual comparison.
-
-### Signs of High Risk
-
-- Discrepancies between the actual cluster size distribution and the predicted cluster size distribution.
-- Irregular distribution of data across clusters in the predicted outcomes.
-- High number of outlier clusters suggesting the model struggles to correctly group data.
-
-### Strengths
-
-- Provides a visual and intuitive way to compare the clustering model's performance against actual data.
-- Effectively reveals where the model may be over- or underestimating cluster sizes.
-- Versatile as it works well with any clustering model.
-
-### Limitations
-
-- Assumes that the actual cluster distribution is optimal, which may not always be the case.
-- Relies heavily on visual comparison, which could be subjective and may not offer a precise numerical measure of
-performance.
-- May not fully capture other important aspects of clustering, such as cluster density, distances between clusters,
-and the shape of clusters.
\ No newline at end of file
diff --git a/site/tests/model_validation/ContextualRecall.md b/site/tests/model_validation/ContextualRecall.md
deleted file mode 100644
index 0811caf43f..0000000000
--- a/site/tests/model_validation/ContextualRecall.md
+++ /dev/null
@@ -1,45 +0,0 @@
-# ContextualRecall
-
-Evaluates a Natural Language Generation model's ability to generate contextually relevant and factually correct
-text, visualizing the results through histograms and bar charts, alongside compiling a comprehensive table of
-descriptive statistics for contextual recall scores.
-
-### Purpose
-
-The Contextual Recall metric is used to evaluate the ability of a natural language generation (NLG) model to
-generate text that appropriately reflects the given context or prompt. It measures the model's capability to
-remember and reproduce the main context in its resulting output. This metric is critical in natural language
-processing tasks, as the coherency and contextuality of the generated text are essential.
-
-### Test Mechanism
-
-The function starts by extracting the true and predicted values from the provided dataset and model. It then
-tokenizes the reference and candidate texts into discernible words or tokens using NLTK. The token overlap between
-the reference and candidate texts is identified, and the Contextual Recall score is computed by dividing the number
-of overlapping tokens by the total number of tokens in the reference text. Scores are calculated for each test
-dataset instance, resulting in an array of scores. These scores are visualized using a histogram and a bar chart to
-show score variations across different rows. Additionally, a table of descriptive statistics (mean, median,
-standard deviation, minimum, and maximum) is compiled for the contextual recall scores, providing a comprehensive
-summary of the model's performance.
-
-### Signs of High Risk
-
-- Low contextual recall scores could indicate that the model is not effectively reflecting the original context in
-its output, leading to incoherent or contextually misaligned text.
-- A consistent trend of low recall scores could suggest underperformance of the model.
-
-### Strengths
-
-- Provides a quantifiable measure of a model's adherence to the context and factual elements of the generated
-narrative.
-- Visual representations (histograms and bar charts) make it easier to interpret the distribution and trends of
-contextual recall scores.
-- Descriptive statistics offer a concise summary of the model's performance in generating contextually relevant
-texts.
-
-### Limitations
-
-- The focus on word overlap could result in high scores for texts that use many common words, even when these texts
-lack coherence or meaningful context.
-- This metric does not consider the order of words, which could lead to overestimated scores for scrambled outputs.
-- Models that effectively use infrequent words might be undervalued, as these words might not overlap as often.
\ No newline at end of file
diff --git a/site/tests/model_validation/FeaturesAUC.md b/site/tests/model_validation/FeaturesAUC.md
deleted file mode 100644
index 845e8620e7..0000000000
--- a/site/tests/model_validation/FeaturesAUC.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# FeaturesAUC
-
-Evaluates the discriminatory power of each individual feature within a binary classification model by calculating
-the Area Under the Curve (AUC) for each feature separately.
-
-### Purpose
-
-The central objective of this metric is to quantify how well each feature on its own can differentiate between the
-two classes in a binary classification problem. It serves as a univariate analysis tool that can help in
-pre-modeling feature selection or post-modeling interpretation.
-
-### Test Mechanism
-
-For each feature, the metric treats the feature values as raw scores to compute the AUC against the actual binary
-outcomes. It provides an AUC value for each feature, offering a simple yet powerful indication of each feature's
-univariate classification strength.
-
-### Signs of High Risk
-
-- A feature with a low AUC score may not be contributing significantly to the differentiation between the two
-classes, which could be a concern if it is expected to be predictive.
-- Conversely, a surprisingly high AUC for a feature not believed to be informative may suggest data leakage or
-other issues with the data.
-
-### Strengths
-
-- By isolating each feature, it highlights the individual contribution of features to the classification task
-without the influence of other variables.
-- Useful for both initial feature evaluation and for providing insights into the model's reliance on individual
-features after model training.
-
-### Limitations
-
-- Does not reflect the combined effects of features or any interaction between them, which can be critical in
-certain models.
-- The AUC values are calculated without considering the model's use of the features, which could lead to different
-interpretations of feature importance when considering the model holistically.
-- This metric is applicable only to binary classification tasks and cannot be directly extended to multiclass
-classification or regression without modifications.
\ No newline at end of file
diff --git a/site/tests/model_validation/MeteorScore.md b/site/tests/model_validation/MeteorScore.md
deleted file mode 100644
index a37aa3a386..0000000000
--- a/site/tests/model_validation/MeteorScore.md
+++ /dev/null
@@ -1,48 +0,0 @@
-# MeteorScore
-
-Assesses the quality of machine-generated translations by comparing them to human-produced references using the
-METEOR score, which evaluates precision, recall, and word order.
-
-### Purpose
-
-The METEOR (Metric for Evaluation of Translation with Explicit ORdering) score is designed to evaluate the quality
-of machine translations by comparing them against reference translations. It emphasizes both the accuracy and
-fluency of translations, incorporating precision, recall, and word order into its assessment.
-
-### Test Mechanism
-
-The function starts by extracting the true and predicted values from the provided dataset and model. The METEOR
-score is computed for each pair of machine-generated translation (prediction) and its corresponding human-produced
-reference. This is done by considering unigram matches between the translations, including matches based on surface
-forms, stemmed forms, and synonyms. The score is a combination of unigram precision and recall, adjusted for word
-order through a fragmentation penalty. Scores are compiled into a dataframe, and histograms and bar charts are
-generated to visualize the distribution of METEOR scores. Additionally, a table of descriptive statistics (mean,
-median, standard deviation, minimum, and maximum) is compiled for the METEOR scores, providing a comprehensive
-summary of the model's performance.
-
-### Signs of High Risk
-
-- Lower METEOR scores can indicate a lack of alignment between the machine-generated translations and their
-human-produced references, highlighting potential deficiencies in both the accuracy and fluency of translations.
-- Significant discrepancies in word order or an excessive fragmentation penalty could signal issues with how the
-translation model processes and reconstructs sentence structures, potentially compromising the natural flow of
-translated text.
-- Persistent underperformance across a variety of text types or linguistic contexts might suggest a broader
-inability of the model to adapt to the nuances of different languages or dialects, pointing towards gaps in its
-training or inherent limitations.
-
-### Strengths
-
-- Incorporates a balanced consideration of precision and recall, weighted towards recall to reflect the importance
-of content coverage in translations.
-- Directly accounts for word order, offering a nuanced evaluation of translation fluency beyond simple lexical
-matching.
-- Adapts to various forms of lexical similarity, including synonyms and stemmed forms, allowing for flexible
-matching.
-
-### Limitations
-
-- While comprehensive, the complexity of METEOR's calculation can make it computationally intensive, especially for
-large datasets.
-- The use of external resources for synonym and stemming matching may introduce variability based on the resources'
-quality and relevance to the specific translation task.
\ No newline at end of file
diff --git a/site/tests/model_validation/ModelMetadata.md b/site/tests/model_validation/ModelMetadata.md
deleted file mode 100644
index 7c58fa3ce5..0000000000
--- a/site/tests/model_validation/ModelMetadata.md
+++ /dev/null
@@ -1,21 +0,0 @@
-# ModelMetadata
-
-Compare metadata of different models and generate a summary table with the results.
-
-**Purpose**: The purpose of this function is to compare the metadata of different models, including information about their architecture, framework, framework version, and programming language.
-
-**Test Mechanism**: The function retrieves the metadata for each model using `get_model_info`, renames columns according to a predefined set of labels, and compiles this information into a summary table.
-
-**Signs of High Risk**:
-
-- Inconsistent or missing metadata across models can indicate potential issues in model documentation or management.
-- Significant differences in framework versions or programming languages might pose challenges in model integration and deployment.
-
-**Strengths**:
-
-- Provides a clear comparison of essential model metadata.
-- Standardizes metadata labels for easier interpretation and comparison.
-- Helps identify potential compatibility or consistency issues across models.
-
-**Limitations**:
-
-- Assumes that the `get_model_info` function returns all necessary metadata fields.
-- Relies on the correctness and completeness of the metadata provided by each model.
-- Does not include detailed parameter information, focusing instead on high-level metadata.
\ No newline at end of file
diff --git a/site/tests/model_validation/ModelPredictionResiduals.md b/site/tests/model_validation/ModelPredictionResiduals.md
deleted file mode 100644
index 4590b69105..0000000000
--- a/site/tests/model_validation/ModelPredictionResiduals.md
+++ /dev/null
@@ -1,32 +0,0 @@
-# ModelPredictionResiduals
-
-Assesses normality and behavior of residuals in regression models through visualization and statistical tests.
-
-### Purpose
-
-The Model Prediction Residuals test aims to visualize the residuals of model predictions and assess their normality
-using the Kolmogorov-Smirnov (KS) test. It helps to identify potential issues related to model assumptions and
-effectiveness.
-
-### Test Mechanism
-
-The function calculates residuals and generates
-two figures: one for the time series of residuals and one for the histogram of residuals.
-It also calculates the KS test for normality and summarizes the results in a table.
-
-### Signs of High Risk
-
-- Residuals are not normally distributed, indicating potential issues with model assumptions.
-- High skewness or kurtosis in the residuals, which may suggest model misspecification.
-
-### Strengths
-
-- Provides clear visualizations of residuals over time and their distribution.
-- Includes statistical tests to assess the normality of residuals.
-- Helps in identifying potential model misspecifications and assumption violations.
-
-### Limitations
-
-- Assumes that the dataset is provided as a DataFrameDataset object with a .df attribute to access the pandas
-DataFrame.
-- Only generates plots for datasets with a datetime index, resulting in errors for other types of indices.
\ No newline at end of file
diff --git a/site/tests/model_validation/RegardScore.md b/site/tests/model_validation/RegardScore.md
deleted file mode 100644
index 799a1c0bdd..0000000000
--- a/site/tests/model_validation/RegardScore.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# RegardScore
-
-Assesses the sentiment and potential biases in text generated by NLP models by computing and visualizing regard
-scores.
-
-### Purpose
-
-The `RegardScore` test aims to evaluate the levels of regard (positive, negative, neutral, or other) in texts
-generated by NLP models. It helps in understanding the sentiment and bias present in the generated content.
-
-### Test Mechanism
-
-This test extracts the true and predicted values from the provided dataset and model. It then computes the regard
-scores for each text instance using a preloaded `regard` evaluation tool. The scores are compiled into dataframes,
-and visualizations such as histograms and bar charts are generated to display the distribution of regard scores.
-Additionally, descriptive statistics (mean, median, standard deviation, minimum, and maximum) are calculated for
-the regard scores, providing a comprehensive overview of the model's performance.
-
-### Signs of High Risk
-
-- Noticeable skewness in the histogram, especially when comparing the predicted regard scores with the target
-regard scores, can indicate biases or inconsistencies in the model.
-- Lack of neutral scores in the model's predictions, despite a balanced distribution in the target data, might
-signal an issue.
-
-### Strengths
-
-- Provides a clear evaluation of regard levels in generated texts, aiding in ensuring content appropriateness.
-- Visual representations (histograms and bar charts) make it easier to interpret the distribution and trends of
-regard scores.
-- Descriptive statistics offer a concise summary of the model's performance in generating texts with balanced
-sentiments.
-
-### Limitations
-
-- The accuracy of the regard scores is contingent upon the underlying `regard` tool.
-- The scores provide a broad overview but do not specify which portions or tokens of the text are responsible for
-high regard.
-- Supplementary, in-depth analysis might be needed for granular insights.
\ No newline at end of file
diff --git a/site/tests/model_validation/RegressionResidualsPlot.md b/site/tests/model_validation/RegressionResidualsPlot.md
deleted file mode 100644
index 0da8faef07..0000000000
--- a/site/tests/model_validation/RegressionResidualsPlot.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# RegressionResidualsPlot
-
-Evaluates regression model performance using residual distribution and actual vs. predicted plots.
-
-### Purpose
-
-The `RegressionResidualsPlot` metric aims to evaluate the performance of regression models. By generating and
-analyzing two plots – a distribution of residuals and a scatter plot of actual versus predicted values – this tool
-helps to visually appraise how well the model predicts and the nature of errors it makes.
-
-### Test Mechanism
-
-The process begins by extracting the true output values (`y_true`) and the model's predicted values (`y_pred`).
-Residuals are computed by subtracting predicted from true values. These residuals are then visualized using a
-histogram to display their distribution. Additionally, a scatter plot is derived to compare true values against
-predicted values, together with a "Perfect Fit" line, which represents an ideal match (predicted values equal
-actual values), facilitating the assessment of the model's predictive accuracy.
-
-### Signs of High Risk
-
-- Residuals showing a non-normal distribution, especially those with frequent extreme values.
-- Significant deviations of predicted values from actual values in the scatter plot.
-- Sparse density of data points near the "Perfect Fit" line in the scatter plot, indicating poor prediction
-accuracy.
-- Visible patterns or trends in the residuals plot, suggesting the model's failure to capture the underlying data
-structure adequately.
-
-### Strengths
-
-- Provides a direct, visually intuitive assessment of a regression model’s accuracy and handling of data.
-- Visual plots can highlight issues of underfitting or overfitting.
-- Can reveal systematic deviations or trends that purely numerical metrics might miss.
-- Applicable across various regression model types.
-
-### Limitations
-
-- Relies on visual interpretation, which can be subjective and less precise than numerical evaluations.
-- May be difficult to interpret in cases with multi-dimensional outputs due to the plots’ two-dimensional nature.
-- Overlapping data points in the residuals plot can complicate interpretation efforts.
-- Does not summarize model performance into a single quantifiable metric, which might be needed for comparative or
-summary analyses.
\ No newline at end of file
diff --git a/site/tests/model_validation/RougeScore.md b/site/tests/model_validation/RougeScore.md
deleted file mode 100644
index 4ce520aa48..0000000000
--- a/site/tests/model_validation/RougeScore.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# RougeScore
-
-Assesses the quality of machine-generated text using ROUGE metrics and visualizes the results to provide
-comprehensive performance insights.
-
-### Purpose
-
-The ROUGE Score test is designed to evaluate the quality of text generated by machine learning models using various
-ROUGE metrics. ROUGE, which stands for Recall-Oriented Understudy for Gisting Evaluation, measures the overlap of
-n-grams, word sequences, and word pairs between machine-generated text and reference texts. This evaluation is
-crucial for tasks like text summarization, machine translation, and text generation, where the goal is to produce
-text that accurately reflects the content and meaning of human-crafted references.
-
-### Test Mechanism
-
-The test extracts the true and predicted values from the provided dataset and model. It initializes the ROUGE
-evaluator with the specified metric (e.g., ROUGE-1). For each pair of true and predicted texts, it calculates the
-ROUGE scores and compiles them into a dataframe. Histograms and bar charts are generated for each ROUGE metric
-(Precision, Recall, and F1 Score) to visualize their distribution. Additionally, a table of descriptive statistics
-(mean, median, standard deviation, minimum, and maximum) is compiled for each metric, providing a comprehensive
-summary of the model's performance.
-
-### Signs of High Risk
-
-- Consistently low scores across ROUGE metrics could indicate poor quality in the generated text, suggesting that
-the model fails to capture the essential content of the reference texts.
-- Low precision scores might suggest that the generated text contains a lot of redundant or irrelevant information.
-- Low recall scores may indicate that important information from the reference text is being omitted.
-- An imbalanced performance between precision and recall, reflected by a low F1 Score, could signal issues in the
-model's ability to balance informativeness and conciseness.
-
-### Strengths
-
-- Provides a multifaceted evaluation of text quality through different ROUGE metrics, offering a detailed view of
-model performance.
-- Visual representations (histograms and bar charts) make it easier to interpret the distribution and trends of the
-scores.
-- Descriptive statistics offer a concise summary of the model's strengths and weaknesses in generating text.
-
-### Limitations
-
-- ROUGE metrics primarily focus on n-gram overlap and may not fully capture semantic coherence, fluency, or
-grammatical quality of the text.
-- The evaluation relies on the availability of high-quality reference texts, which may not always be obtainable.
-- While useful for comparison, ROUGE scores alone do not provide a complete assessment of a model's performance and
-should be supplemented with other metrics and qualitative analysis.
\ No newline at end of file
diff --git a/site/tests/model_validation/TimeSeriesPredictionWithCI.md b/site/tests/model_validation/TimeSeriesPredictionWithCI.md
deleted file mode 100644
index 09a8a26f72..0000000000
--- a/site/tests/model_validation/TimeSeriesPredictionWithCI.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# TimeSeriesPredictionWithCI
-
-Assesses predictive accuracy and uncertainty in time series models, highlighting breaches beyond confidence
-intervals.
-
-### Purpose
-
-The purpose of the Time Series Prediction with Confidence Intervals (CI) test is to visualize the actual versus
-predicted values for time series data, including confidence intervals, and to compute and report the number of
-breaches beyond these intervals. This helps in evaluating the reliability and accuracy of the model's predictions.
-
-### Test Mechanism
-
-The function performs the following steps:
-
-- Calculates the standard deviation of prediction errors.
-- Determines the confidence intervals using a specified confidence level, typically 95%.
-- Counts the number of actual values that fall outside the confidence intervals, referred to as breaches.
-- Generates a plot visualizing the actual values, predicted values, and confidence intervals.
-- Returns a DataFrame summarizing the breach information, including the total breaches, upper breaches, and lower
-breaches.
-
-### Signs of High Risk
-
-- A high number of breaches indicates that the model's predictions are not reliable within the specified confidence
-level.
-- Significant deviations between actual and predicted values may highlight model inadequacies or issues with data
-quality.
-
-### Strengths
-
-- Provides a visual representation of prediction accuracy and the uncertainty around predictions.
-- Includes a statistical measure of prediction reliability through confidence intervals.
-- Computes and reports breaches, offering a quantitative assessment of prediction performance.
-
-### Limitations
-
-- Assumes that the dataset is provided as a DataFrameDataset object with a datetime index.
-- Requires that `dataset.y_pred(model)` returns the predicted values for the model.
-- The calculation of confidence intervals assumes normally distributed errors, which may not hold for all datasets.
\ No newline at end of file
diff --git a/site/tests/model_validation/TimeSeriesPredictionsPlot.md b/site/tests/model_validation/TimeSeriesPredictionsPlot.md
deleted file mode 100644
index feed0a597b..0000000000
--- a/site/tests/model_validation/TimeSeriesPredictionsPlot.md
+++ /dev/null
@@ -1,26 +0,0 @@
-# TimeSeriesPredictionsPlot
-
-Plot actual vs predicted values for time series data and generate a visual comparison for the model.
-
-### Purpose
-
-The purpose of this function is to visualize the actual versus predicted values for time
-series data for a single model.
-
-### Test Mechanism
-
-The function plots the actual values from the dataset and overlays the predicted
-values from the model using Plotly for interactive visualization.
-
-### Signs of High Risk
-
-- Large discrepancies between actual and predicted values indicate poor model performance.
-- Systematic deviations in predicted values can highlight model bias or issues with data patterns.
-
-### Strengths
-
-- Provides a clear visual comparison of model predictions against actual values.
-- Uses Plotly for interactive and visually appealing plots.
-
-### Limitations
-
-- Assumes that the dataset is provided as a DataFrameDataset object with a datetime index.
-- Requires that `dataset.y_pred(model)` returns the predicted values for the model.
\ No newline at end of file
diff --git a/site/tests/model_validation/TimeSeriesR2SquareBySegments.md b/site/tests/model_validation/TimeSeriesR2SquareBySegments.md
deleted file mode 100644
index ea8684ab33..0000000000
--- a/site/tests/model_validation/TimeSeriesR2SquareBySegments.md
+++ /dev/null
@@ -1,36 +0,0 @@
-# TimeSeriesR2SquareBySegments
-
-Evaluates the R-Squared values of regression models over specified time segments in time series data to assess
-segment-wise model performance.
-
-### Purpose
-
-The TimeSeriesR2SquareBySegments test aims to evaluate the R-Squared values for several regression models across
-different segments of time series data. This helps in determining how well the models explain the variability in
-the data within each specific time segment.
-
-### Test Mechanism
-- Provides a visual representation of model performance across different time segments.
-- Allows for identification of segments where the model performs poorly.
-- Calculates the R-Squared values for each segment.
-- Generates a bar chart to visually represent the R-Squared values across different models and segments.
-
-### Signs of High Risk
-
-- Significantly low R-Squared values for certain time segments, indicating poor model performance in those periods.
-- Large variability in R-Squared values across different segments for the same model, suggesting inconsistent
-performance.
-
-### Strengths
-
-- Provides a visual representation of how well models perform over different time periods.
-- Helps identify time segments where models may need improvement or retraining.
-- Facilitates comparison between multiple models in a straightforward manner.
-
-### Limitations
-
-- Assumes datasets are provided as DataFrameDataset objects with the attributes `y`, `y_pred`, and
-`feature_columns`.
-- Requires that `dataset.y_pred(model)` returns predicted values for the model.
-- Assumes that both `y_true` and `y_pred` are pandas Series with datetime indices, which may not always be the case.
-- May not account for more nuanced temporal dependencies within the segments.
\ No newline at end of file
diff --git a/site/tests/model_validation/TokenDisparity.md b/site/tests/model_validation/TokenDisparity.md
deleted file mode 100644
index 8276bfcf14..0000000000
--- a/site/tests/model_validation/TokenDisparity.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# TokenDisparity
-
-Evaluates the token disparity between reference and generated texts, visualizing the results through histograms and
-bar charts, alongside compiling a comprehensive table of descriptive statistics for token counts.
-
-### Purpose
-
-The Token Disparity test aims to assess the difference in the number of tokens between reference texts and texts
-generated by the model. Understanding token disparity is essential for evaluating how well the generated content
-matches the expected length and richness of the reference texts.
-
-### Test Mechanism
-
-The test extracts true and predicted values from the dataset and model. It computes the number of tokens in each
-reference and generated text. The results are visualized using histograms and bar charts to display the
-distribution of token counts. Additionally, a table of descriptive statistics, including the mean, median, standard
-deviation, minimum, and maximum token counts, is compiled to provide a detailed summary of token usage.
-
-### Signs of High Risk
-
-- Significant disparity in token counts between reference and generated texts could indicate issues with text
-generation quality, such as verbosity or lack of detail.
-- Consistently low token counts in generated texts compared to references might suggest that the model is producing
-incomplete or overly concise outputs.
-
-### Strengths
-
-- Provides a simple yet effective evaluation of text length and token usage.
-- Visual representations (histograms and bar charts) make it easier to interpret the distribution and trends of
-token counts.
-- Descriptive statistics offer a concise summary of the model's performance in generating texts of appropriate
-length.
-
-### Limitations
-
-- Token counts alone do not provide a complete assessment of text quality and should be supplemented with other
-metrics and qualitative analysis.
\ No newline at end of file
diff --git a/site/tests/model_validation/ToxicityScore.md b/site/tests/model_validation/ToxicityScore.md
deleted file mode 100644
index 51446f1f8f..0000000000
--- a/site/tests/model_validation/ToxicityScore.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# ToxicityScore
-
-Assesses the toxicity levels of texts generated by NLP models to identify and mitigate harmful or offensive content.
-
-### Purpose
-
-The ToxicityScore metric is designed to evaluate the toxicity levels of texts generated by models. This is crucial
-for identifying and mitigating harmful or offensive content in machine-generated texts.
-
-### Test Mechanism
-
-The function starts by extracting the input, true, and predicted values from the provided dataset and model. The
-toxicity score is computed for each text using a preloaded `toxicity` evaluation tool. The scores are compiled into
-dataframes, and histograms and bar charts are generated to visualize the distribution of toxicity scores.
-Additionally, a table of descriptive statistics (mean, median, standard deviation, minimum, and maximum) is
-compiled for the toxicity scores, providing a comprehensive summary of the model's performance.
-
-### Signs of High Risk
-
-- Drastic spikes in toxicity scores indicate potentially toxic content within the associated text segment.
-- Persistent high toxicity scores across multiple texts may suggest systemic issues in the model's text generation
-process.
-
-### Strengths
-
-- Provides a clear evaluation of toxicity levels in generated texts, helping to ensure content safety and
-appropriateness.
-- Visual representations (histograms and bar charts) make it easier to interpret the distribution and trends of
-toxicity scores.
-- Descriptive statistics offer a concise summary of the model's performance in generating non-toxic texts.
-
-### Limitations
-
-- The accuracy of the toxicity scores is contingent upon the underlying `toxicity` tool.
-- The scores provide a broad overview but do not specify which portions or tokens of the text are responsible for
-high toxicity.
-- Supplementary, in-depth analysis might be needed for granular insights.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/ClusterDistribution.md b/site/tests/model_validation/embeddings/ClusterDistribution.md
deleted file mode 100644
index 2b1c85adfb..0000000000
--- a/site/tests/model_validation/embeddings/ClusterDistribution.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# ClusterDistribution
-
-Assesses the distribution of text embeddings across clusters produced by a model using KMeans clustering.
-
-### Purpose
-
-The purpose of this metric is to analyze the distribution of the clusters produced by a text embedding model. By
-dividing the text embeddings into different clusters, we can understand how the model is grouping or categorizing
-the text data. This aids in visualizing the organization and segregation of the data, thereby giving an
-understanding of how the model is processing the data.
-
-### Test Mechanism
-
-The metric applies the KMeans clustering algorithm on the predictions made by the model on the testing dataset and
-divides the text embeddings into a pre-defined number of clusters. By default, this number is set to 5 but can be
-customized as per requirements. The output of this test is a histogram plot that shows the distribution of
-embeddings across these clusters.
-
-### Signs of High Risk
-
-- If the embeddings are skewed towards one or two clusters, it indicates that the model is not effectively
-differentiating the various categories in the text data.
-- Uniform distribution of the embeddings across the clusters might show a lack of proper categorization.
-
-### Strengths
-
-- Great tool to visualize the text data categorization by the model.
-- Provides a way to assess if the model is distinguishing the categories effectively or not.
-- Flexible with the number of clusters, so it can be used on various types of data regardless of the number of
-categories.
-
-### Limitations
-
-- Success or failure of this test is based on visual interpretation, which might not be enough for making solid
-conclusions or determining the exact points of failure.
-- Assumes that the division of text embeddings across clusters should ideally be homogeneous, which might not
-always be the case depending on the nature of the text data.
-- Only applies to text embedding models, reducing its utility across various ML models.
-- Uses the KMeans clustering algorithm, which assumes that clusters are convex and isotropic, and may not work as
-intended if the true clusters in the data are not of this shape.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/CosineSimilarityComparison.md b/site/tests/model_validation/embeddings/CosineSimilarityComparison.md
deleted file mode 100644
index 0dce8ea17c..0000000000
--- a/site/tests/model_validation/embeddings/CosineSimilarityComparison.md
+++ /dev/null
@@ -1,44 +0,0 @@
-# CosineSimilarityComparison
-
-Assesses the similarity between embeddings generated by different models using Cosine Similarity, providing both
-statistical and visual insights.
-
-### Purpose
-
-The Cosine Similarity Comparison test aims to analyze and compare the embeddings produced by different models using
-Cosine Similarity. Cosine Similarity is a measure that calculates the cosine of the angle between two vectors,
-widely used to determine the alignment or similarity between high-dimensional vectors, such as text embeddings.
-This analysis helps understand how similar or different the models' predictions are in terms of embedding
-generation.
-
-### Test Mechanism
-
-The function starts by computing the embeddings for each model using the provided dataset. It then calculates the
-cosine similarity for every possible pair of models, generating a similarity matrix wherein each element represents
-the cosine similarity between two model embeddings. This matrix is flattened to create a bar chart for each model
-pair, visualizing their similarity distribution. Additionally, a table with descriptive statistics (mean, median,
-standard deviation, minimum, and maximum) for the similarities of each pair is compiled, referencing the compared
-models.
-
-### Signs of High Risk
-
-- A high concentration of cosine similarity values close to 1 could suggest that the models are producing very
-similar embeddings, indicating redundancy or lack of diversity in model training or design.
-- Very low similarity values near -1 highlight strong dissimilarity, suggesting models that are too divergent and
-possibly focusing on very different features of the data.
-
-### Strengths
-
-- Enables detailed comparisons between multiple models' embedding strategies through visual and statistical means.
-- Identifies models producing similar or dissimilar embeddings, useful for tasks requiring model diversity.
-- Provides quantitative and visual feedback on the degree of similarity, enhancing interpretability of model
-behavior in embedding spaces.
-
-### Limitations
-
-- The analysis is confined to the comparison of embeddings and does not assess the overall performance of the
-models in terms of their primary tasks (e.g., classification, regression).
-- Assumes that the models are suitable for generating comparable embeddings, which might not always be the case,
-especially across different types of models.
-- Interpretation of results is heavily dependent on the understanding of Cosine Similarity and the nature of
-high-dimensional embedding spaces.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/CosineSimilarityDistribution.md b/site/tests/model_validation/embeddings/CosineSimilarityDistribution.md
deleted file mode 100644
index 3cff6569fb..0000000000
--- a/site/tests/model_validation/embeddings/CosineSimilarityDistribution.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# CosineSimilarityDistribution
-
-Assesses the similarity between predicted text embeddings from a model using a Cosine Similarity distribution
-histogram.
-
-### Purpose
-
-This metric is used to assess the degree of similarity between the embeddings produced by a text embedding model
-using Cosine Similarity. Cosine Similarity is a measure that calculates the cosine of the angle between two
-vectors. This metric is predominantly used in text analysis — in this case, to determine how closely the predicted
-text embeddings align with one another.
-
-### Test Mechanism
-
-The implementation starts by computing the cosine similarity between the predicted values of the model's test
-dataset. These cosine similarity scores are then plotted on a histogram with 100 bins to visualize the distribution
-of the scores. The x-axis of the histogram represents the computed Cosine Similarity.
-
-### Signs of High Risk
-
-- If the cosine similarity scores cluster close to 1 or -1, it may indicate overfitting, as the model's predictions
-are almost perfectly aligned. This could suggest that the model is not generalizable.
-- A broad spread of cosine similarity scores across the histogram may indicate a potential issue with the model's
-ability to generate consistent embeddings.
-
-### Strengths
-
-- Provides a visual representation of the model's performance which is easily interpretable.
-- Can help identify patterns, trends, and outliers in the model's alignment of predicted text embeddings.
-- Useful in measuring the similarity between vectors in multi-dimensional space, important in the case of text
-embeddings.
-
-### Limitations
-
-- Only evaluates the similarity between outputs. It does not provide insight into the model's ability to correctly
-classify or predict.
-- Cosine similarity only considers the angle between vectors and does not consider their magnitude. This can lead
-to high similarity scores for vectors with vastly different magnitudes but a similar direction.
-- The output is sensitive to the choice of bin number for the histogram. Different bin numbers could give a
-slightly altered perspective on the distribution of cosine similarity.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/CosineSimilarityHeatmap.md b/site/tests/model_validation/embeddings/CosineSimilarityHeatmap.md
deleted file mode 100644
index a42b029b08..0000000000
--- a/site/tests/model_validation/embeddings/CosineSimilarityHeatmap.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# CosineSimilarityHeatmap
-
-Generates an interactive heatmap to visualize the cosine similarities among embeddings derived from a given model.
-
-### Purpose
-
-This function is designed to visually analyze the cosine similarities of embeddings from a specific model. Cosine
-similarity, a measure of the cosine of the angle between two vectors, aids in understanding the orientation and
-similarity of vectors in multi-dimensional space. This is particularly valuable for exploring text embeddings and
-their relative similarities among documents, words, or phrases.
-
-### Test Mechanism
-
-The function operates through a sequence of steps to visualize cosine similarities. Initially, embeddings are
-extracted for each dataset entry using the designated model. Following this, the function computes the pairwise
-cosine similarities among these embeddings. The computed similarities are then displayed in an interactive heatmap.
-
-### Signs of High Risk
-
-- High similarity values (close to 1) across the heatmap might not always be indicative of a risk; however, in
-contexts where diverse perspectives or features are desired, this could suggest a lack of diversity in the model's
-learning process or potential redundancy.
-- Similarly, low similarity values (close to -1) indicate strong dissimilarity, which could be beneficial in
-scenarios demanding diverse outputs. However, in cases where consistency is needed, these low values might
-highlight that the model is unable to capture a coherent set of features from the data, potentially leading to poor
-performance on related tasks.
-
-### Strengths
-
-- Provides an interactive and intuitive visual representation of embedding similarities, facilitating easy
-exploration and analysis.
-- Allows customization of visual elements such as title, axis labels, and color scale to suit specific analytical
-needs and preferences.
-
-### Limitations
-
-- As the number of embeddings increases, the effectiveness of the heatmap might diminish due to overcrowding,
-making it hard to discern detailed similarities.
-- The interpretation of the heatmap heavily relies on the appropriate setting of the color scale, as incorrect
-settings can lead to misleading visual interpretations.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/DescriptiveAnalytics.md b/site/tests/model_validation/embeddings/DescriptiveAnalytics.md
deleted file mode 100644
index 85d59bdab6..0000000000
--- a/site/tests/model_validation/embeddings/DescriptiveAnalytics.md
+++ /dev/null
@@ -1,43 +0,0 @@
-# DescriptiveAnalytics
-
-Evaluates statistical properties of text embeddings in an ML model via mean, median, and standard deviation
-histograms.
-
-### Purpose
-
-This metric, Descriptive Analytics for Text Embeddings Models, is employed to comprehend the fundamental properties
-and statistical characteristics of the embeddings in a Machine Learning model. It measures the dimensionality as
-well as the statistical distributions of embedding values including the mean, median, and standard deviation.
-
-### Test Mechanism
-
-The test mechanism involves using the 'DescriptiveAnalytics' class provided in the code, which includes the 'run'
-function. This function computes three statistical measures (mean, median, and standard deviation) of the test
-predictions from the model. It generates and caches three separate histograms showing the distribution of these
-measures. Each histogram visualizes the measure's distribution across the embedding values. Therefore, the method
-does not utilize a grading scale or threshold; it is fundamentally a visual data exploration tool.
-
-### Signs of High Risk
-
-- Abnormal patterns or values in the distributions of the statistical measures. This may include skewed
-distributions or a significant amount of outliers.
-- Very high standard deviation values which indicate a high degree of variability in the data.
-- The mean and median values are vastly different, suggesting skewed data.
-
-### Strengths
-
-- Provides a visual and quantifiable understanding of the embeddings' statistical characteristics, allowing for a
-comprehensive evaluation.
-- Facilitates the identification of irregular patterns and anomalous values that might indicate issues with the
-machine learning model.
-- It considers three key statistical measures (mean, median, and standard deviation), offering a more well-rounded
-understanding of the data.
-
-### Limitations
-
-- The method does not offer an explicit measure of model performance or accuracy, as it mainly focuses on
-understanding data properties.
-- It relies heavily on the visual interpretation of histograms. This could be subjective, and important patterns
-could be overlooked if not carefully reviewed.
-- While it displays valuable information about the central tendency and spread of data, it does not provide
-information about correlations between different embedding dimensions.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/EmbeddingsVisualization2D.md b/site/tests/model_validation/embeddings/EmbeddingsVisualization2D.md
deleted file mode 100644
index 60ab083418..0000000000
--- a/site/tests/model_validation/embeddings/EmbeddingsVisualization2D.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# EmbeddingsVisualization2D
-
-Visualizes 2D representation of text embeddings generated by a model using t-SNE technique.
-
-### Purpose
-
-The objective of this metric is to provide a visual 2D representation of the embeddings created by a text embedding
-machine learning model. By doing so, it aids in analyzing the embedding space created by the model and helps in
-understanding how the learned embeddings are distributed and how they relate to each other.
-
-### Test Mechanism
-
-This metric uses the t-Distributed Stochastic Neighbor Embedding (t-SNE) technique, which is a tool for visualizing
-high-dimensional data by reducing the dimensionality to 2. The perplexity parameter for t-SNE is set to the value
-provided by the user. If the input perplexity value is greater than the number of samples, the perplexity is
-adjusted to be one less than the number of samples. Following the reduction of dimensionality, a scatter plot is
-produced depicting each embedding as a data point in the visualized 2D plane.
-
-### Signs of High Risk
-
-- If the embeddings are highly concentrated in a specific region of the plane, it might indicate that the model is
-not learning diverse representations of the text.
-- Wide gaps or partitions in the visualization could suggest that the model is over-segmenting in the embedding
-space and may lead to poor generalization.
-
-### Strengths
-
-- Offers a powerful visual tool that can assist in understanding and interpreting high-dimensional embeddings,
-which could otherwise be difficult to visualize.
-- It is model-agnostic and can be used with any machine learning model that produces text embeddings.
-- t-SNE visualization helps in focusing on local structures and preserves the proximity of points that are close
-together in the original high-dimensional space.
-
-### Limitations
-
-- The reduction of high-dimensional data to 2D can result in loss of some information, which may lead to
-misinterpretation.
-- Due to its stochastic nature, t-SNE can produce different results when run multiple times with the same
-parameters, leading to potential inconsistency in interpretation.
-- It is designed for visual exploration and not for downstream tasks; that is, the 2D embeddings generated should
-not be directly used for further training or analysis.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/EuclideanDistanceComparison.md b/site/tests/model_validation/embeddings/EuclideanDistanceComparison.md
deleted file mode 100644
index 37bf509042..0000000000
--- a/site/tests/model_validation/embeddings/EuclideanDistanceComparison.md
+++ /dev/null
@@ -1,38 +0,0 @@
-# EuclideanDistanceComparison
-
-Assesses and visualizes the dissimilarity between model embeddings using Euclidean distance, providing insights
-into model behavior and potential redundancy or diversity.
-
-### Purpose
-
-The Euclidean Distance Comparison test aims to analyze and compare the embeddings produced by different models. By
-measuring the Euclidean distance between vectors in Euclidean space, it provides a metric to assess the magnitude
-of dissimilarity between embeddings created by different models. This is crucial for tasks that require models to
-produce distinct responses or feature separations.
-
-### Test Mechanism
-
-The test computes the embeddings for each model using the provided dataset and calculates the Euclidean distance
-for every possible pair of models. It generates a distance matrix where each element represents the Euclidean
-distance between two model embeddings. This matrix is then visualized through bar charts, showing the distance
-distribution for each model pair. Additionally, it compiles a table with descriptive statistics such as mean,
-median, standard deviation, minimum, and maximum distances for each model pair, including references to the
-compared models.
-
-### Signs of High Risk
-
-- Very high distance values could suggest that models are focusing on entirely different features or aspects of the
-data, which might be undesirable for ensemble methods or when a consensus is required.
-- Extremely low distances across different models might indicate redundancy, suggesting that models are not
-providing diverse enough perspectives on the data.
-
-### Strengths
-
-- Provides a clear and quantifiable measure of how different the embeddings from various models are.
-- Useful for identifying outlier models or those that behave significantly differently from others in a group.
-
-### Limitations
-
-- Euclidean distance can be sensitive to the scale of the data, meaning that preprocessing steps like normalization
-might be necessary to ensure meaningful comparisons.
-- Does not consider the orientation or angle between vectors, focusing purely on magnitude differences.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/EuclideanDistanceHeatmap.md b/site/tests/model_validation/embeddings/EuclideanDistanceHeatmap.md
deleted file mode 100644
index 6a0450fca1..0000000000
--- a/site/tests/model_validation/embeddings/EuclideanDistanceHeatmap.md
+++ /dev/null
@@ -1,38 +0,0 @@
-# EuclideanDistanceHeatmap
-
-Generates an interactive heatmap to visualize the Euclidean distances among embeddings derived from a given model.
-
-### Purpose
-
-This function visualizes the Euclidean distances between embeddings generated by a model, offering insights into
-the absolute differences between data points. Euclidean distance, a fundamental metric in data analysis, measures
-the straight-line distance between two points in Euclidean space. It is particularly useful for understanding
-spatial relationships and clustering tendencies in high-dimensional data.
-
-### Test Mechanism
-
-The function operates through a streamlined process: firstly, embeddings are extracted for each dataset entry using
-the specified model. Subsequently, it computes the pairwise Euclidean distances among these embeddings. The results
-are then visualized in an interactive heatmap format, where each cell's color intensity correlates with the
-distance magnitude between pairs of embeddings, providing a visual assessment of these distances.
-
-### Signs of High Risk
-
-- Uniformly low distances across the heatmap might suggest a lack of variability in the data or model overfitting,
-where the model fails to distinguish between distinct data points effectively.
-- Excessive variability in distances could indicate inconsistent data representation, potentially leading to
-unreliable model predictions.
-
-### Strengths
-
-- Provides a direct, intuitive visual representation of distances between embeddings, aiding in the detection of
-patterns or anomalies.
-- Allows customization of visual aspects such as the heatmap's title, axis labels, and color scale, adapting to
-various analytical needs.
-
-### Limitations
-
-- The interpretation of distances can be sensitive to the scale of data; normalization might be necessary for
-meaningful analysis.
-- Large datasets may lead to dense, cluttered heatmaps, making it difficult to discern individual distances,
-potentially requiring techniques like data sampling or dimensionality reduction for clearer visualization.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/PCAComponentsPairwisePlots.md b/site/tests/model_validation/embeddings/PCAComponentsPairwisePlots.md
deleted file mode 100644
index c13551b4a4..0000000000
--- a/site/tests/model_validation/embeddings/PCAComponentsPairwisePlots.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# PCAComponentsPairwisePlots
-
-Generates scatter plots for pairwise combinations of principal component analysis (PCA) components of model
-embeddings.
-
-### Purpose
-
-This function visualizes the principal components of embeddings derived from a specified model. Principal Component
-Analysis (PCA) is a statistical technique that emphasizes variation and uncovers strong patterns in a dataset. It
-transforms the original variables into new, uncorrelated variables (principal components) that maximize variance.
-
-### Test Mechanism
-
-The function follows a sequential process to visualize PCA components effectively. It starts by extracting
-embeddings from the dataset, utilizing the model specified by the user. These embeddings are then standardized to
-ensure zero mean and unit variance, which is crucial to prevent any single feature from dominating due to
-scale—this standardization is a critical preprocessing step for PCA. Following this, the function calculates the
-specified number of principal components. The core of the visualization process involves creating scatter plots for
-each pairwise combination of these principal components.
-
-### Signs of High Risk
-
-- If the principal components do not account for a significant portion of the variance, it may suggest that PCA is
-not capturing the essential structures of the data.
-- Similarity in scatter plots across different pairs of components could indicate redundancy in the components,
-suggesting that fewer dimensions might be sufficient to represent the data.
-
-### Strengths
-
-- Enables a simplified visualization of multivariate data, helping to identify patterns across many variables
-effectively.
-- Provides a clear depiction of the directions of maximum variance in the data, which is valuable for feature
-selection and dimensionality reduction.
-
-### Limitations
-
-- PCA's effectiveness hinges on the scaling of the variables; improper standardization can lead to misleading
-interpretations.
-- The interpretation of principal components can be challenging, especially if they capture less significant
-variances or are difficult to relate back to the original features.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/StabilityAnalysisKeyword.md b/site/tests/model_validation/embeddings/StabilityAnalysisKeyword.md
deleted file mode 100644
index bcfb71d40b..0000000000
--- a/site/tests/model_validation/embeddings/StabilityAnalysisKeyword.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# StabilityAnalysisKeyword
-
-Evaluates robustness of embedding models to keyword swaps in the test dataset.
-
-### Purpose
-
-This test metric is used to evaluate the robustness of text embedding machine learning models to keyword swaps. A
-keyword swap is a scenario where instances of certain specified keywords in the dataset are replaced with other
-specified words (usually synonyms). The purpose of this metric is to ensure that these models maintain performance
-stability even when the input data slightly deviates, imitating real-world variability.
-
-### Test Mechanism
-
-The test mechanism involves a perturbation of the dataset used in testing the model. Each instance of a specific
-word found in the dataset is replaced with the corresponding word as specified in a 'keyword_dict' mapping. The
-model is then re-run with the perturbed dataset and the results are compared with the non-perturbed dataset. This
-comparison quantifies the extent to which keyword swaps impact the model's performance.
-
-### Signs of High Risk
-
-- A significant drop in model performance after keyword swaps indicates a high risk of model failure in real-world
-scenarios.
-- Model results that rely heavily on specific word choices instead of capturing the context properly.
-
-### Strengths
-
-- This test provides a way to measure model robustness to small changes in input data, which reinforces its
-applicability and reliability in real-world scenarios.
-- This test encourages a model to understand the context of a sentence rather than memorizing specific words.
-- It helps to detect overfitting - a situation where a model performs well on training data but poorly on new or
-slightly altered data.
-
-### Limitations
-
-- It may not fully address semantic differences that can be introduced through keyword swaps. That is, the
-replacement words might not preserve the exact semantic meaning of the original words.
-- It only tests for changes in keywords (word-level alterations) and might not expose model limitations related to
-structural data changes.
-- It assumes that the provided 'keyword_dict' is an accurate representation of possible real-world variations,
-which might not always be the case.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/StabilityAnalysisRandomNoise.md b/site/tests/model_validation/embeddings/StabilityAnalysisRandomNoise.md
deleted file mode 100644
index 59cc0b729c..0000000000
--- a/site/tests/model_validation/embeddings/StabilityAnalysisRandomNoise.md
+++ /dev/null
@@ -1,45 +0,0 @@
-# StabilityAnalysisRandomNoise
-
-Assesses the robustness of text embeddings models to random noise introduced via text perturbations.
-
-### Purpose
-
-The purpose of this test is to evaluate the robustness of a text embeddings model to random noise. It introduces
-perturbations such as swapping adjacent words, inserting typos, deleting words, or inserting random words within
-the text to determine how well the model performs under such noisy conditions.
-
-### Test Mechanism
-
-The test applies a series of pre-defined random perturbations to the text data. These perturbations include:
-
-- Swapping two adjacent words using the `random_swap` function.
-- Introducing a typo in a word using the `introduce_typo` function.
-- Deleting a word using the `random_deletion` function.
-- Inserting a random word at a random position using the `random_insertion` function.
-
-A probability parameter dictates the likelihood of each perturbation being applied to the words in the text. The
-text is initially tokenized into words, and selected perturbations are applied based on this probability.
-
-### Signs of High Risk
-
-- High error rates in model predictions or classifications after the introduction of random noise.
-- Greater sensitivity to specific types of noise, such as typographical errors or word deletions.
-- Significant change in loss function or accuracy metrics.
-- Inconsistent model outputs for slightly perturbed inputs.
-
-### Strengths
-
-- Measures model robustness against noise, reflecting real-world scenarios where data may contain errors or
-inconsistencies.
-- Easy to implement with adjustable perturbation severity through a probability parameter.
-- Identifies model sensitivity to specific types of noise, offering insights for model improvement.
-- Useful for testing models designed to handle text data.
-
-### Limitations
-
-- May be ineffective for models that are inherently resistant to noise or designed to handle such perturbations.
-- Pseudo-randomness may not accurately represent the real-world distribution of noise or typographical errors.
-- Highly dependent on the probability parameter, requiring fine-tuning to achieve an optimal balance.
-- Only assesses performance against noise in input data, not the ability to capture complex language structures or
-semantics.
-- Does not guarantee model performance on new, unseen, real-world data beyond the generated noisy test data.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/StabilityAnalysisSynonyms.md b/site/tests/model_validation/embeddings/StabilityAnalysisSynonyms.md
deleted file mode 100644
index 08ccf53daf..0000000000
--- a/site/tests/model_validation/embeddings/StabilityAnalysisSynonyms.md
+++ /dev/null
@@ -1,44 +0,0 @@
-# StabilityAnalysisSynonyms
-
-Evaluates the stability of text embeddings models when words in test data are replaced by their synonyms randomly.
-
-### Purpose
-
-The Stability Analysis Synonyms test is designed to gauge the robustness and stability of an embeddings model on
-text-based data. The test does so by introducing random word changes through replacing words in the test dataset
-with their synonyms.
-
-### Test Mechanism
-
-This test utilizes WordNet to find synonyms for a given word present in the test data, replacing the original word
-with this synonym based on a given probability. The probability is defined as a parameter and determines the
-likelihood of swapping a word with its synonym. By default, this is set at 0.02 but can be adjusted based on
-specific test requirements. This methodology enables an evaluation of how such replacements can affect the model's
-performance.
-
-### Signs of High Risk
-
-- The model's performance or predictions change significantly after swapping words with their synonyms.
-- The model shows high sensitivity to small perturbations, like modifying the data with synonyms.
-- The embeddings model fails to identify similar meanings between the original words and their synonyms, indicating
-it lacks semantic understanding.
-
-### Strengths
-
-- The test is flexible in its application. The 'probability' parameter can be adjusted based on the degree of
-synonym swapping required.
-- Efficient in gauging a model's sensitivity or robustness with respect to small changes in input data.
-- Provides insights into the semantic understanding of the model as it monitors the impact of swapping words with
-synonyms.
-
-### Limitations
-
-- The ability to perturb data is reliant on the availability of synonyms, limiting its efficiency.
-- It assumes that the synonyms provided by WordNet are accurate and interchangeable in all contexts, which may not
-always be the case given the intricacies of language and context-specific meanings.
-- It does not consider the influence of multi-word expressions or phrases, as synonyms are considered at the word
-level only.
-- Relies solely on the WordNet corpus for synonyms, limiting its effectiveness for specialized or domain-specific
-jargon not included in that corpus.
-- Does not consider the semantic role of the words in the sentence, meaning the swapped synonym could potentially
-alter the overall meaning of the sentence, leading to a false perception of the model's stability.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/StabilityAnalysisTranslation.md b/site/tests/model_validation/embeddings/StabilityAnalysisTranslation.md
deleted file mode 100644
index 72bddddae0..0000000000
--- a/site/tests/model_validation/embeddings/StabilityAnalysisTranslation.md
+++ /dev/null
@@ -1,48 +0,0 @@
-# StabilityAnalysisTranslation
-
-Evaluates robustness of text embeddings models to noise introduced by translating the original text to another
-language and back.
-
-### Purpose
-
-The purpose of this test is to assess the robustness of text embeddings models under the influence of noise. The
-noise in this scenario is introduced by translating the original text into another language and then translating it
-back to the original language. Any significant changes in the model's output between the original and
-translated-then-retranslated texts can be indicators of the model's lack of robustness to noise.
-
-### Test Mechanism
-
-The test mechanism involves several steps:
-
-1. Initialize the Marian tokenizer and model for both source and target languages.
-2. Translate the data from the source language to the target language.
-3. Translate the translated data back into the source language.
-4. Compare the original data with the data that has been translated and back-translated to observe any significant
-changes.
-
-The threshold of this test output would then be determined by the tolerance level of the model to these potentially
-noisy instances.
-
-### Signs of High Risk
-
-- Large discrepancies between the original and double-translated text, indicating a high level of risk and a lack
-of robustness to noise.
-- Translations that do not closely maintain the meaning and context of the original language, suggesting inadequate
-robustness against this type of noise.
-
-### Strengths
-
-- An effective way to assess the model's sensitivity and robustness to language translation noise.
-- Provides a realistic scenario which the model might encounter in real-world applications by using translation to
-introduce noise.
-- Tests the model's capacity to maintain semantic meaning under translational perturbations, extending beyond
-simple lexical changes.
-
-### Limitations
-
-- Relies solely on translation-related noise, potentially overlooking other types of noise such as typographical
-errors, grammatical mistakes, or random word substitutions.
-- Inaccuracies or discrepancies in the translation process itself might influence the resultant robustness score
-rather than reflect an inherent failing of the model.
-- Predominantly language-dependent, thus might not fully capture robustness for languages with fewer resources or
-those highly dissimilar to the source language.
\ No newline at end of file
diff --git a/site/tests/model_validation/embeddings/TSNEComponentsPairwisePlots.md b/site/tests/model_validation/embeddings/TSNEComponentsPairwisePlots.md
deleted file mode 100644
index 1b6db10be8..0000000000
--- a/site/tests/model_validation/embeddings/TSNEComponentsPairwisePlots.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# TSNEComponentsPairwisePlots
-
-Creates scatter plots for pairwise combinations of t-SNE components to visualize embeddings and highlight potential
-clustering structures.
-
-### Purpose
-
-This function creates scatter plots for each pairwise combination of t-SNE components derived from model
-embeddings. t-SNE (t-Distributed Stochastic Neighbor Embedding) is a machine learning algorithm for dimensionality
-reduction that is particularly well-suited for the visualization of high-dimensional datasets.
-
-### Test Mechanism
-
-The function begins by extracting embeddings from the provided dataset using the specified model. These embeddings
-are then standardized to ensure that each dimension contributes equally to the distance computation. Following
-this, the t-SNE algorithm is applied to reduce the dimensionality of the data, with the number of components
-specified by the user. The results are plotted using Plotly, creating scatter plots for each unique pair of
-components if more than one component is specified.
-
-### Signs of High Risk
-
-- If the scatter plots show overlapping clusters or indistinct groupings, it might suggest that the t-SNE
-parameters (such as perplexity) are not optimally set for the given data, or the data itself does not exhibit
-clear, separable clusters.
-- Similar plots across different pairs of components could indicate redundancy in the components generated by
-t-SNE, suggesting that fewer dimensions might be sufficient to represent the data's structure.
-
-### Strengths
-
-- Provides a visual exploration tool for high-dimensional data, simplifying the detection of patterns and clusters
-which are not apparent in higher dimensions.
-- Interactive plots generated by Plotly enhance user engagement and allow for a deeper dive into specific areas of
-the plot, aiding in detailed data analysis.
-
-### Limitations
-
-- The effectiveness of t-SNE is highly dependent on the choice of parameters like perplexity and the number of
-components, which might require tuning and experimentation for optimal results.
-- t-SNE visualizations can be misleading if interpreted without considering the stochastic nature of the algorithm;
-two runs with the same parameters might yield different visual outputs, necessitating multiple runs for a
-consistent interpretation.
\ No newline at end of file
diff --git a/site/tests/model_validation/ragas/AnswerCorrectness.md b/site/tests/model_validation/ragas/AnswerCorrectness.md
deleted file mode 100644
index 33d6b72aa2..0000000000
--- a/site/tests/model_validation/ragas/AnswerCorrectness.md
+++ /dev/null
@@ -1,68 +0,0 @@
-# AnswerCorrectness
-
-Evaluates the correctness of answers in a dataset with respect to the provided ground
-truths and visualizes the results in a histogram.
-
-The assessment of Answer Correctness involves gauging the accuracy of the generated
-answer when compared to the ground truth. This evaluation relies on the `ground truth`
-and the `answer`, with scores ranging from 0 to 1. A higher score indicates a closer
-alignment between the generated answer and the ground truth, signifying better
-correctness.
-
-Answer correctness encompasses two critical aspects: semantic similarity between the
-generated answer and the ground truth, as well as factual similarity. These aspects
-are combined using a weighted scheme to formulate the answer correctness score. Users
-also have the option to employ a `threshold` value to round the resulting score to
-a binary value (0 or 1) based on the threshold.
-
-Factual correctness quantifies the factual overlap between the generated answer and
-the ground truth answer. This is done using the concepts of:
-
-- TP (True Positive): Facts or statements that are present in both the ground truth
-and the generated answer.
-- FP (False Positive): Facts or statements that are present in the generated answer
-but not in the ground truth.
-- FN (False Negative): Facts or statements that are present in the ground truth but
-not in the generated answer.
-
-### Configuring Columns
-
-This metric requires specific columns to be present in the dataset:
-
-- `user_input` (str): The text prompt or query that was input into the model.
-- `response` (str): The text response generated by the model.
-- `reference` (str): The ground truth answer that the generated answer is compared
-against.
-
-If the above data is not in the appropriate column, you can specify different column
-names for these fields using the parameters `user_input_column`, `response_column`, and
-`reference_column`.
-
-For example, if your dataset has this data stored in different columns, you can
-pass the following parameters:
-```python
-params = {
-    "user_input_column": "input_text",
-    "response_column": "output_text",
-    "reference_column": "human_answer",
-}
-```
-
-If answer and contexts are stored as a dictionary in another column, specify the
-column and key like this:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "response_column": f"{pred_col}.generated_answer",
-    "reference_column": f"{pred_col}.contexts",
-}
-```
-
-For more complex data structures, you can use a function to extract the answers:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "response_column": lambda row: "\n\n".join(row[pred_col]["messages"]),
-    "reference_column": lambda row: [row[pred_col]["context_message"]],
-}
-```
\ No newline at end of file
diff --git a/site/tests/model_validation/ragas/AspectCritic.md b/site/tests/model_validation/ragas/AspectCritic.md
deleted file mode 100644
index e2f0bda08c..0000000000
--- a/site/tests/model_validation/ragas/AspectCritic.md
+++ /dev/null
@@ -1,71 +0,0 @@
-# AspectCritic
-
-Evaluates generations against the following aspects: harmfulness, maliciousness,
-coherence, correctness, and conciseness.
-
-### Overview:
-
-This is designed to assess submissions against predefined and user-defined "aspects".
-For each aspect, a judge LLM is prompted to critique a piece of generated text based
-on a description of the aspect. The output of this evaluation is a binary (0/1 = yes/no)
-score that indicates whether the submission aligns with the defined aspect or not.
-
-### Inputs and Outputs:
-
-The input to this metric is a dataset containing the input `user_input` (prompt to the LLM)
-and the `response` (text generated by the LLM). Any retrieved `retrieved_contexts` can also be
-included to enhance the evaluation.
-
-The `user_input_column`, `response_column`, and `retrieved_contexts_column` parameters can be used to
-specify the names or sources for the data that this metric will evaluate if the dataset
-does not contain the required columns `user_input`, `response`, and `retrieved_contexts`.
-
-By default, the aspects evaluated are harmfulness, maliciousness, coherence,
-correctness, and conciseness. To change the aspects evaluated, the `aspects` parameter
-can be set to a list containing any of these aspects.
-
-To add custom aspects, the `additional_aspects` parameter can be passed as a list
-of tuples where each tuple contains the aspect name and a description of the aspect
-that the judge LLM will use to critique the submission.
-
-The output of this metric is a table of scores for each aspect where the aspect score
-is the number of "yes" scores divided by the total number of submissions:
-$$
-\text{aspect score} = \frac{\text{number of "yes" scores}}{\text{total number of submissions}}
-$$
-
-### Examples:
-
-- **Mapping to Required Columns:** If the dataset does not contain the columns required to run this
-metric (i.e., `user_input`, `response`, and `retrieved_contexts`), map them with the column parameters:
-
-```python
-pred_col = my_vm_dataset.prediction_column(my_vm_model)
-run_test(
-    "validmind.model_validation.ragas.AspectCritic",
-    inputs={"dataset": my_vm_dataset},
-    params={
-        "user_input_column": "input_prompt",
-        "response_column": f"{pred_col}.llm_output",
-        "retrieved_contexts_column": "retrieval_model_prediction",
-    },
-)
-```
-
-- **Custom Aspects:** To evaluate custom aspects, the `additional_aspects` parameter can
-be set to a list of tuples where each tuple contains the aspect name and a description
-of the aspect that the judge LLM will use to critique the submission. For example, to
-evaluate whether the LLM-generated text has a "professional tone", the `additional_aspects`
-parameter can be set like this:
-
-```python
-run_test(
-    "validmind.model_validation.ragas.AspectCritic",
-    inputs={"dataset": my_vm_dataset},
-    params={
-        "additional_aspects": [
-            ("professionalism", "Does the text have a professional tone?"),
-        ],
-    },
-)
-```
\ No newline at end of file
diff --git a/site/tests/model_validation/ragas/ContextEntityRecall.md b/site/tests/model_validation/ragas/ContextEntityRecall.md
deleted file mode 100644
index c882d128fe..0000000000
--- a/site/tests/model_validation/ragas/ContextEntityRecall.md
+++ /dev/null
@@ -1,65 +0,0 @@
-# ContextEntityRecall
-
-Evaluates the context entity recall for dataset entries and visualizes the results.
-
-### Overview
-
-This metric gives the measure of recall of the retrieved context, based on the
-number of entities present in both `reference` and `retrieved_contexts` relative to the
-number of entities present in the `reference` alone. Simply put, it is a measure
-of what fraction of entities are recalled from `reference`. This metric is
-useful in fact-based use cases like tourism help desk, historical QA, etc. This
-metric can help evaluate the retrieval mechanism for entities, based on comparison
-with entities present in `reference`, because in cases where entities matter,
-we need the `retrieved_contexts` which cover them.
-
-### Formula
-
-To compute this metric, we use two sets, $GE$ and $CE$, representing the set of
-entities present in `reference` and set of entities present in `retrieved_contexts`
-respectively. We then take the number of elements in intersection of these sets and
-divide it by the number of elements present in the $GE$, given by the formula:
-
-$$
-\text{context entity recall} = \frac{| CE \cap GE |}{| GE |}
-$$
-
-### Configuring Columns
-
-This metric requires the following columns in your dataset:
-
-- `retrieved_contexts` (List[str]): A list of text contexts which will be evaluated to make
-sure if they contain the entities present in the `reference`.
-- `reference` (str): The ground truth text from which the entities will be
-extracted and compared with the entities in the `retrieved_contexts`.
-
-If the above data is not in the appropriate column, you can specify different column
-names for these fields using the parameters `retrieved_contexts_column`, and `reference_column`.
-
-For example, if your dataset has this data stored in different columns, you can
-pass the following parameters:
-```python
-{
-    "retrieved_contexts_column": "context_info",
-    "reference_column": "my_ground_truth_col",
-}
-```
-
-If the data is stored as a dictionary in another column, specify the column and key
-like this:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "retrieved_contexts_column": f"{pred_col}.contexts",
-    "reference_column": "my_ground_truth_col",
-}
-```
-
-For more complex situations, you can use a function to extract the data:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "retrieved_contexts_column": lambda row: [row[pred_col]["context_message"]],
-    "reference_column": "my_ground_truth_col",
-}
-```
\ No newline at end of file
diff --git a/site/tests/model_validation/ragas/ContextPrecision.md b/site/tests/model_validation/ragas/ContextPrecision.md
deleted file mode 100644
index d316c2e5b2..0000000000
--- a/site/tests/model_validation/ragas/ContextPrecision.md
+++ /dev/null
@@ -1,59 +0,0 @@
-# ContextPrecision
-
-Context Precision is a metric that evaluates whether all of the ground-truth
-relevant items present in the contexts are ranked higher or not. Ideally all the
-relevant chunks must appear at the top ranks. This metric is computed using the
-`user_input`, `reference` and the `retrieved_contexts`, with values ranging between 0 and 1,
-where higher scores indicate better precision.
-
-$$
-\text{Context Precision@K} = \frac{\sum_{k=1}^{K} \left( \text{Precision@k} \times v_k \right)}{\text{Total number of relevant items in the top } K \text{ results}}
-$$
-$$
-\text{Precision@k} = {\text{true positives@k} \over  (\text{true positives@k} + \text{false positives@k})}
-$$
-
-Where $K$ is the total number of chunks in contexts and $v_k \in \{0, 1\}$ is the
-relevance indicator at rank $k$.
-
-### Configuring Columns
-
-This metric requires the following columns in your dataset:
-
-- `user_input` (str): The text query that was input into the model.
-- `retrieved_contexts` (List[str]): A list of text contexts which are retrieved and which
-will be evaluated to make sure they contain relevant info in the correct order.
-- `reference` (str): The ground truth text to compare with the retrieved contexts.
-
-If the above data is not in the appropriate column, you can specify different column
-names for these fields using the parameters `user_input_column`, `retrieved_contexts_column`
-and `reference_column`.
-
-For example, if your dataset has this data stored in different columns, you can
-pass the following parameters:
-```python
-{
-    "user_input_column": "question",
-    "retrieved_contexts_column": "context_info",
-    "reference_column": "my_ground_truth_col",
-}
-```
-
-If the data is stored as a dictionary in another column, specify the column and key
-like this:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "retrieved_contexts_column": f"{pred_col}.retrieved_contexts",
-    "reference_column": "my_ground_truth_col",
-}
-```
-
-For more complex situations, you can use a function to extract the data:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "retrieved_contexts_column": lambda x: [x[pred_col]["context_message"]],
-    "reference_column": "my_ground_truth_col",
-}
-```
\ No newline at end of file
diff --git a/site/tests/model_validation/ragas/ContextPrecisionWithoutReference.md b/site/tests/model_validation/ragas/ContextPrecisionWithoutReference.md
deleted file mode 100644
index 78d1bb7929..0000000000
--- a/site/tests/model_validation/ragas/ContextPrecisionWithoutReference.md
+++ /dev/null
@@ -1,53 +0,0 @@
-# ContextPrecisionWithoutReference
-
-Context Precision Without Reference is a metric used to evaluate the relevance of
-retrieved contexts compared to the expected response for a given user input. This
-metric compares each retrieved context (or chunk) with the response to estimate
-if the retrieved context is relevant.
-
-This metric can be used when you have both retrieved contexts and associated
-reference contexts for a `user_input`. Using a Language Model (LLM), it determines
-the relevance of each retrieved context by comparing it directly with the response,
-producing scores between 0 and 1, where higher scores indicate better precision in
-retrieving relevant contexts.
-
-### Configuring Columns
-
-This metric requires the following columns in your dataset:
-
-- `user_input` (str): The user query or input to the model.
-- `retrieved_contexts` (List[str]): A list of text contexts retrieved for the
-user input that will be evaluated for relevance.
-- `response` (str): The model’s output response associated with the user input.
-
-If your dataset stores this data in different columns, you can specify alternate
-column names using the parameters `user_input_column`, `retrieved_contexts_column`,
-and `response_column`.
-
-Example configuration for custom column names:
-```python
-{
-    "user_input_column": "user_query",
-    "retrieved_contexts_column": "retrieved_texts",
-    "response_column": "model_output",
-}
-```
-
-For datasets with data stored as dictionaries in other columns, specify the
-column and key like so:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "retrieved_contexts_column": f"{pred_col}.contexts",
-    "response_column": f"{pred_col}.response",
-}
-```
-
-Alternatively, for complex situations, you may use a function to extract data:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "retrieved_contexts_column": lambda x: [x[pred_col]["context_message"]],
-    "response_column": "my_response_col",
-}
-```
\ No newline at end of file
diff --git a/site/tests/model_validation/ragas/ContextRecall.md b/site/tests/model_validation/ragas/ContextRecall.md
deleted file mode 100644
index 4d97da3059..0000000000
--- a/site/tests/model_validation/ragas/ContextRecall.md
+++ /dev/null
@@ -1,59 +0,0 @@
-# ContextRecall
-
-Context recall measures the extent to which the retrieved context aligns with the
-annotated answer, treated as the ground truth. It is computed based on the
-`ground truth` and the `retrieved context`, and the values range between 0 and 1, with higher
-values indicating better performance.
-
-To estimate context recall from the ground truth answer, each sentence in the ground
-truth answer is analyzed to determine whether it can be attributed to the retrieved
-context or not. In an ideal scenario, all sentences in the ground truth answer
-should be attributable to the retrieved context.
-
-
-The formula for calculating context recall is as follows:
-$$
-\text{context recall} = {|\text{GT sentences that can be attributed to context}| \over |\text{Number of sentences in GT}|}
-$$
-
-### Configuring Columns
-
-This metric requires the following columns in your dataset:
-
-- `user_input` (str): The text query that was input into the model.
-- `retrieved_contexts` (List[str]): A list of text contexts which are retrieved and
-which will be evaluated to make sure they contain all items in the ground truth.
-- `reference` (str): The ground truth text to compare with the retrieved contexts.
-
-If the above data is not in the appropriate column, you can specify different column
-names for these fields using the parameters `user_input_column`,
-`retrieved_contexts_column` and `reference_column`.
-
-For example, if your dataset has this data stored in different columns, you can
-pass the following parameters:
-```python
-{
-    "user_input_column": "user_input",
-    "retrieved_contexts_column": "retrieved_contexts",
-    "reference_column": "reference",
-}
-```
-
-If the data is stored as a dictionary in another column, specify the column and key
-like this:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "retrieved_contexts_column": f"{pred_col}.retrieved_contexts",
-    "reference_column": f"{pred_col}.reference",
-}
-```
-
-For more complex situations, you can use a function to extract the data:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "retrieved_contexts_column": lambda x: [x[pred_col]["retrieved_contexts"]],
-    "reference_column": "my_ground_truth_col",
-}
-```
\ No newline at end of file
diff --git a/site/tests/model_validation/ragas/Faithfulness.md b/site/tests/model_validation/ragas/Faithfulness.md
deleted file mode 100644
index 8191125106..0000000000
--- a/site/tests/model_validation/ragas/Faithfulness.md
+++ /dev/null
@@ -1,64 +0,0 @@
-# Faithfulness
-
-Evaluates the faithfulness of the generated answers with respect to retrieved contexts.
-
-This metric uses a judge LLM to measure the factual consistency of the generated answer
-against the given context(s). It is calculated using the generated text `answer` from
-the LLM and the retrieved `contexts` which come from some RAG process. The score is
-a value between 0 and 1, where a higher score indicates that the generated answer is
-more faithful to the given context(s).
-
-The generated answer is regarded as faithful if all the claims that are made in the
-answer can be inferred from the given context. To calculate this a set of claims from
-the generated answer is first identified. Then each one of these claims is cross-checked
-with the given context to determine whether it can be inferred from that context. The
-faithfulness score formula is as follows:
-
-$$
-\text{Faithfulness score} = {|\text{Number of claims in the generated answer that can be inferred from given context}| \over |\text{Total number of claims in the generated answer}|}
-$$
-
-### Configuring Columns
-
-This metric requires the following columns in your dataset:
-
-- `user_input` (str): The user input that the model is responding to.
-- `retrieved_contexts` (List[str]): A list of text contexts which are retrieved to generate
-the answer.
-- `response` (str): The response generated by the model which will be evaluated for
-faithfulness against the given contexts.
-
-If the above data is not in the appropriate column, you can specify different column
-names for these fields using the parameters `retrieved_contexts_column` and
-`response_column`.
-
-For example, if your dataset has this data stored in different columns, you can
-pass the following parameters:
-```python
-{
-    "retrieved_contexts_column": "context_info",
-    "response_column": "my_answer_col",
-    "user_input_column": "user_input",
-}
-```
-
-If the data is stored as a dictionary in another column, specify the column and key
-like this:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "retrieved_contexts_column": f"{pred_col}.retrieved_contexts",
-    "response_column": f"{pred_col}.response",
-    "user_input_column": "user_input",
-}
-```
-
-For more complex situations, you can use a function to extract the data:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "retrieved_contexts_column": lambda row: [row[pred_col]["context_message"]],
-    "response_column": lambda row: "\n\n".join(row[pred_col]["messages"]),
-    "user_input_column": "user_input",
-}
-```
\ No newline at end of file
diff --git a/site/tests/model_validation/ragas/NoiseSensitivity.md b/site/tests/model_validation/ragas/NoiseSensitivity.md
deleted file mode 100644
index 0356680ec5..0000000000
--- a/site/tests/model_validation/ragas/NoiseSensitivity.md
+++ /dev/null
@@ -1,86 +0,0 @@
-# NoiseSensitivity
-
-Assesses the sensitivity of a Large Language Model (LLM) to noise in retrieved context by measuring how often it
-generates incorrect responses.
-
-### Purpose
-
-The Noise Sensitivity test aims to measure how sensitive an LLM is to irrelevant or noisy information within the
-contextual data used to generate its responses. A lower noise sensitivity score suggests better model robustness in
-generating accurate answers from given contexts.
-
-### Test Mechanism
-
-This test evaluates the model's answers by comparing the claims made in the generated response against the ground
-truth and the retrieved context. The noise sensitivity score is calculated as:
-
-$$
-\text{noise sensitivity} = {|\text{Number of incorrect claims in answer}| \over |\text{Number of total claims in answer}|}
-$$
-
-The formula computes the fraction of incorrect claims to the total claims in the answer, using a dataset where
-'answer', 'context', and 'ground_truth' columns are specified.
-
-#### Configuring Columns
-
-This metric requires the following columns in your dataset:
-
-- `retrieved_contexts` (List[str]): A list of text contexts which are retrieved to generate
-the answer.
-- `response` (str): The response generated by the model.
-- `reference` (str): The "correct" answer to the question.
-- `user_input` (str): The user input question.
-
-If the above data is not in the appropriate column, you can specify different column names for these fields using the parameters `retrieved_contexts_column`, `response_column`, `reference_column`, and `user_input_column`.
-
-For example, if your dataset has this data stored in different columns, you can
-pass the following parameters:
-```python
-{
-    "retrieved_contexts_column": "context_info",
-    "response_column": "my_answer_col",
-    "reference_column": "reference",
-    "user_input_column": "user_input",
-}
-```
-
-If the data is stored as a dictionary in another column, specify the column and key
-like this:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "reference_column": "reference",
-    "retrieved_contexts_column": f"{pred_col}.retrieved_contexts",
-    "response_column": f"{pred_col}.response",
-    "user_input_column": "user_input",
-}
-```
-
-For more complex situations, you can use a function to extract the data:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "reference_column": "reference",
-    "retrieved_contexts_column": lambda row: [row[pred_col]["context_message"]],
-    "response_column": lambda row: "\n\n".join(row[pred_col]["messages"]),
-    "user_input_column": "user_input",
-}
-```
-### Signs of High Risk
-
-- High noise sensitivity scores across multiple samples.
-- Significant deviation between mean and median noise sensitivity scores.
-- High standard deviation indicating inconsistency in the model's performance.
-
-### Strengths
-
-- Provides a quantitative measure of how well the LLM handles noisy or irrelevant context.
-- Easy integration and configuration using column parameters.
-- Utilizes both histogram and box plot visualizations to analyze score distribution.
-
-### Limitations
-
-- Requires accurate ground truth that aligns with the generated answers.
-- Assumes the context provided is sufficiently granular to assess noise sensitivity.
-- Primarily applicable to tasks like text QA, text generation, and text summarization where contextual relevance is
-critical.
\ No newline at end of file
diff --git a/site/tests/model_validation/ragas/ResponseRelevancy.md b/site/tests/model_validation/ragas/ResponseRelevancy.md
deleted file mode 100644
index 4a645bec8e..0000000000
--- a/site/tests/model_validation/ragas/ResponseRelevancy.md
+++ /dev/null
@@ -1,72 +0,0 @@
-# ResponseRelevancy
-
-Assesses how pertinent the generated answer is to the given prompt.
-
-The evaluation metric, Response Relevancy, focuses on assessing how pertinent the
-generated answer is to the given prompt. A lower score is assigned to answers that
-are incomplete or contain redundant information and higher scores indicate better
-relevancy. This metric is computed using the `user_input`, the `retrieved_contexts`
-and the `response`.
-
-The Response Relevancy is defined as the mean cosine similarity of the original
-`user_input` to a number of artificial questions, which are generated (reverse-engineered)
-based on the `response`:
-
-$$
-\text{answer relevancy} = \frac{1}{N} \sum_{i=1}^{N} \cos(E_{g_i}, E_o)
-$$
-$$
-\text{answer relevancy} = \frac{1}{N} \sum_{i=1}^{N} \frac{E_{g_i} \cdot E_o}{\|E_{g_i}\|\|E_o\|}
-$$
-
-Where:
-- $E_{g_i}$ is the embedding of the generated question $i$.
-- $E_o$ is the embedding of the original question.
-- $N$ is the number of generated questions - 3 by default.
-
-**Note**: *This is a reference-free metric, meaning that it does not require a
-`ground_truth` answer to compare against. A similar metric that does evaluate the
-correctness of a generated answer with respect to a `ground_truth` answer is
-`validmind.model_validation.ragas.AnswerCorrectness`.*
-
-### Configuring Columns
-
-This metric requires the following columns in your dataset:
-
-- `user_input` (str): The text query that was input into the model.
-- `retrieved_contexts` (List[str]): Any contextual information retrieved by the model
-before generating an answer.
-- `response` (str): The response generated by the model.
-
-If the above data is not in the appropriate column, you can specify different column
-names for these fields using the parameters `user_input_column`, `response_column`, and
-`retrieved_contexts_column`.
-
-For example, if your dataset has this data stored in different columns, you can
-pass the following parameters:
-```python
-params = {
-    "user_input_column": "input_text",
-    "response_column": "output_text",
-    "retrieved_contexts_column": "context_info",
-}
-```
-
-If answer and contexts are stored as a dictionary in another column, specify the
-column and key like this:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "response_column": f"{pred_col}.generated_answer",
-    "retrieved_contexts_column": f"{pred_col}.contexts",
-}
-```
-
-For more complex data structures, you can use a function to extract the answers:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "response_column": lambda row: "\n\n".join(row[pred_col]["messages"]),
-    "retrieved_contexts_column": lambda row: [row[pred_col]["context_message"]],
-}
-```
\ No newline at end of file
diff --git a/site/tests/model_validation/ragas/SemanticSimilarity.md b/site/tests/model_validation/ragas/SemanticSimilarity.md
deleted file mode 100644
index 51fe77ed56..0000000000
--- a/site/tests/model_validation/ragas/SemanticSimilarity.md
+++ /dev/null
@@ -1,59 +0,0 @@
-# SemanticSimilarity
-
-Calculates the semantic similarity between generated responses and ground truths.
-
-The concept of Answer Semantic Similarity pertains to the assessment of the semantic
-resemblance between the generated answer and the ground truth. This evaluation is
-based on the `reference` and the `response`, with values falling within the range
-of 0 to 1. A higher score signifies a better alignment between the generated response
-and the ground truth.
-
-Measuring the semantic similarity between answers can offer valuable insights into
-the quality of the generated response. This evaluation utilizes a cross-encoder
-model to calculate the semantic similarity score.
-
-See this paper for more details: https://arxiv.org/pdf/2108.06130.pdf
-
-The following steps are involved in computing the answer similarity score:
-1. Vectorize the ground truth answer using the specified embedding model.
-2. Vectorize the generated answer using the same embedding model.
-3. Compute the cosine similarity between the two vectors.
-
-### Configuring Columns
-
-This metric requires the following columns in your dataset:
-
-- `response` (str): The text response generated by the model.
-- `reference` (str): The ground truth answer that the generated answer is compared
-against.
-
-If the above data is not in the appropriate column, you can specify different column
-names for these fields using the parameters `response_column`, and `reference_column`.
-
-For example, if your dataset has this data stored in different columns, you can
-pass the following parameters:
-```python
-{
-    "response_column": "llm_output_col",
-    "reference_column": "my_ground_truth_col",
-}
-```
-
-If answer is stored as a dictionary in another column, specify the column and key
-like this:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "response_column": f"{pred_col}.generated_answer",
-    "reference_column": "my_ground_truth_col",
-}
-```
-
-For more complex situations, you can use a function to extract the data:
-```python
-pred_col = dataset.prediction_column(model)
-params = {
-    "response_column": lambda row: "\n\n".join(row[pred_col]["messages"]),
-    "reference_column": "my_ground_truth_col",
-}
-```
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/AdjustedMutualInformation.md b/site/tests/model_validation/sklearn/AdjustedMutualInformation.md
deleted file mode 100644
index bd510a905f..0000000000
--- a/site/tests/model_validation/sklearn/AdjustedMutualInformation.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# AdjustedMutualInformation
-
-Evaluates clustering model performance by measuring mutual information between true and predicted labels, adjusting
-for chance.
-
-### Purpose
-
-The purpose of this metric (Adjusted Mutual Information) is to evaluate the performance of a machine learning
-model, more specifically, a clustering model. It measures the mutual information between the true labels and the
-ones predicted by the model, adjusting for chance.
-
-### Test Mechanism
-
-The Adjusted Mutual Information (AMI) uses sklearn's `adjusted_mutual_info_score` function. This function
-calculates the mutual information between the true labels and the ones predicted while correcting for the chance
-correlation expected due to random label assignments. This test requires the model, the training dataset, and the
-test dataset as inputs.
-
-### Signs of High Risk
-
-- Low Adjusted Mutual Information Score: This score ranges between 0 and 1. A low score (closer to 0) can indicate
-poor model performance as the predicted labels do not align well with the true labels.
-- In case of high-dimensional data, if the algorithm shows high scores, this could also be a potential risk as AMI
-may not perform reliably.
-
-### Strengths
-
-- The AMI metric takes into account the randomness of the predicted labels, which makes it more robust than the
-simple Mutual Information.
-- The scale of AMI is not dependent on the sizes of the clustering, allowing for comparability between different
-datasets or models.
-- Good for comparing the output of clustering algorithms where the number of clusters is not known a priori.
-
-### Limitations
-
-- Adjusted Mutual Information does not take into account the continuous nature of some data. As a result, it may
-not be the best choice for regression or other continuous types of tasks.
-- AMI has the drawback of being biased towards clusterings with a higher number of clusters.
-- In comparison to other metrics, AMI can be slower to compute.
-- The interpretability of the score can be complex as it depends on the understanding of information theory
-concepts.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/AdjustedRandIndex.md b/site/tests/model_validation/sklearn/AdjustedRandIndex.md
deleted file mode 100644
index 106f524999..0000000000
--- a/site/tests/model_validation/sklearn/AdjustedRandIndex.md
+++ /dev/null
@@ -1,38 +0,0 @@
-# AdjustedRandIndex
-
-Measures the similarity between two data clusters using the Adjusted Rand Index (ARI) metric in clustering machine
-learning models.
-
-### Purpose
-
-The Adjusted Rand Index (ARI) metric is intended to measure the similarity between two data clusters. This metric
-is specifically used for clustering machine learning models to quantify how well the model is clustering and
-producing data groups. It involves comparing the model's produced clusters against the actual (true) clusters found
-in the dataset.
-
-### Test Mechanism
-
-The Adjusted Rand Index (ARI) is calculated using the `adjusted_rand_score` method from the `sklearn.metrics`
-module in Python. The test requires inputs including the model itself and the model's training and test datasets.
-The model's computed clusters and the true clusters are compared, and the similarities are measured to compute the
-ARI.
-
-### Signs of High Risk
-
-- If the ARI is close to zero, it signifies that the model's cluster assignments are random and do not match the
-actual dataset clusters, indicating a high risk.
-- An ARI of less than zero indicates that the model's clustering performance is worse than random.
-
-### Strengths
-
-- ARI is normalized and provides a consistent metric between -1 and +1, irrespective of raw cluster sizes or
-dataset size variations.
-- It does not require a ground truth for computation, making it ideal for unsupervised learning model evaluations.
-- It penalizes for false positives and false negatives, providing a robust measure of clustering quality.
-
-### Limitations
-
-- In real-world situations, true clustering is often unknown, which can hinder the practical application of the ARI.
-- The ARI requires all individual data instances to be independent, which may not always hold true.
-- It may be difficult to interpret the implications of an ARI score without context or a benchmark, as it is
-heavily dependent on the characteristics of the dataset used.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/CalibrationCurve.md b/site/tests/model_validation/sklearn/CalibrationCurve.md
deleted file mode 100644
index 023858f2b7..0000000000
--- a/site/tests/model_validation/sklearn/CalibrationCurve.md
+++ /dev/null
@@ -1,53 +0,0 @@
-# CalibrationCurve
-
-Evaluates the calibration of probability estimates by comparing predicted probabilities against observed
-frequencies.
-
-### Purpose
-
-The Calibration Curve test assesses how well a model's predicted probabilities align with actual
-observed frequencies. This is crucial for applications requiring accurate probability estimates,
-such as risk assessment, decision-making systems, and cost-sensitive applications where probability
-calibration directly impacts business decisions.
-
-### Test Mechanism
-
-The test uses sklearn's calibration_curve function to:
-1. Sort predictions into bins based on predicted probabilities
-2. Calculate the mean predicted probability in each bin
-3. Compare against the observed frequency of positive cases
-4. Plot the results against the perfect calibration line (y=x)
-The resulting curve shows how well the predicted probabilities match empirical probabilities.
-
-### Signs of High Risk
-
-- Significant deviation from the perfect calibration line
-- Systematic overconfidence (predictions too close to 0 or 1)
-- Systematic underconfidence (predictions clustered around 0.5)
-- Empty or sparse bins indicating poor probability coverage
-- Sharp discontinuities in the calibration curve
-- Different calibration patterns across different probability ranges
-- Consistent over/under estimation in critical probability regions
-- Large confidence intervals in certain probability ranges
-
-### Strengths
-
-- Visual and intuitive interpretation of probability quality
-- Identifies systematic biases in probability estimates
-- Supports probability threshold selection
-- Helps understand model confidence patterns
-- Applicable across different classification models
-- Enables comparison between different models
-- Guides potential need for recalibration
-- Critical for risk-sensitive applications
-
-### Limitations
-
-- Sensitive to the number of bins chosen
-- Requires sufficient samples in each bin for reliable estimates
-- May mask local calibration issues within bins
-- Does not account for feature-dependent calibration issues
-- Limited to binary classification problems
-- Cannot detect all forms of miscalibration
-- Assumes bin boundaries are appropriate for the problem
-- May be affected by class imbalance
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/ClassifierPerformance.md b/site/tests/model_validation/sklearn/ClassifierPerformance.md
deleted file mode 100644
index e5870d812e..0000000000
--- a/site/tests/model_validation/sklearn/ClassifierPerformance.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# ClassifierPerformance
-
-Evaluates performance of binary or multiclass classification models using precision, recall, F1-Score, accuracy,
-and ROC AUC scores.
-
-### Purpose
-
-The Classifier Performance test is designed to evaluate the performance of Machine Learning classification models.
-It accomplishes this by computing precision, recall, F1-Score, and accuracy, as well as the ROC AUC (Receiver
-operating characteristic - Area under the curve) scores, thereby providing a comprehensive analytic view of the
-models' performance. The test is adaptable, handling binary and multiclass models equally effectively.
-
-### Test Mechanism
-
-The test produces a report that includes precision, recall, F1-Score, and accuracy, by leveraging the
-`classification_report` from scikit-learn's metrics module. For multiclass models, macro and weighted averages for
-these scores are also calculated. Additionally, the ROC AUC scores are calculated and included in the report using
-the `multiclass_roc_auc_score` function. The outcome of the test (report format) differs based on whether the model
-is binary or multiclass.
-
-### Signs of High Risk
-
-- Low values for precision, recall, F1-Score, accuracy, and ROC AUC, indicating poor performance.
-- Imbalance in precision and recall scores.
-- A low ROC AUC score, especially scores close to 0.5 or lower, suggesting a failing model.
-
-### Strengths
-
-- Versatile, capable of assessing both binary and multiclass models.
-- Utilizes a variety of commonly employed performance metrics, offering a comprehensive view of model performance.
-- The use of ROC-AUC as a metric is beneficial for evaluating unbalanced datasets.
-
-### Limitations
-
-- Assumes correctly identified labels for binary classification models.
-- Specifically designed for classification models and not suitable for regression models.
-- May provide limited insights if the test dataset does not represent real-world scenarios adequately.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/ClassifierThresholdOptimization.md b/site/tests/model_validation/sklearn/ClassifierThresholdOptimization.md
deleted file mode 100644
index 15913dc7c7..0000000000
--- a/site/tests/model_validation/sklearn/ClassifierThresholdOptimization.md
+++ /dev/null
@@ -1,66 +0,0 @@
-# ClassifierThresholdOptimization
-
-Analyzes and visualizes different threshold optimization methods for binary classification models.
-
-### Purpose
-
-The Classifier Threshold Optimization test identifies optimal decision thresholds using various
-methods to balance different performance metrics. This helps adapt the model's decision boundary
-to specific business requirements, such as minimizing false positives in fraud detection or
-achieving target recall in medical diagnosis.
-
-### Test Mechanism
-
-The test implements multiple threshold optimization methods:
-1. Youden's J statistic (maximizing sensitivity + specificity - 1)
-2. F1-score optimization (balancing precision and recall)
-3. Precision-Recall equality point
-4. Target recall achievement
-5. Naive (0.5) threshold
-For each method, it computes ROC and PR curves, identifies optimal points, and provides
-comprehensive performance metrics at each threshold.
-
-### Signs of High Risk
-
-- Large discrepancies between different optimization methods
-- Optimal thresholds far from the default 0.5
-- Poor performance metrics across all thresholds
-- Significant gap between achieved and target recall
-- Unstable thresholds across different methods
-- Extreme trade-offs between precision and recall
-- Threshold optimization showing minimal impact
-- Business metrics not improving with optimization
-
-### Strengths
-
-- Multiple optimization strategies for different needs
-- Visual and numerical results for comparison
-- Support for business-driven optimization (target recall)
-- Comprehensive performance metrics at each threshold
-- Integration with ROC and PR curves
-- Handles class imbalance through various metrics
-- Enables informed threshold selection
-- Supports cost-sensitive decision making
-
-### Limitations
-
-- Assumes the costs of false positives/negatives are known
-- May need adjustment for highly imbalanced datasets
-- Threshold might not be stable across different samples
-- Cannot handle multi-class problems directly
-- Optimization methods may conflict with business needs
-- Requires sufficient validation data
-- May not capture temporal changes in optimal threshold
-- Single threshold may not be optimal for all subgroups
-
-Args:
-dataset: VMDataset containing features and target
-model: VMModel containing predictions
-methods: List of methods to compare (default: ['youden', 'f1', 'precision_recall'])
-target_recall: Target recall value if using 'target_recall' method
-
-Returns:
-Dictionary containing:
-- table: DataFrame comparing different threshold optimization methods
-(using weighted averages for precision, recall, and f1)
-- figure: Plotly figure showing ROC and PR curves with optimal thresholds
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/ClusterCosineSimilarity.md b/site/tests/model_validation/sklearn/ClusterCosineSimilarity.md
deleted file mode 100644
index 36ac2ea586..0000000000
--- a/site/tests/model_validation/sklearn/ClusterCosineSimilarity.md
+++ /dev/null
@@ -1,43 +0,0 @@
-# ClusterCosineSimilarity
-
-Measures the intra-cluster similarity of a clustering model using cosine similarity.
-
-### Purpose
-
-The purpose of this metric is to measure how similar the data points within each cluster of a clustering model are.
-This is done using cosine similarity, which compares the multi-dimensional direction (but not magnitude) of data
-vectors. From a Model Risk Management perspective, this metric is used to quantitatively validate that clusters
-formed by a model have high intra-cluster similarity.
-
-### Test Mechanism
-
-This test works by first extracting the true and predicted clusters of the model's training data. Then, it computes
-the centroid (average data point) of each cluster. Next, it calculates the cosine similarity between each data
-point within a cluster and its respective centroid. Finally, it outputs the mean cosine similarity of each cluster,
-highlighting how similar, on average, data points in a cluster are to the cluster's centroid.
-
-### Signs of High Risk
-
-- Low mean cosine similarity for one or more clusters: If the mean cosine similarity is low, the data points within
-the respective cluster have high variance in their directions. This can be indicative of poor clustering,
-suggesting that the model might not be suitably separating the data into distinct patterns.
-- High disparity between mean cosine similarity values across clusters: If there's a significant difference in mean
-cosine similarity across different clusters, this could indicate imbalance in how the model forms clusters.
-
-### Strengths
-
-- Cosine similarity operates in a multi-dimensional space, making it effective for measuring similarity in high
-dimensional datasets, typical for many machine learning problems.
-- It provides an agnostic view of the cluster performance by only considering the direction (and not the magnitude)
-of each vector.
-- This metric is not dependent on the scale of the variables, making it equally effective on different scales.
-
-### Limitations
-
-- Cosine similarity does not consider magnitudes (i.e. lengths) of vectors, only their direction. This means it may
-overlook instances where clusters have been adequately separated in terms of magnitude.
-- This method summarily assumes that centroids represent the average behavior of data points in each cluster. This
-might not always be true, especially in clusters with high amounts of variance or non-spherical shapes.
-- It primarily works with continuous variables and is not suitable for binary or categorical variables.
-- Lastly, although rare, perfectly perpendicular vectors (cosine similarity = 0) could be within the same cluster,
-which may give an inaccurate representation of a 'bad' cluster due to low cosine similarity score.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/ClusterPerformanceMetrics.md b/site/tests/model_validation/sklearn/ClusterPerformanceMetrics.md
deleted file mode 100644
index a1f70d9845..0000000000
--- a/site/tests/model_validation/sklearn/ClusterPerformanceMetrics.md
+++ /dev/null
@@ -1,45 +0,0 @@
-# ClusterPerformanceMetrics
-
-Evaluates the performance of clustering machine learning models using multiple established metrics.
-
-### Purpose
-
-The `ClusterPerformanceMetrics` test is used to assess the performance and validity of clustering machine learning
-models. It evaluates homogeneity, completeness, V measure score, the Adjusted Rand Index, the Adjusted Mutual
-Information, and the Fowlkes-Mallows score of the model. These metrics provide a holistic understanding of the
-model's ability to accurately form clusters of the given dataset.
-
-### Test Mechanism
-
-The `ClusterPerformanceMetrics` test runs a clustering ML model over a given dataset and then calculates six
-metrics using the Scikit-learn metrics computation functions: Homogeneity Score, Completeness Score, V Measure,
-Adjusted Rand Index (ARI), Adjusted Mutual Information (AMI), and Fowlkes-Mallows Score. It then returns the result
-as a summary, presenting the metric values for both training and testing datasets.
-
-### Signs of High Risk
-
-- Low Homogeneity Score: Indicates that the clusters formed contain a variety of classes, resulting in less pure
-clusters.
-- Low Completeness Score: Suggests that class instances are scattered across multiple clusters rather than being
-gathered in a single cluster.
-- Low V Measure: Reports a low overall clustering performance.
-- ARI close to 0 or Negative: Implies that clustering results are random or disagree with the true labels.
-- AMI close to 0: Means that clustering labels are random compared with the true labels.
-- Low Fowlkes-Mallows score: Signifies less precise and poor clustering performance in terms of precision and
-recall.
-
-### Strengths
-
-- Provides a comprehensive view of clustering model performance by examining multiple clustering metrics.
-- Uses established and widely accepted metrics from scikit-learn, providing reliability in the results.
-- Able to provide performance metrics for both training and testing datasets.
-- Clearly defined and human-readable descriptions of each score make it easy to understand what each score
-represents.
-
-### Limitations
-
-- Only applies to clustering models; not suitable for other types of machine learning models.
-- Does not test for overfitting or underfitting in the clustering model.
-- All the scores rely on ground truth labels, the absence or inaccuracy of which can lead to misleading results.
-- Does not consider aspects like computational efficiency of the model or its capability to handle high dimensional
-data.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/CompletenessScore.md b/site/tests/model_validation/sklearn/CompletenessScore.md
deleted file mode 100644
index 34bc9cc9d8..0000000000
--- a/site/tests/model_validation/sklearn/CompletenessScore.md
+++ /dev/null
@@ -1,36 +0,0 @@
-# CompletenessScore
-
-Evaluates a clustering model's capacity to categorize instances from a single class into the same cluster.
-
-### Purpose
-
-The Completeness Score metric is used to assess the performance of clustering models. It measures the extent to
-which all the data points that are members of a given class are elements of the same cluster. The aim is to
-determine the capability of the model to categorize all instances from a single class into the same cluster.
-
-### Test Mechanism
-
-This test takes three inputs: a model and its associated training and testing datasets. It invokes the
-`completeness_score` function from the sklearn library on the labels predicted by the model. High scores indicate
-that data points from the same class generally appear in the same cluster, while low scores suggest the opposite.
-
-### Signs of High Risk
-
-- Low completeness score: This suggests that the model struggles to group instances from the same class into one
-cluster, indicating poor clustering performance.
-
-### Strengths
-
-- The Completeness Score provides an effective method for assessing the performance of a clustering model,
-specifically its ability to group class instances together.
-- This test metric conveniently relies on the capabilities provided by the sklearn library, ensuring consistent and
-reliable test results.
-
-### Limitations
-
-- This metric only evaluates a specific aspect of clustering, meaning it may not provide a holistic or complete
-view of the model's performance.
-- It cannot assess the effectiveness of the model in differentiating between separate classes, as it is solely
-focused on how well data points from the same class are grouped.
-- The Completeness Score only applies to clustering models; it cannot be used for other types of machine learning
-models.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/ConfusionMatrix.md b/site/tests/model_validation/sklearn/ConfusionMatrix.md
deleted file mode 100644
index 345c6579a9..0000000000
--- a/site/tests/model_validation/sklearn/ConfusionMatrix.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# ConfusionMatrix
-
-Evaluates and visually represents the classification ML model's predictive performance using a Confusion Matrix
-heatmap.
-
-### Purpose
-
-The Confusion Matrix tester is designed to assess the performance of a classification Machine Learning model. This
-performance is evaluated based on how well the model is able to correctly classify True Positives, True Negatives,
-False Positives, and False Negatives - fundamental aspects of model accuracy.
-
-### Test Mechanism
-
-The mechanism used involves taking the predicted results (`y_test_predict`) from the classification model and
-comparing them against the actual values (`y_test_true`). A confusion matrix is built using the unique labels
-extracted from `y_test_true`, employing scikit-learn's metrics. The matrix is then visually rendered with the help
-of Plotly's `create_annotated_heatmap` function. A heatmap is created which provides a two-dimensional graphical
-representation of the model's performance, showcasing distributions of True Positives (TP), True Negatives (TN),
-False Positives (FP), and False Negatives (FN).
-
-### Signs of High Risk
-
-- High numbers of False Positives (FP) and False Negatives (FN), depicting that the model is not effectively
-classifying the values.
-- Low numbers of True Positives (TP) and True Negatives (TN), implying that the model is struggling with correctly
-identifying class labels.
-
-### Strengths
-
-- It provides a simplified yet comprehensive visual snapshot of the classification model's predictive performance.
-- It distinctly brings out True Positives (TP), True Negatives (TN), False Positives (FP), and False Negatives
-(FN), thus making it easier to focus on potential areas of improvement.
-- The matrix is beneficial in dealing with multi-class classification problems as it can provide a simple view of
-complex model performances.
-- It aids in understanding the different types of errors that the model could potentially make, as it provides
-in-depth insights into Type-I and Type-II errors.
-
-### Limitations
-
-- In cases of unbalanced classes, the effectiveness of the confusion matrix might be lessened. It may wrongly
-interpret the accuracy of a model that is essentially just predicting the majority class.
-- It does not provide a single unified statistic that could evaluate the overall performance of the model.
-Different aspects of the model's performance are evaluated separately instead.
-- It mainly serves as a descriptive tool and does not offer the capability for statistical hypothesis testing.
-- Risks of misinterpretation exist because the matrix doesn't directly provide precision, recall, or F1-score data.
-These metrics have to be computed separately.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/FeatureImportance.md b/site/tests/model_validation/sklearn/FeatureImportance.md
deleted file mode 100644
index bc5a445bbe..0000000000
--- a/site/tests/model_validation/sklearn/FeatureImportance.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# FeatureImportance
-
-Compute feature importance scores for a given model and generate a summary table
-with the top important features.
-
-### Purpose
-
-The Feature Importance Comparison test is designed to compare the feature importance scores for different models
-when applied to various datasets. By doing so, it aims to identify the most impactful features and assess the
-consistency of feature importance across models.
-
-### Test Mechanism
-
-This test works by iterating through each dataset-model pair and calculating permutation feature importance (PFI)
-scores. It then generates a summary table containing the top `num_features` important features for each model. The
-process involves:
-
-- Extracting features and target data from each dataset.
-- Computing PFI scores using `sklearn.inspection.permutation_importance`.
-- Sorting and selecting the top features based on their importance scores.
-- Compiling these features into a summary table for comparison.
-
-### Signs of High Risk
-
-- Key features expected to be important are ranked low, indicating potential issues with model training or data
-quality.
-- High variance in feature importance scores across different models, suggesting instability in feature selection.
-
-### Strengths
-
-- Provides a clear comparison of the most important features for each model.
-- Uses permutation importance, which is a model-agnostic method and can be applied to any estimator.
-
-### Limitations
-
-- Assumes that the dataset is provided as a DataFrameDataset object with `x_df` and `y_df` methods to access
-feature and target data.
-- Requires that `model.model` is compatible with `sklearn.inspection.permutation_importance`.
-- The function's output is dependent on the number of features specified by `num_features`, which defaults to 3 but
-can be adjusted.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/FowlkesMallowsScore.md b/site/tests/model_validation/sklearn/FowlkesMallowsScore.md
deleted file mode 100644
index ef41039479..0000000000
--- a/site/tests/model_validation/sklearn/FowlkesMallowsScore.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# FowlkesMallowsScore
-
-Evaluates the similarity between predicted and actual cluster assignments in a model using the Fowlkes-Mallows
-score.
-
-### Purpose
-
-The FowlkesMallowsScore is a performance metric used to validate clustering algorithms within machine learning
-models. The score intends to evaluate the matching grade between two clusters. It measures the similarity between
-the predicted and actual cluster assignments, thus gauging the accuracy of the model's clustering capability.
-
-### Test Mechanism
-
-The FowlkesMallowsScore method applies the `fowlkes_mallows_score` function from the `sklearn` library to evaluate
-the model's accuracy in clustering different types of data. The test takes the model's training and testing
-datasets as inputs, then compares the resulting clusters against the previously known clusters to obtain
-a score. A high score indicates a better clustering performance by the model.
-
-### Signs of High Risk
-
-- A low Fowlkes-Mallows score (near zero): This indicates that the model's clustering capability is poor and the
-algorithm isn't properly grouping data.
-- Inconsistently low scores across different datasets: This may indicate that the model's clustering performance is
-not robust and the model may fail when applied to unseen data.
-
-### Strengths
-
-- The Fowlkes-Mallows score is a simple and effective method for evaluating the performance of clustering
-algorithms.
-- This metric takes into account both precision and recall in its calculation, therefore providing a balanced and
-comprehensive measure of model performance.
-- The Fowlkes-Mallows score is non-biased, meaning it treats False Positives and False Negatives equally.
-
-### Limitations
-
-- As a pairwise-based method, this score can be computationally intensive for large datasets and can become
-unfeasible as the size of the dataset increases.
-- The Fowlkes-Mallows score works best with balanced distribution of samples across clusters. If this condition is
-not met, the score can be skewed.
-- It does not handle mismatching numbers of clusters between the true and predicted labels. As such, it may return
-misleading results if the predicted labels suggest a different number of clusters than what is in the true labels.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/HomogeneityScore.md b/site/tests/model_validation/sklearn/HomogeneityScore.md
deleted file mode 100644
index 7d82c6dafa..0000000000
--- a/site/tests/model_validation/sklearn/HomogeneityScore.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# HomogeneityScore
-
-Assesses clustering homogeneity by comparing true and predicted labels, scoring from 0 (heterogeneous) to 1
-(homogeneous).
-
-### Purpose
-
-The Homogeneity Score encapsulated in this performance test is used to measure the homogeneity of the clusters
-formed by a machine learning model. In simple terms, a clustering result satisfies homogeneity if all of its
-clusters contain only points which are members of a single class.
-
-### Test Mechanism
-
-This test uses the `homogeneity_score` function from the `sklearn.metrics` library to compare the ground truth
-class labels of the training and testing sets with the labels predicted by the given model. The returned score is a
-metric of the clustering accuracy, and ranges from 0.0 to 1.0, with 1.0 denoting the highest possible degree of
-homogeneity.
-
-### Signs of High Risk
-
-- A score close to 0: This denotes that clusters are highly heterogeneous and points within the same cluster might
-not belong to the same class.
-- A significantly lower score for testing data compared to the score for training data: This can indicate
-overfitting, where the model has learned to perfectly match the training data but fails to perform well on unseen
-data.
-
-### Strengths
-
-- It provides a simple quantitative measure of the degree to which clusters contain points from only one class.
-- Useful for validating clustering solutions where the ground truth — class membership of points — is known.
-- It's agnostic to the absolute labels, and cares only that the points within the same cluster have the same class
-label.
-
-### Limitations
-
-- The Homogeneity Score is not useful for clustering solutions where the ground truth labels are not known.
-- It doesn’t work well with differently sized clusters since it gives predominance to larger clusters.
-- The score does not address the actual number of clusters formed, or the evenness of cluster sizes. It only checks
-the homogeneity within the given clusters created by the model.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/HyperParametersTuning.md b/site/tests/model_validation/sklearn/HyperParametersTuning.md
deleted file mode 100644
index 2375885271..0000000000
--- a/site/tests/model_validation/sklearn/HyperParametersTuning.md
+++ /dev/null
@@ -1,51 +0,0 @@
-# HyperParametersTuning
-
-Performs exhaustive grid search over specified parameter ranges to find optimal model configurations
-across different metrics and decision thresholds.
-
-### Purpose
-
-The Hyperparameter Tuning test systematically explores the model's parameter space to identify optimal
-configurations. It supports multiple optimization metrics and decision thresholds, providing a comprehensive
-view of how different parameter combinations affect various aspects of model performance.
-
-### Test Mechanism
-
-The test uses scikit-learn's GridSearchCV to perform cross-validation for each parameter combination.
-For each specified threshold and optimization metric, it creates a scoring dictionary with
-threshold-adjusted metrics, performs grid search with cross-validation, records best parameters and
-corresponding scores, and combines results into a comparative table. This process is repeated for each
-optimization metric to provide a comprehensive view of model performance under different configurations.
-
-### Signs of High Risk
-
-- Large performance variations across different parameter combinations
-- Significant discrepancies between different optimization metrics
-- Best parameters at the edges of the parameter grid
-- Unstable performance across different thresholds
-- Overly complex model configurations (risk of overfitting)
-- Very different optimal parameters for different metrics
-- Cross-validation scores showing high variance
-- Extreme parameter values in best configurations
-
-### Strengths
-
-- Comprehensive exploration of parameter space
-- Supports multiple optimization metrics
-- Allows threshold optimization
-- Provides comparative view across different configurations
-- Uses cross-validation for robust evaluation
-- Helps understand trade-offs between different metrics
-- Enables systematic parameter selection
-- Supports both classification and clustering tasks
-
-### Limitations
-
-- Computationally expensive for large parameter grids
-- May not find global optimum (limited to grid points)
-- Cannot handle dependencies between parameters
-- Memory intensive for large datasets
-- Limited to scikit-learn compatible models
-- Cross-validation splits may not preserve time series structure
-- Grid search may miss optimal values between grid points
-- Resource intensive for high-dimensional parameter spaces
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/KMeansClustersOptimization.md b/site/tests/model_validation/sklearn/KMeansClustersOptimization.md
deleted file mode 100644
index 51c0e789a7..0000000000
--- a/site/tests/model_validation/sklearn/KMeansClustersOptimization.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# KMeansClustersOptimization
-
-Optimizes the number of clusters in K-means models using Elbow and Silhouette methods.
-
-### Purpose
-
-This metric is used to optimize the number of clusters used in K-means clustering models. It intends to measure and
-evaluate the optimal number of clusters by leveraging two methodologies, namely the Elbow method and the Silhouette
-method. This is crucial as an inappropriate number of clusters can either overly simplify or overcomplicate the
-structure of the data, thereby undermining the effectiveness of the model.
-
-### Test Mechanism
-
-The test mechanism involves iterating over a predefined range of cluster numbers and applying both the Elbow method
-and the Silhouette method. The Elbow method computes the sum of the minimum euclidean distances between data points
-and their respective cluster centers (distortion). This value decreases as the number of clusters increases; the
-optimal number is typically at the 'elbow' point where the decrease in distortion becomes less pronounced.
-Meanwhile, the Silhouette method calculates the average silhouette score for each data point in the dataset,
-providing a measure of how similar each item is to its own cluster compared to other clusters. The optimal number
-of clusters under this method is the one that maximizes the average silhouette score. The results of both methods
-are plotted for visual inspection.
-
-### Signs of High Risk
-
-- A high distortion value or a low silhouette average score for the optimal number of clusters.
-- No clear 'elbow' point or plateau observed in the distortion plot, or a uniformly low silhouette average score
-across different numbers of clusters, suggesting the data is not amenable to clustering.
-- An optimal cluster number that is unreasonably high or low, suggestive of overfitting or underfitting,
-respectively.
-
-### Strengths
-
-- Provides both a visual and quantitative method to determine the optimal number of clusters.
-- Leverages two different methods (Elbow and Silhouette), thereby affording robustness and versatility in assessing
-the data's clusterability.
-- Facilitates improved model performance by allowing for an informed selection of the number of clusters.
-
-### Limitations
-
-- Assumes that a suitable number of clusters exists in the data, which may not always be true, especially for
-complex or noisy data.
-- Both methods may fail to provide definitive answers when the data lacks clear cluster structures.
-- Might not be straightforward to determine the 'elbow' point or maximize the silhouette average score, especially
-in larger and complicated datasets.
-- Assumes spherical clusters (due to using the Euclidean distance in the Elbow method), which might not align with
-the actual structure of the data.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/MinimumAccuracy.md b/site/tests/model_validation/sklearn/MinimumAccuracy.md
deleted file mode 100644
index a38ca5b8e8..0000000000
--- a/site/tests/model_validation/sklearn/MinimumAccuracy.md
+++ /dev/null
@@ -1,36 +0,0 @@
-# MinimumAccuracy
-
-Checks if the model's prediction accuracy meets or surpasses a specified threshold.
-
-### Purpose
-
-The Minimum Accuracy test’s objective is to verify whether the model's prediction accuracy on a specific dataset
-meets or surpasses a predetermined minimum threshold. Accuracy, which is simply the ratio of correct predictions to
-total predictions, is a key metric for evaluating the model's performance. Considering binary as well as multiclass
-classifications, accurate labeling becomes indispensable.
-
-### Test Mechanism
-
-The test mechanism involves contrasting the model's accuracy score with a preset minimum threshold value, with the
-default being 0.7. The accuracy score is computed utilizing sklearn’s `accuracy_score` method, where the true
-labels `y_true` and predicted labels `class_pred` are compared. If the accuracy score is above the threshold, the
-test receives a passing mark. The test returns the result along with the accuracy score and threshold used for the
-test.
-
-### Signs of High Risk
-
-- Model fails to achieve or surpass the predefined score threshold.
-- Persistent scores below the threshold, indicating a high risk of inaccurate predictions.
-
-### Strengths
-
-- Simplicity, presenting a straightforward measure of holistic model performance across all classes.
-- Particularly advantageous when classes are balanced.
-- Versatile, as it can be implemented on both binary and multiclass classification tasks.
-
-### Limitations
-
-- Misleading accuracy scores when classes in the dataset are highly imbalanced.
-- Favoritism towards the majority class, giving an inaccurate perception of model performance.
-- Inability to measure the model's precision, recall, or capacity to manage false positives or false negatives.
-- Focused on overall correctness and may not be sufficient for all types of model analytics.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/MinimumF1Score.md b/site/tests/model_validation/sklearn/MinimumF1Score.md
deleted file mode 100644
index 668146e1d6..0000000000
--- a/site/tests/model_validation/sklearn/MinimumF1Score.md
+++ /dev/null
@@ -1,38 +0,0 @@
-# MinimumF1Score
-
-Assesses if the model's F1 score on the validation set meets a predefined minimum threshold, ensuring balanced
-performance between precision and recall.
-
-### Purpose
-
-The main objective of this test is to ensure that the F1 score, a balanced measure of precision and recall, of the
-model meets or surpasses a predefined threshold on the validation dataset. The F1 score is highly useful for
-gauging model performance in classification tasks, especially in cases where the distribution of positive and
-negative classes is skewed.
-
-### Test Mechanism
-
-The F1 score for the validation dataset is computed through scikit-learn's metrics in Python. The scoring mechanism
-differs based on the classification problem: for multi-class problems, macro averaging is used, and for binary
-classification, the built-in `f1_score` calculation is used. The obtained F1 score is then assessed against the
-predefined minimum F1 score that is expected from the model.
-
-### Signs of High Risk
-
-- If a model returns an F1 score that is less than the established threshold, it is regarded as high risk.
-- A low F1 score might suggest that the model is not finding an optimal balance between precision and recall,
-failing to effectively identify positive classes while minimizing false positives.
-
-### Strengths
-
-- Provides a balanced measure of a model's performance by accounting for both false positives and false negatives.
-- Particularly advantageous in scenarios with imbalanced class distribution, where accuracy can be misleading.
-- Flexibility in setting the threshold value allows tailored minimum acceptable performance standards.
-
-### Limitations
-
-- May not be suitable for all types of models and machine learning tasks.
-- The F1 score assumes an equal cost for false positives and false negatives, which may not be true in some
-real-world scenarios.
-- Practitioners might need to rely on other metrics such as precision, recall, or the ROC-AUC score that align more
-closely with specific requirements.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/MinimumROCAUCScore.md b/site/tests/model_validation/sklearn/MinimumROCAUCScore.md
deleted file mode 100644
index ed2b660023..0000000000
--- a/site/tests/model_validation/sklearn/MinimumROCAUCScore.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# MinimumROCAUCScore
-
-Validates model by checking if the ROC AUC score meets or surpasses a specified threshold.
-
-### Purpose
-
-The Minimum ROC AUC Score test is used to determine the model's performance by ensuring that the Receiver Operating
-Characteristic Area Under the Curve (ROC AUC) score on the validation dataset meets or exceeds a predefined
-threshold. The ROC AUC score indicates how well the model can distinguish between different classes, making it a
-crucial measure in binary and multiclass classification tasks.
-
-### Test Mechanism
-
-This test implementation calculates the multiclass ROC AUC score on the true target values and the model's
-predictions. The test converts the multi-class target variables into binary format using `LabelBinarizer` before
-computing the score. If this ROC AUC score is higher than the predefined threshold (defaulted to 0.5), the test
-passes; otherwise, it fails. The results, including the ROC AUC score, the threshold, and whether the test passed
-or failed, are then stored in a `ThresholdTestResult` object.
-
-### Signs of High Risk
-
-- A low ROC AUC score, specifically any score below the predefined minimum threshold, indicates high risk or
-failure in the model's performance with respect to this metric. This suggests that the model is
-struggling to distinguish between different classes effectively.
-
-### Strengths
-
-- The test considers both the true positive rate and false positive rate, providing a comprehensive performance
-measure.
-- The ROC AUC score is threshold-independent, meaning it measures the model's quality across various classification
-thresholds.
-- Works robustly with binary as well as multi-class classification problems.
-
-### Limitations
-
-- ROC AUC may not be useful if the class distribution is highly imbalanced; it could perform well in terms of AUC
-but still fail to predict the minority class.
-- The test does not provide insight into what specific aspects of the model are causing poor performance if the ROC
-AUC score is unsatisfactory.
-- The use of macro average for multiclass ROC AUC score implies equal weightage to each class, which might not be
-appropriate if the classes are imbalanced.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/ModelParameters.md b/site/tests/model_validation/sklearn/ModelParameters.md
deleted file mode 100644
index a1a3b37cce..0000000000
--- a/site/tests/model_validation/sklearn/ModelParameters.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# ModelParameters
-
-Extracts and displays model parameters in a structured format for transparency and reproducibility.
-
-### Purpose
-
-The Model Parameters test is designed to provide transparency into model configuration and ensure
-reproducibility of machine learning models. It accomplishes this by extracting and presenting all
-relevant parameters that define the model's behavior, making it easier to audit, validate, and
-reproduce model training.
-
-### Test Mechanism
-
-The test leverages scikit-learn's API convention of `get_params()` to extract model parameters. It
-produces a structured DataFrame containing parameter names and their corresponding values. For models
-that follow scikit-learn's API (including XGBoost, RandomForest, and other estimators), all
-parameters are automatically extracted and displayed.
-
-### Signs of High Risk
-
-- Missing crucial parameters that should be explicitly set
-- Extreme parameter values that could indicate overfitting (e.g., unlimited tree depth)
-- Inconsistent parameters across different versions of the same model type
-- Parameter combinations known to cause instability or poor performance
-- Default values used for critical parameters that should be tuned
-
-### Strengths
-
-- Universal compatibility with scikit-learn API-compliant models
-- Ensures transparency in model configuration
-- Facilitates model reproducibility and version control
-- Enables systematic parameter auditing
-- Supports both classification and regression models
-- Helps identify potential configuration issues
-
-### Limitations
-
-- Only works with models implementing scikit-learn's `get_params()` method
-- Cannot capture dynamic parameters set during model training
-- Does not validate parameter values for model-specific appropriateness
-- Parameter meanings and impacts may vary across different model types
-- Cannot detect indirect parameter interactions or their effects on model performance
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/ModelsPerformanceComparison.md b/site/tests/model_validation/sklearn/ModelsPerformanceComparison.md
deleted file mode 100644
index 26d953fa31..0000000000
--- a/site/tests/model_validation/sklearn/ModelsPerformanceComparison.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# ModelsPerformanceComparison
-
-Evaluates and compares the performance of multiple Machine Learning models using various metrics like accuracy,
-precision, recall, and F1 score.
-
-### Purpose
-
-The Models Performance Comparison test aims to evaluate and compare the performance of various Machine Learning
-models using test data. It employs multiple metrics such as accuracy, precision, recall, and the F1 score, among
-others, to assess model performance and assist in selecting the most effective model for the designated task.
-
-### Test Mechanism
-
-The test employs Scikit-learn’s performance metrics to evaluate each model's performance for both binary and
-multiclass classification tasks. To compare performances, the test runs each model against the test dataset, then
-produces a comprehensive classification report. This report includes metrics such as accuracy, precision, recall,
-and the F1 score. Based on whether the task at hand is binary or multiclass classification, it calculates metrics
-for all the classes and their weighted averages, macro averages, and per-class metrics. The test will be skipped if
-no models are supplied.
-
-### Signs of High Risk
-
-- Low scores in accuracy, precision, recall, and F1 metrics indicate a potentially high risk.
-- A low area under the Receiver Operating Characteristic (ROC) curve (roc_auc score) is another possible indicator
-of high risk.
-- If the metrics scores are significantly lower than alternative models, this might suggest a high risk of failure.
-
-### Strengths
-
-- Provides a simple way to compare the performance of multiple models, accommodating both binary and multiclass
-classification tasks.
-- Offers a holistic view of model performance through a comprehensive report of key performance metrics.
-- The inclusion of the ROC AUC score is advantageous, as this robust performance metric can effectively handle
-class imbalance issues.
-
-### Limitations
-
-- May not be suitable for more complex performance evaluations that consider factors such as prediction speed,
-computational cost, or business-specific constraints.
-- The test's reliability depends on the provided test dataset; hence, the selected models' performance could vary
-with unseen data or changes in the data distribution.
-- The ROC AUC score might not be as meaningful or easily interpretable for multilabel/multiclass tasks.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/OverfitDiagnosis.md b/site/tests/model_validation/sklearn/OverfitDiagnosis.md
deleted file mode 100644
index 993487fd7e..0000000000
--- a/site/tests/model_validation/sklearn/OverfitDiagnosis.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# OverfitDiagnosis
-
-Assesses potential overfitting in a model's predictions, identifying regions where performance between training and
-testing sets deviates significantly.
-
-### Purpose
-
-The Overfit Diagnosis test aims to identify areas in a model's predictions where there is a significant difference
-in performance between the training and testing sets. This test helps to pinpoint specific regions or feature
-segments where the model may be overfitting.
-
-### Test Mechanism
-
-This test compares the model's performance on training versus test data, grouped by feature columns. It calculates
-the difference between the training and test performance for each group and identifies regions where this
-difference exceeds a specified threshold:
-
-- The test works for both classification and regression models.
-- It defaults to using the AUC metric for classification models and the MSE metric for regression models.
-- The threshold for identifying overfitting regions is set to 0.04 by default.
-- The test calculates the performance metrics for each feature segment and plots regions where the performance gap
-exceeds the threshold.
-
-### Signs of High Risk
-
-- Significant gaps between training and test performance metrics for specific feature segments.
-- Multiple regions with performance gaps exceeding the defined threshold.
-- Higher than expected differences in predicted versus actual values in the test set compared to the training set.
-
-### Strengths
-
-- Identifies specific areas where overfitting occurs.
-- Supports multiple performance metrics, providing flexibility.
-- Applicable to both classification and regression models.
-- Visualization of overfitting segments aids in better understanding and debugging.
-
-### Limitations
-
-- The default threshold may not be suitable for all use cases and requires tuning.
-- May not capture more subtle forms of overfitting that do not exceed the threshold.
-- Assumes that the binning of features adequately represents the data segments.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/PermutationFeatureImportance.md b/site/tests/model_validation/sklearn/PermutationFeatureImportance.md
deleted file mode 100644
index 8094817c8a..0000000000
--- a/site/tests/model_validation/sklearn/PermutationFeatureImportance.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# PermutationFeatureImportance
-
-Assesses the significance of each feature in a model by evaluating the impact on model performance when feature
-values are randomly rearranged.
-
-### Purpose
-
-The Permutation Feature Importance (PFI) metric aims to assess the importance of each feature used by the Machine
-Learning model. The significance is measured by evaluating the decrease in the model's performance when the
-feature's values are randomly arranged.
-
-### Test Mechanism
-
-PFI is calculated via the `permutation_importance` method from the `sklearn.inspection` module. This method
-shuffles the columns of the feature dataset and measures the impact on the model's performance. A significant
-decrease in performance after permuting a feature's values indicates that the feature is important. On the other hand, if
-performance remains the same, the feature is likely not important. The output of the PFI metric is a figure
-illustrating the importance of each feature.
-
-### Signs of High Risk
-
-- The model heavily relies on a feature with highly variable or easily permutable values, indicating instability.
-- A feature deemed unimportant by the model but expected to have a significant effect on the outcome based on
-domain knowledge is not influencing the model's predictions.
-
-### Strengths
-
-- Provides insights into the importance of different features and may reveal underlying data structure.
-- Can indicate overfitting if a particular feature or set of features overly impacts the model's predictions.
-- Model-agnostic and can be used with any classifier that provides a measure of prediction accuracy before and
-after feature permutation.
-
-### Limitations
-
-- Does not imply causality; it only presents the amount of information that a feature provides for the prediction
-task.
-- Does not account for interactions between features. If features are correlated, the permutation importance may
-allocate importance to one and not the other.
-- Cannot interact with certain libraries like statsmodels, pytorch, catboost, etc., thus limiting its applicability.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/PopulationStabilityIndex.md b/site/tests/model_validation/sklearn/PopulationStabilityIndex.md
deleted file mode 100644
index de858878a9..0000000000
--- a/site/tests/model_validation/sklearn/PopulationStabilityIndex.md
+++ /dev/null
@@ -1,50 +0,0 @@
-# PopulationStabilityIndex
-
-Assesses the Population Stability Index (PSI) to quantify the stability of an ML model's predictions across
-different datasets.
-
-### Purpose
-
-The Population Stability Index (PSI) serves as a quantitative assessment for evaluating the stability of a machine
-learning model's output distributions when comparing two different datasets. Typically, these would be a
-development and a validation dataset or two datasets collected at different periods. The PSI provides a measurable
-indication of any significant shift in the model's performance over time or noticeable changes in the
-characteristics of the population the model is making predictions for.
-
-### Test Mechanism
-
-The implementation of the PSI in this script involves calculating the PSI for each feature between the training and
-test datasets. Data from both datasets is sorted and placed into either a predetermined number of bins or
-quantiles. The boundaries for these bins are initially determined based on the distribution of the training data.
-The contents of each bin are calculated and their respective proportions determined. Subsequently, the PSI is
-derived for each bin through a logarithmic transformation of the ratio of the proportions of data for each feature
-in the training and test datasets. The PSI, along with the proportions of data in each bin for both datasets, are
-displayed in a summary table, a grouped bar chart, and a scatter plot.
-
-### Signs of High Risk
-
-- A high PSI value is a clear indicator of high risk. Such a value suggests a significant shift in the model
-predictions or severe changes in the characteristics of the underlying population.
-- This ultimately suggests that the model may not be performing as well as expected and that it may be less
-reliable for making future predictions.
-
-### Strengths
-
-- The PSI provides a quantitative measure of the stability of a model over time or across different samples, making
-it an invaluable tool for evaluating changes in a model's performance.
-- It allows for direct comparisons across different features based on the PSI value.
-- The calculation and interpretation of the PSI are straightforward, facilitating its use in model risk management.
-- The use of visual aids such as tables and charts further simplifies the comprehension and interpretation of the
-PSI.
-
-### Limitations
-
-- The PSI test does not account for the interdependence between features: features that are dependent on one
-another may show similar shifts in their distributions, which in turn may result in similar PSI values.
-- The PSI test does not inherently provide insights into why there are differences in distributions or why the PSI
-values may have changed.
-- The test may not handle features with significant outliers adequately.
-- Additionally, the PSI test is performed on model predictions, not on the underlying data distributions, which can
-lead to misinterpretations. Any changes in PSI could be due to shifts in the model (model drift), changes in the
-relationships between features and the target variable (concept drift), or both. However, distinguishing between
-these causes is non-trivial.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/PrecisionRecallCurve.md b/site/tests/model_validation/sklearn/PrecisionRecallCurve.md
deleted file mode 100644
index 5cc9af3ca9..0000000000
--- a/site/tests/model_validation/sklearn/PrecisionRecallCurve.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# PrecisionRecallCurve
-
-Evaluates the precision-recall trade-off for binary classification models and visualizes the Precision-Recall curve.
-
-### Purpose
-
-The Precision Recall Curve metric is intended to evaluate the trade-off between precision and recall in
-classification models, particularly binary classification models. It assesses the model's capacity to produce
-accurate results (high precision), as well as its ability to capture a majority of all positive instances (high
-recall).
-
-### Test Mechanism
-
-The test extracts ground truth labels and prediction probabilities from the model's test dataset. It applies the
-`precision_recall_curve` method from the sklearn metrics module to these extracted labels and predictions, which
-computes a precision-recall pair for each possible threshold. This calculation results in an array of precision and
-recall scores that can be plotted against each other to form the Precision-Recall Curve. This curve is then
-visually represented by using Plotly's scatter plot.
-
-### Signs of High Risk
-
-- A lower area under the Precision-Recall Curve signifies high risk.
-- This corresponds to a model yielding a high amount of false positives (low precision) and/or false negatives (low
-recall).
-- If the curve is closer to the bottom left of the plot, rather than being closer to the top right corner, it can
-be a sign of high risk.
-
-### Strengths
-
-- This metric aptly represents the balance between precision (minimizing false positives) and recall (minimizing
-false negatives), which is especially critical in scenarios where both values are significant.
-- Through the graphic representation, it enables an intuitive understanding of the model's performance across
-different threshold levels.
-
-### Limitations
-
-- This metric is only applicable to binary classification models - it raises errors for multiclass classification
-models or Foundation models.
-- It may not fully represent the overall accuracy of the model if the cost of false positives and false negatives
-are extremely different, or if the dataset is heavily imbalanced.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/ROCCurve.md b/site/tests/model_validation/sklearn/ROCCurve.md
deleted file mode 100644
index e16f5f0e6e..0000000000
--- a/site/tests/model_validation/sklearn/ROCCurve.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# ROCCurve
-
-Evaluates binary classification model performance by generating and plotting the Receiver Operating Characteristic
-(ROC) curve and calculating the Area Under Curve (AUC) score.
-
-### Purpose
-
-The Receiver Operating Characteristic (ROC) curve is designed to evaluate the performance of binary classification
-models. This curve illustrates the balance between the True Positive Rate (TPR) and False Positive Rate (FPR)
-across various threshold levels. In combination with the Area Under the Curve (AUC), the ROC curve aims to measure
-the model's discrimination ability between the two defined classes in a binary classification problem (e.g.,
-default vs non-default). Ideally, a higher AUC score signifies superior model performance in accurately
-distinguishing between the positive and negative classes.
-
-### Test Mechanism
-
-First, this script selects the target model and datasets that require binary classification. It then calculates the
-predicted probabilities for the test set, and uses this data, along with the true outcomes, to generate and plot
-the ROC curve. Additionally, it includes a line signifying randomness (AUC of 0.5). The AUC score for the model's
-ROC curve is also computed, presenting a numerical estimation of the model's performance. If any infinite values
-are detected in the ROC thresholds, they are removed. The resulting ROC curve, AUC score, and
-thresholds are consequently saved for future reference.
-
-### Signs of High Risk
-
-- A high risk is potentially linked to the model's performance if the AUC score drops below or nears 0.5.
-- Another warning sign would be the ROC curve lying closer to the line of randomness, indicating no discriminative
-ability.
-- For the model to be deemed competent at its classification tasks, it is crucial that the AUC score is
-significantly above 0.5.
-
-### Strengths
-
-- The ROC Curve offers an inclusive visual depiction of a model's discriminative power throughout all conceivable
-classification thresholds, unlike other metrics that solely disclose model performance at one fixed threshold.
-- Regardless of the class proportions in the dataset, the AUC score, which summarizes the entire ROC curve as a
-single value, remains consistent, making it well suited to datasets with uneven class proportions.
-
-### Limitations
-
-- The primary limitation is that this test is exclusively structured for binary classification tasks, thus limiting
-its application towards other model types.
-- Furthermore, its performance might be subpar with models that output probabilities highly skewed towards 0 or 1.
-- At the extreme, the ROC curve could reflect high performance even when the majority of classifications are
-incorrect, provided that the model's ranking format is retained. This phenomenon is commonly termed the "Class
-Imbalance Problem".
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/RegressionErrors.md b/site/tests/model_validation/sklearn/RegressionErrors.md
deleted file mode 100644
index 3585c6dd3c..0000000000
--- a/site/tests/model_validation/sklearn/RegressionErrors.md
+++ /dev/null
@@ -1,45 +0,0 @@
-# RegressionErrors
-
-Assesses the performance and error distribution of a regression model using various error metrics.
-
-### Purpose
-
-The purpose of the Regression Errors test is to measure the performance of a regression model by calculating
-several error metrics. This evaluation helps determine the model's accuracy and potential issues like overfitting
-or bias by analyzing differences in error metrics between the training and testing datasets.
-
-### Test Mechanism
-
-The test computes the following error metrics:
-- **Mean Absolute Error (MAE)**: Average of the absolute differences between true values and predicted values.
-- **Mean Squared Error (MSE)**: Average of the squared differences between true values and predicted values.
-- **Root Mean Squared Error (RMSE)**: Square root of the mean squared error.
-- **Mean Absolute Percentage Error (MAPE)**: Average of the absolute differences between true values and predicted
-values, divided by the true values, and expressed as a percentage.
-- **Mean Bias Deviation (MBD)**: Average bias between true values and predicted values.
-
-These metrics are calculated separately for the training and testing datasets and compared to identify
-discrepancies.
-
-### Signs of High Risk
-
-- High values for MAE, MSE, RMSE, or MAPE indicating poor model performance.
-- Large differences in error metrics between the training and testing datasets, suggesting overfitting.
-- Significant deviation of MBD from zero, indicating systematic bias in model predictions.
-
-### Strengths
-
-- Provides a comprehensive overview of model performance through multiple error metrics.
-- Individual metrics offer specific insights, e.g., MAE for interpretability, MSE for emphasizing larger errors.
-- RMSE is useful for being in the same unit as the target variable.
-- MAPE allows the error to be expressed as a percentage.
-- MBD detects systematic bias in model predictions.
-
-### Limitations
-
-- MAE and MSE are sensitive to outliers.
-- RMSE heavily penalizes larger errors, which might not always be desirable.
-- MAPE can be misleading when actual values are near zero.
-- MBD may not be suitable if bias varies with the magnitude of actual values.
-- These metrics may not capture all nuances of model performance and should be interpreted with domain-specific
-context.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/RegressionErrorsComparison.md b/site/tests/model_validation/sklearn/RegressionErrorsComparison.md
deleted file mode 100644
index 93522eaa14..0000000000
--- a/site/tests/model_validation/sklearn/RegressionErrorsComparison.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# RegressionErrorsComparison
-
-Assesses multiple regression error metrics to compare model performance across different datasets, emphasizing
-systematic overestimation or underestimation and large percentage errors.
-
-### Purpose
-
-The purpose of this test is to compare regression errors for different models applied to various datasets. It aims
-to examine model performance using multiple error metrics, thereby identifying areas where models may be
-underperforming or exhibiting bias.
-
-### Test Mechanism
-
-The function iterates through each dataset-model pair and calculates various error metrics, including Mean Absolute
-Error (MAE), Mean Squared Error (MSE), Mean Absolute Percentage Error (MAPE), and Mean Bias Deviation (MBD). The
-results are summarized in a table, which provides a comprehensive view of each model's performance on the datasets.
-
-### Signs of High Risk
-
-- High Mean Absolute Error (MAE) or Mean Squared Error (MSE), indicating poor model performance.
-- High Mean Absolute Percentage Error (MAPE), suggesting large percentage errors, especially problematic if the
-true values are small.
-- Mean Bias Deviation (MBD) significantly different from zero, indicating systematic overestimation or
-underestimation by the model.
-
-### Strengths
-
-- Provides multiple error metrics to assess model performance from different perspectives.
-- Includes a check to avoid division by zero when calculating MAPE.
-
-### Limitations
-
-- Assumes that the dataset is provided as a DataFrameDataset object with `y`, `y_pred`, and `feature_columns`
-attributes.
-- Relies on the `logger` from `validmind.logging` to warn about zero values in `y_true`, which should be correctly
-implemented and imported.
-- Requires that `dataset.y_pred(model)` returns the predicted values for the model.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/RegressionPerformance.md b/site/tests/model_validation/sklearn/RegressionPerformance.md
deleted file mode 100644
index 41ddde045c..0000000000
--- a/site/tests/model_validation/sklearn/RegressionPerformance.md
+++ /dev/null
@@ -1,32 +0,0 @@
-# RegressionPerformance
-
-Evaluates the performance of a regression model using five different metrics: MAE, MSE, RMSE, MAPE, and MBD.
-
-### Purpose
-
-The Regression Performance test is used to measure the performance of regression models. It
-calculates multiple evaluation metrics, including Mean Absolute Error (MAE), Mean Squared Error (MSE),
-Root Mean Squared Error (RMSE), Mean Absolute Percentage Error (MAPE), and Mean Bias Deviation (MBD), thereby
-enabling a comprehensive view of model performance.
-
-### Test Mechanism
-
-The test uses the sklearn library to calculate the MAE, MSE, RMSE, MAPE, and MBD. These calculations encapsulate both
-the direction and the magnitude of error in predictions, thereby providing a multi-faceted view of model accuracy.
-
-### Signs of High Risk
-
-- High values of MAE, MSE, RMSE, and MAPE, which indicate a high error rate and imply a larger departure of the
-model's predictions from the true values.
-- A large value of MBD, which shows a consistent bias in the model’s predictions.
-
-### Strengths
-
-- The metric evaluates models on five different metrics offering a comprehensive analysis of model performance.
-- It is designed to handle regression tasks and can be seamlessly integrated with libraries like sklearn.
-
-### Limitations
-
-- The metric only evaluates regression models and does not evaluate classification models.
-- The test assumes that the models have been trained and tested appropriately prior to evaluation. It does not
-handle pre-processing, feature selection, or other stages in the model lifecycle.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/RegressionR2Square.md b/site/tests/model_validation/sklearn/RegressionR2Square.md
deleted file mode 100644
index 72c1c49b10..0000000000
--- a/site/tests/model_validation/sklearn/RegressionR2Square.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# RegressionR2Square
-
-Assesses the overall goodness-of-fit of a regression model by evaluating R-squared (R2) and Adjusted R-squared (Adj
-R2) scores to determine the model's explanatory power over the dependent variable.
-
-### Purpose
-
-The purpose of the RegressionR2Square Metric test is to measure the overall goodness-of-fit of a regression model.
-Specifically, this Python-based test evaluates the R-squared (R2) and Adjusted R-squared (Adj R2) scores, which are
-statistical measures used to assess the strength of the relationship between the model's predictors and the
-response variable.
-
-### Test Mechanism
-
-The test deploys the `r2_score` method from the Scikit-learn metrics module to measure the R2 score on both
-training and test sets. This score reflects the proportion of the variance in the dependent variable that is
-predictable from the independent variables. The test also calculates the Adjusted R2 score, which accounts for the
-number of predictors in the model to penalize model complexity and reduce overfitting. The Adjusted R2 score will
-be smaller if unnecessary predictors are included in the model.
-
-### Signs of High Risk
-
-- Low R2 or Adjusted R2 scores, suggesting that the model does not explain much variation in the dependent variable.
-- Significant discrepancy between R2 scores on the training set and test set, indicating overfitting and poor
-generalization to unseen data.
-
-### Strengths
-
-- Widely-used measure in regression analysis, providing a sound general indication of model performance.
-- Easy to interpret and understand, as it represents the proportion of the dependent variable's variance explained
-by the independent variables.
-- Adjusted R2 score helps control overfitting by penalizing unnecessary predictors.
-
-### Limitations
-
-- Sensitive to the inclusion of unnecessary predictors even though Adjusted R2 penalizes complexity.
-- Less reliable in cases of non-linear relationships or when the underlying assumptions of linear regression are
-violated.
-- Does not provide insight on whether the correct regression model was used or if key assumptions have been met.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/RegressionR2SquareComparison.md b/site/tests/model_validation/sklearn/RegressionR2SquareComparison.md
deleted file mode 100644
index e71d116442..0000000000
--- a/site/tests/model_validation/sklearn/RegressionR2SquareComparison.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# RegressionR2SquareComparison
-
-Compares R-Squared and Adjusted R-Squared values for different regression models across multiple datasets to assess
-model performance and relevance of features.
-
-### Purpose
-
-The Regression R2 Square Comparison test aims to compare the R-Squared and Adjusted R-Squared values for different
-regression models across various datasets. It helps in assessing how well each model explains the variability in
-the dataset, and whether the models include irrelevant features.
-
-### Test Mechanism
-
-This test operates by:
-
-- Iterating through each dataset-model pair.
-- Calculating the R-Squared values to measure how much of the variability in the dataset is explained by the model.
-- Calculating the Adjusted R-Squared values, which adjust the R-Squared based on the number of predictors in the
-model, making it more reliable when comparing models with different numbers of features.
-- Generating a summary table containing these values for each combination of dataset and model.
-
-### Signs of High Risk
-
-- If the R-Squared values are significantly low, it indicates the model isn't explaining much of the variability in
-the dataset.
-- A significant difference between R-Squared and Adjusted R-Squared values might indicate that the model includes
-irrelevant features.
-
-### Strengths
-
-- Provides a quantitative measure of model performance in terms of variance explained.
-- Adjusted R-Squared accounts for the number of predictors, making it a more reliable measure when comparing models
-with different numbers of features.
-- Useful for time-series forecasting and regression tasks.
-
-### Limitations
-
-- Assumes the dataset is provided as a DataFrameDataset object with `y`, `y_pred`, and `feature_columns` attributes.
-- Relies on `adj_r2_score` from the `statsmodels.statsutils` module, which needs to be correctly implemented and
-imported.
-- Requires that `dataset.y_pred(model)` returns the predicted values for the model.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/RobustnessDiagnosis.md b/site/tests/model_validation/sklearn/RobustnessDiagnosis.md
deleted file mode 100644
index 1f9fb63ebf..0000000000
--- a/site/tests/model_validation/sklearn/RobustnessDiagnosis.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# RobustnessDiagnosis
-
-Assesses the robustness of a machine learning model by evaluating performance decay under noisy conditions.
-
-### Purpose
-
-The Robustness Diagnosis test aims to evaluate the resilience of a machine learning model when subjected to
-perturbations or noise in its input data. This is essential for understanding the model's ability to handle
-real-world scenarios where data may be imperfect or corrupted.
-
-### Test Mechanism
-
-This test introduces Gaussian noise to the numeric input features of the datasets at varying scales of standard
-deviation. The performance of the model is then measured using a specified metric. The process includes:
-
-- Adding Gaussian noise to numerical input features based on scaling factors.
-- Evaluating the model's performance on the perturbed data using metrics like AUC for classification tasks and MSE
-for regression tasks.
-- Aggregating and plotting the results to visualize performance decay relative to perturbation size.
-
-### Signs of High Risk
-
-- A significant drop in performance metrics with minimal noise.
-- Performance decay values exceeding the specified threshold.
-- Consistent failure to meet performance standards across multiple perturbation scales.
-
-### Strengths
-
-- Provides insights into the model's robustness against noisy or corrupted data.
-- Utilizes a variety of performance metrics suitable for both classification and regression tasks.
-- Visualization helps in understanding the extent of performance degradation.
-
-### Limitations
-
-- Gaussian noise might not adequately represent all types of real-world data perturbations.
-- Performance thresholds are somewhat arbitrary and might need tuning.
-- The test may not account for more complex or unstructured noise patterns that could affect model robustness.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/SHAPGlobalImportance.md b/site/tests/model_validation/sklearn/SHAPGlobalImportance.md
deleted file mode 100644
index 3a0cc6458e..0000000000
--- a/site/tests/model_validation/sklearn/SHAPGlobalImportance.md
+++ /dev/null
@@ -1,44 +0,0 @@
-# SHAPGlobalImportance
-
-Evaluates and visualizes global feature importance using SHAP values for model explanation and risk identification.
-
-### Purpose
-
-The SHAP (SHapley Additive exPlanations) Global Importance metric aims to elucidate model outcomes by attributing
-them to the contributing features. It assigns a quantifiable global importance to each feature via their respective
-absolute Shapley values, thereby making it suitable for tasks like classification (both binary and multiclass).
-This metric forms an essential part of model risk management.
-
-### Test Mechanism
-
-The test begins with the selection of a suitable explainer which aligns with the model's type. For tree-based
-models like XGBClassifier, RandomForestClassifier, CatBoostClassifier, TreeExplainer is used whereas for linear
-models like LogisticRegression, XGBRegressor, LinearRegression, it is the LinearExplainer. Once the explainer
-calculates the Shapley values, these values are visualized using two specific graphical representations:
-
-1. Mean Importance Plot: This graph portrays the significance of individual features based on their absolute
-Shapley values. It calculates the average of these absolute Shapley values across all instances to highlight the
-global importance of features.
-
-2. Summary Plot: This visual tool combines the feature importance with their effects. Every dot on this chart
-represents a Shapley value for a certain feature in a specific case. The vertical axis is denoted by the feature
-whereas the horizontal one corresponds to the Shapley value. A color gradient indicates the value of the feature,
-gradually changing from low to high. Features are systematically organized in accordance with their importance.
-
-### Signs of High Risk
-
-- Overemphasis on certain features in SHAP importance plots, thus hinting at the possibility of model overfitting
-- Anomalies such as unexpected or illogical features showing high importance, which might suggest that the model's
-decisions are rooted in incorrect or undesirable reasoning
-- A SHAP summary plot filled with high variability or scattered data points, indicating a cause for concern
-
-### Strengths
-
-- SHAP does more than just illustrate global feature significance; it offers a detailed perspective on how
-different features shape the model's decision-making logic for each instance.
-- It provides clear insights into model behavior.
-
-### Limitations
-
-- High-dimensional data can complicate interpretations.
-- Associating importance with tangible real-world impact still involves a certain degree of subjectivity.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/ScoreProbabilityAlignment.md b/site/tests/model_validation/sklearn/ScoreProbabilityAlignment.md
deleted file mode 100644
index 055f90c7ef..0000000000
--- a/site/tests/model_validation/sklearn/ScoreProbabilityAlignment.md
+++ /dev/null
@@ -1,50 +0,0 @@
-# ScoreProbabilityAlignment
-
-Analyzes the alignment between credit scores and predicted probabilities.
-
-### Purpose
-
-The Score-Probability Alignment test evaluates how well credit scores align with
-predicted default probabilities. This helps validate score scaling, identify potential
-calibration issues, and ensure scores reflect risk appropriately.
-
-### Test Mechanism
-
-The test:
-1. Groups scores into bins
-2. Calculates average predicted probability per bin
-3. Tests monotonicity of relationship
-4. Analyzes probability distribution within score bands
-
-### Signs of High Risk
-
-- Non-monotonic relationship between scores and probabilities
-- Large probability variations within score bands
-- Unexpected probability jumps between adjacent bands
-- Poor alignment with expected odds-to-score relationship
-- Inconsistent probability patterns across score ranges
-- Clustering of probabilities at extreme values
-- Score bands with similar probability profiles
-- Unstable probability estimates in key decision bands
-
-### Strengths
-
-- Direct validation of score-to-probability relationship
-- Identifies potential calibration issues
-- Supports score band validation
-- Helps understand model behavior
-- Useful for policy setting
-- Visual and numerical results
-- Easy to interpret
-- Supports regulatory documentation
-
-### Limitations
-
-- Sensitive to bin selection
-- Requires sufficient data per bin
-- May mask within-bin variations
-- Point-in-time analysis only
-- Cannot detect all forms of miscalibration
-- Assumes scores should align with probabilities
-- May oversimplify complex relationships
-- Limited to binary outcomes
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/SilhouettePlot.md b/site/tests/model_validation/sklearn/SilhouettePlot.md
deleted file mode 100644
index 313420f6c6..0000000000
--- a/site/tests/model_validation/sklearn/SilhouettePlot.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# SilhouettePlot
-
-Calculates and visualizes Silhouette Score, assessing the degree of data point suitability to its cluster in ML
-models.
-
-### Purpose
-
-This test calculates the Silhouette Score, which is a model performance metric used in clustering applications.
-Primarily, the Silhouette Score evaluates how similar a data point is to its own cluster compared to other
-clusters. The metric ranges between -1 and 1, where a high value indicates that the object is well matched to its
-own cluster and poorly matched to neighboring clusters. Thus, the goal is to achieve a high Silhouette Score,
-implying well-separated clusters.
-
-### Test Mechanism
-
-The test first extracts the true and predicted labels from the model's training data. The test runs the Silhouette
-Score function, which takes as input the training dataset features and the predicted labels, subsequently
-calculating the average score. This average Silhouette Score is printed for reference. The script then calculates
-the silhouette coefficients for each data point, helping to form the Silhouette Plot. Each cluster is represented
-in this plot, with color distinguishing between different clusters. A red dashed line indicates the average
-Silhouette Score. The Silhouette Scores are also collected into a structured table, facilitating model performance
-analysis and comparison.
-
-### Signs of High Risk
-
-- A low Silhouette Score, potentially indicating that the clusters are not well separated and that data points may
-not be fitting well to their respective clusters.
-- A Silhouette Plot that shows overlapping clusters or lacks clear visual separation between clusters also
-suggests poor clustering performance.
-
-### Strengths
-
-- The Silhouette Score provides a clear and quantitative measure of how well data points have been grouped into
-clusters, offering insights into model performance.
-- The Silhouette Plot provides an intuitive, graphical representation of the clustering mechanism, aiding visual
-assessments of model performance.
-- It does not require ground truth labels, so it's useful when true cluster assignments are not known.
-
-### Limitations
-
-- The Silhouette Score may be susceptible to the influence of outliers, which could impact its accuracy and
-reliability.
-- It assumes the clusters are convex and isotropic, which might not be the case with complex datasets.
-- Due to the average nature of the Silhouette Score, the metric does not account for individual data point
-assignment nuances, so potentially relevant details may be omitted.
-- Computationally expensive for large datasets, as it requires pairwise distance computations.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/TrainingTestDegradation.md b/site/tests/model_validation/sklearn/TrainingTestDegradation.md
deleted file mode 100644
index 5bd3f2dac6..0000000000
--- a/site/tests/model_validation/sklearn/TrainingTestDegradation.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# TrainingTestDegradation
-
-Tests if model performance degradation between training and test datasets exceeds a predefined threshold.
-
-### Purpose
-
-The `TrainingTestDegradation` class serves as a test to verify that the degradation in performance between the
-training and test datasets does not exceed a predefined threshold. This test measures the model's ability to
-generalize from its training data to unseen test data, assessing key classification metrics such as precision,
-recall, and f1 score to verify the model's robustness and reliability.
-
-### Test Mechanism
-
-The code applies several predefined metrics, including precision, recall, and f1 scores, to the model's
-predictions for both the training and test datasets. It calculates the degradation as the difference between the
-training score and test score divided by the training score. The test is considered successful if the degradation
-for each metric is less than the preset maximum threshold (default: 0.10). The results are summarized in a table
-showing each metric's train score, test score, degradation percentage, and pass/fail status.
-
-### Signs of High Risk
-
-- A degradation percentage that exceeds the maximum allowed threshold of 10% for any of the evaluated metrics.
-- A high difference or gap between the metric scores on the training and the test datasets.
-- The 'Pass/Fail' column displaying 'Fail' for any of the evaluated metrics.
-
-### Strengths
-
-- Provides a quantitative measure of the model's ability to generalize to unseen data, which is key for predicting
-its practical real-world performance.
-- By evaluating multiple metrics, it takes into account different facets of model performance and enables a more
-holistic evaluation.
-- The use of a variable predefined threshold allows the flexibility to adjust the acceptability criteria for
-different scenarios.
-
-### Limitations
-
-- The test compares raw performance on training and test data but does not factor in the nature of the data. Areas
-with less representation in the training set might still perform poorly on unseen data.
-- It requires good coverage and balance in the test and training datasets to produce reliable results, which may
-not always be available.
-- The test is currently only designed for classification tasks.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/VMeasure.md b/site/tests/model_validation/sklearn/VMeasure.md
deleted file mode 100644
index 65bcb27ab0..0000000000
--- a/site/tests/model_validation/sklearn/VMeasure.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# VMeasure
-
-Evaluates homogeneity and completeness of a clustering model using the V Measure Score.
-
-### Purpose
-
-The purpose of this metric, V Measure Score (V Score), is to evaluate the performance of a clustering model. It
-measures the homogeneity and completeness of a set of cluster labels, where homogeneity refers to each cluster
-containing only members of a single class and completeness meaning all members of a given class are assigned to the
-same cluster.
-
-### Test Mechanism
-
-ClusterVMeasure is a class that inherits from another class, ClusterPerformance. It uses the `v_measure_score`
-function from the sklearn module's metrics package. The required inputs to perform this metric are the model, train
-dataset, and test dataset. The test is appropriate for models tasked with clustering.
-
-### Signs of High Risk
-
-- Low V Measure Score: A low V Measure Score indicates that the clustering model has poor homogeneity or
-completeness, or both. This might signal that the model is failing to correctly cluster the data.
-
-### Strengths
-
-- The V Measure Score is a harmonic mean between homogeneity and completeness. This ensures that both attributes
-are taken into account when evaluating the model, providing an overall measure of its cluster validity.
-- The metric does not require knowledge of the ground truth classes when measuring homogeneity and completeness,
-making it applicable in instances where such information is unavailable.
-
-### Limitations
-
-- The V Measure Score can be influenced by the number of clusters, which means that it might not always reflect the
-quality of the clustering. Partitioning the data into many small clusters could lead to high homogeneity but low
-completeness, leading to a low V Measure Score even if the clustering might be useful.
-- It assumes equal importance of homogeneity and completeness. In some applications, one may be more important than
-the other. The V Measure Score does not provide flexibility in assigning different weights to homogeneity and
-completeness.
\ No newline at end of file
diff --git a/site/tests/model_validation/sklearn/WeakspotsDiagnosis.md b/site/tests/model_validation/sklearn/WeakspotsDiagnosis.md
deleted file mode 100644
index 5189a401cc..0000000000
--- a/site/tests/model_validation/sklearn/WeakspotsDiagnosis.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# WeakspotsDiagnosis
-
-Identifies and visualizes weak spots in a machine learning model's performance across various sections of the
-feature space.
-
-### Purpose
-
-The weak spots test is applied to evaluate the performance of a machine learning model within specific regions of
-its feature space. This test slices the feature space into various sections, evaluating the model's outputs within
-each section against specific performance metrics (e.g., accuracy, precision, recall, and F1 scores). The ultimate
-aim is to identify areas where the model's performance falls below the set thresholds, thereby exposing its
-possible weaknesses and limitations.
-
-### Test Mechanism
-
-The test mechanism adopts an approach of dividing the feature space of the training dataset into numerous bins. The
-model's performance metrics (accuracy, precision, recall, F1 scores) are then computed for each bin on both the
-training and test datasets. A "weak spot" is identified if any of the performance metrics fall below a
-predetermined threshold for a particular bin on the test dataset. The test results are visually plotted as bar
-charts for each performance metric, indicating the bins which fail to meet the established threshold.
-
-### Signs of High Risk
-
-- Any performance metric of the model dropping below the set thresholds.
-- Significant disparity in performance between the training and test datasets within a bin could be an indication
-of overfitting.
-- Regions or slices with consistently low performance metrics. Such instances could mean that the model struggles
-to handle specific types of input data adequately, resulting in potentially inaccurate predictions.
-
-### Strengths
-
-- The test helps pinpoint precise regions of the feature space where the model's performance is below par, allowing
-for more targeted improvements to the model.
-- The graphical presentation of the performance metrics offers an intuitive way to understand the model's
-performance across different feature areas.
-- The test exhibits flexibility, letting users set different thresholds for various performance metrics according
-to the specific requirements of the application.
-
-### Limitations
-
-- The binning system utilized for the feature space in the test could over-simplify the model's behavior within
-each bin. The granularity of this slicing depends on the chosen 'bins' parameter and can sometimes be arbitrary.
-- The effectiveness of this test largely hinges on the selection of thresholds for the performance metrics, which
-may not be universally applicable and may depend on the specifics of a particular model and
-application.
-- The test is unable to handle datasets with a text column, limiting its application to numerical or categorical
-data types only.
-- Despite its usefulness in highlighting problematic regions, the test does not offer direct suggestions for model
-improvement.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/AutoARIMA.md b/site/tests/model_validation/statsmodels/AutoARIMA.md
deleted file mode 100644
index 85fcd89f15..0000000000
--- a/site/tests/model_validation/statsmodels/AutoARIMA.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# AutoARIMA
-
-Evaluates ARIMA models for time-series forecasting, ranking them using Bayesian and Akaike Information Criteria.
-
-### Purpose
-
-The AutoARIMA validation test is designed to evaluate and rank AutoRegressive Integrated Moving Average (ARIMA)
-models. These models are primarily used for forecasting time-series data. The validation test automatically fits
-multiple ARIMA models, with varying parameters, to every variable within the given dataset. The models are then
-ranked based on their Bayesian Information Criterion (BIC) and Akaike Information Criterion (AIC) values, which
-provide a basis for the efficient model selection process.
-
-### Test Mechanism
-
-This metric proceeds by generating an array of feasible combinations of ARIMA model parameters which are within a
-prescribed limit. These limits include `max_p`, `max_d`, `max_q`; they represent the autoregressive, differencing,
-and moving average components respectively. Upon applying these sets of parameters, the validation test fits each
-ARIMA model to the time-series data provided. For each model, it subsequently proceeds to calculate and record both
-the BIC and AIC values, which serve as performance indicators for the model fit. Prior to this parameter fitting
-process, the Augmented Dickey-Fuller test for data stationarity is conducted on the data series. If a series is
-found to be non-stationary, a warning message is sent out, given that ARIMA models necessitate input series to be
-stationary.
-
-### Signs of High Risk
-
-- If the p-value of the Augmented Dickey-Fuller test for a variable exceeds 0.05, a warning is logged. This warning
-indicates that the series might not be stationary, leading to potentially inaccurate results.
-- Consistent failure in fitting ARIMA models (as made evident through logged errors) might indicate issues with
-either the data or model stability.
-
-### Strengths
-
-- The AutoARIMA validation test simplifies the often complex task of selecting the most suitable ARIMA model based
-on BIC and AIC criteria.
-- The mechanism incorporates a check for non-stationarity within the data, which is a critical prerequisite for
-ARIMA models.
-- The exhaustive search through all possible combinations of model parameters enhances the likelihood of
-identifying the best-fit model.
-
-### Limitations
-
-- This validation test can be computationally costly as it involves creating and fitting multiple ARIMA models for
-every variable.
-- Although the test checks for non-stationarity and logs warnings where present, it does not apply any
-transformations to the data to establish stationarity.
-- The selection of models leans solely on BIC and AIC criteria, which may not yield the best predictive model in
-all scenarios.
-- The test is only applicable to regression tasks involving time-series data, and may not work effectively for
-other types of machine learning tasks.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/CumulativePredictionProbabilities.md b/site/tests/model_validation/statsmodels/CumulativePredictionProbabilities.md
deleted file mode 100644
index 9e609c8a4d..0000000000
--- a/site/tests/model_validation/statsmodels/CumulativePredictionProbabilities.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# CumulativePredictionProbabilities
-
-Visualizes cumulative probabilities of positive and negative classes in classification models.
-
-### Purpose
-
-This metric is utilized to evaluate the distribution of predicted probabilities for positive and negative classes
-in a classification model. It provides a visual assessment of the model's behavior by plotting the cumulative
-probabilities for positive and negative classes within the provided dataset.
-
-### Test Mechanism
-
-The classification model is evaluated by first computing the predicted probabilities for each instance in the
-dataset, which are then added as a new column. The cumulative probabilities for positive and negative classes are
-subsequently calculated and sorted in ascending order. Cumulative distributions of these probabilities are created
-for both positive and negative classes. These cumulative probabilities are represented visually in a plot with lines
-representing cumulative distributions of positive and negative classes.
-
-### Signs of High Risk
-
-- Imbalanced distribution of probabilities for either positive or negative classes.
-- Marked discrepancies or large differences between the cumulative probability distributions for positive and
-negative classes.
-- Unusual patterns in the cumulative probability distributions that may indicate model calibration issues.
-
-### Strengths
-
-- Provides a visual illustration of data, which enhances the ease of understanding and interpreting the model's
-behavior.
-- Differentiates between positive and negative classes and their respective distribution patterns, aiding in
-problem diagnosis.
-- Helps identify potential calibration issues by visualizing how probabilities are distributed across classes.
-
-### Limitations
-
-- Exclusive to classification tasks and specifically to classification models.
-- Graphical results necessitate human interpretation and may not be directly applicable for automated risk
-detection.
-- The method does not give a single quantifiable measure of model risk; instead, it offers a visual
-representation and broad distributional information.
-- If the dataset is not representative of the overall data distribution, the metric could provide misleading results.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/DurbinWatsonTest.md b/site/tests/model_validation/statsmodels/DurbinWatsonTest.md
deleted file mode 100644
index 7bec1cf5b5..0000000000
--- a/site/tests/model_validation/statsmodels/DurbinWatsonTest.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# DurbinWatsonTest
-
-Assesses autocorrelation in time series data features using the Durbin-Watson statistic.
-
-### Purpose
-
-The Durbin-Watson Test metric detects autocorrelation in time series data (where data values are correlated with
-their predecessors). Autocorrelation is a crucial factor for regression tasks as these often assume the
-independence of residuals. A model with significant autocorrelation may give unreliable predictions.
-
-### Test Mechanism
-
-Utilizing the `durbin_watson` function in the `statsmodels` Python library, the Durbin-Watson (DW) Test metric
-generates a statistical value for each feature of the training dataset. The function is looped over all columns of
-the dataset, calculating and caching the DW value for each column for further analysis. A DW metric value nearing 2
-indicates no autocorrelation. Conversely, values approaching 0 suggest positive autocorrelation, and those leaning
-towards 4 imply negative autocorrelation.
-
-### Signs of High Risk
-
-- If a feature's DW value significantly deviates from 2, it could signal a high risk due to potential
-autocorrelation issues in the dataset.
-- A value closer to 0 could imply positive autocorrelation, while a value nearer to 4 could point to negative
-autocorrelation, both leading to potentially unreliable prediction models.
-
-### Strengths
-
-- The metric specializes in identifying autocorrelation in prediction model residuals.
-- Autocorrelation detection assists in diagnosing violation of various modeling technique assumptions, particularly
-in regression analysis and time-series data modeling.
-
-### Limitations
-
-- The Durbin-Watson Test mainly detects linear autocorrelation and could overlook other types of relationships.
-- The metric is highly sensitive to the order of data points. Shuffling them could lead to notably different results.
-- The test only checks for first-order autocorrelation (between a variable and its immediate predecessor) and fails
-to detect higher-order autocorrelation.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/GINITable.md b/site/tests/model_validation/statsmodels/GINITable.md
deleted file mode 100644
index 0e571bcf10..0000000000
--- a/site/tests/model_validation/statsmodels/GINITable.md
+++ /dev/null
@@ -1,49 +0,0 @@
-# GINITable
-
-Evaluates classification model performance using AUC, GINI, and KS metrics for training and test datasets.
-
-### Purpose
-
-The 'GINITable' metric is designed to evaluate the performance of a classification model by emphasizing its
-discriminatory power. Specifically, it calculates and presents three important metrics - the Area under the ROC
-Curve (AUC), the GINI coefficient, and the Kolmogorov-Smirnov (KS) statistic - for both training and test datasets.
-
-### Test Mechanism
-
-Using a dictionary for storing performance metrics for both the training and test datasets, the 'GINITable' metric
-calculates each of these metrics sequentially. The Area under the ROC Curve (AUC) is calculated via the
-`roc_auc_score` function from the Scikit-Learn library. The GINI coefficient, a measure of statistical dispersion,
-is then computed by doubling the AUC and subtracting 1. Finally, the Kolmogorov-Smirnov (KS) statistic is
-calculated via the `roc_curve` function from Scikit-Learn, with the False Positive Rate (FPR) subtracted from the
-True Positive Rate (TPR) and the maximum value taken from the resulting data. These metrics are then stored in a
-pandas DataFrame for convenient visualization.
-
-### Signs of High Risk
-
-- Low values for performance metrics may suggest a reduction in model performance, particularly a low AUC which
-indicates poor classification performance, or a low GINI coefficient, which could suggest a decreased ability to
-discriminate different classes.
-- A high KS value may be an indicator of potential overfitting, as this generally signifies a substantial
-divergence between positive and negative distributions.
-- Significant discrepancies between the performance on the training dataset and the test dataset may present
-another signal of high risk.
-
-### Strengths
-
-- Offers three key performance metrics (AUC, GINI, and KS) in one test, providing a more comprehensive evaluation
-of the model.
-- Provides a direct comparison between the model's performance on training and testing datasets, which aids in
-identifying potential underfitting or overfitting.
-- The applied metrics are class-distribution invariant, thereby remaining effective for evaluating model
-performance even when dealing with imbalanced datasets.
-- Presents the metrics in a user-friendly table format for easy comprehension and analysis.
-
-### Limitations
-
-- The GINI coefficient is derived directly from the AUC value, and the KS statistic is computed from the same ROC
-curve. Therefore, any errors in the underlying ROC calculation will adversely impact all three metrics.
-- Mainly suited for binary classification models and may require modifications for effective application in
-multi-class scenarios.
-- The metrics used are threshold-dependent and may exhibit high variability based on the chosen cut-off points.
-- The test does not incorporate a method to efficiently handle missing or inefficiently processed data, which could
-lead to inaccuracies in the metrics if the data is not appropriately preprocessed.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/KolmogorovSmirnov.md b/site/tests/model_validation/statsmodels/KolmogorovSmirnov.md
deleted file mode 100644
index f697481716..0000000000
--- a/site/tests/model_validation/statsmodels/KolmogorovSmirnov.md
+++ /dev/null
@@ -1,35 +0,0 @@
-# KolmogorovSmirnov
-
-Assesses whether each feature in the dataset aligns with a normal distribution using the Kolmogorov-Smirnov test.
-
-### Purpose
-
-The Kolmogorov-Smirnov (KS) test evaluates the distribution of features in a dataset to determine their alignment
-with a normal distribution. This is important because many statistical methods and machine learning models assume
-normality in the data distribution.
-
-### Test Mechanism
-
-This test calculates the KS statistic and corresponding p-value for each feature in the dataset. It does so by
-comparing the cumulative distribution function of the feature with an ideal normal distribution. The KS statistic
-and p-value for each feature are then stored in a dictionary. The p-value threshold to reject the normal
-distribution hypothesis is not preset, providing flexibility for different applications.
-
-### Signs of High Risk
-
-- Elevated KS statistic for a feature combined with a low p-value, indicating a significant divergence from a
-normal distribution.
-- Features with notable deviations that could create problems if the model assumes normality in data distribution.
-
-### Strengths
-
-- The KS test is sensitive to differences in the location and shape of empirical cumulative distribution functions.
-- It is non-parametric and adaptable to various datasets, as it does not assume any specific data distribution.
-- Provides detailed insights into the distribution of individual features.
-
-### Limitations
-
-- The test's sensitivity to disparities in the tails of data distribution might cause false alarms about
-non-normality.
-- Less effective for multivariate distributions, as it is designed for univariate distributions.
-- Does not identify specific types of non-normality, such as skewness or kurtosis, which could impact model fitting.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/Lilliefors.md b/site/tests/model_validation/statsmodels/Lilliefors.md
deleted file mode 100644
index a6b6e17cd8..0000000000
--- a/site/tests/model_validation/statsmodels/Lilliefors.md
+++ /dev/null
@@ -1,45 +0,0 @@
-# Lilliefors
-
-Assesses the normality of feature distributions in an ML model's training dataset using the Lilliefors test.
-
-### Purpose
-
-The purpose of this metric is to utilize the Lilliefors test, named in honor of the American statistician Hubert
-Lilliefors, in order to assess whether the features of the machine learning model's training dataset conform to a
-normal distribution. This is done because the assumption of normal distribution plays a vital role in numerous
-statistical procedures as well as numerous machine learning models. Should the features fail to follow a normal
-distribution, some model types may not operate at optimal efficiency. This can potentially lead to inaccurate
-predictions.
-
-### Test Mechanism
-
-The application of this test happens across all feature columns within the training dataset. For each feature, the
-Lilliefors test returns a test statistic and p-value. The test statistic quantifies how far the feature's
-distribution is from an ideal normal distribution, whereas the p-value aids in determining the statistical
-relevance of this deviation. The final results are stored within a dictionary, the keys of which correspond to the
-name of the feature column, and the values being another dictionary which houses the test statistic and p-value.
-
-### Signs of High Risk
-
-- If the p-value corresponding to a specific feature sinks below a pre-established significance level, generally
-set at 0.05, then it can be deduced that the distribution of that feature significantly deviates from a normal
-distribution. This can present a high risk for models that assume normality, as these models may perform
-inaccurately or inefficiently in the presence of such a feature.
-
-### Strengths
-
-- One advantage of the Lilliefors test is its utility irrespective of whether the mean and variance of the normal
-distribution are known in advance. This makes it a more robust option in real-world situations where these values
-might not be known.
-- The test has the ability to screen every feature column, offering a holistic view of the dataset.
-
-### Limitations
-
-- Despite the practical applications of the Lilliefors test in validating normality, it does come with some
-limitations.
-- It is only capable of testing unidimensional data, thus rendering it ineffective for datasets with interactions
-between features or multi-dimensional phenomena.
-- The test might not be as sensitive as some other tests (like the Anderson-Darling test) in detecting deviations
-from a normal distribution.
-- Like any other statistical test, the Lilliefors test may also produce false positives or negatives. Hence, banking
-solely on this test, without considering other characteristics of the data, may give rise to risks.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/PredictionProbabilitiesHistogram.md b/site/tests/model_validation/statsmodels/PredictionProbabilitiesHistogram.md
deleted file mode 100644
index 0a877ade30..0000000000
--- a/site/tests/model_validation/statsmodels/PredictionProbabilitiesHistogram.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# PredictionProbabilitiesHistogram
-
-Assesses the predictive probability distribution for binary classification to evaluate model performance and
-potential overfitting or bias.
-
-### Purpose
-
-The Prediction Probabilities Histogram test is designed to generate histograms displaying the Probability of
-Default (PD) predictions for both positive and negative classes in training and testing datasets. This helps in
-evaluating the performance of a classification model.
-
-### Test Mechanism
-
-The metric follows these steps to execute the test:
-- Extracts the target column from both the train and test datasets.
-- Uses the model's predict function to calculate probabilities.
-- Adds these probabilities as a new column to the training and testing dataframes.
-- Generates histograms for each class (0 or 1) within the training and testing datasets.
-- Sets different opacities for the histograms to enhance visualization.
-- Overlays the four histograms (two for training and two for testing) on two different subplot frames.
-- Returns a plotly graph object displaying the visualization.
-
-### Signs of High Risk
-
-- Significant discrepancies between the histograms of training and testing data.
-- Large disparities between the histograms for the positive and negative classes.
-- Potential overfitting or bias indicated by significant issues.
-- Unevenly distributed probabilities suggesting inaccurate model predictions.
-
-### Strengths
-
-- Offers a visual representation of the PD predictions made by the model, aiding in understanding its behavior.
-- Assesses both the training and testing datasets, adding depth to model validation.
-- Highlights disparities between classes, providing insights into class imbalance or data skewness.
-- Effectively visualizes risk spread, which is particularly beneficial for credit risk prediction.
-
-### Limitations
-
-- Specifically tailored for binary classification scenarios and not suited for multi-class classification tasks.
-- Provides a robust visual representation but lacks a quantifiable measure to assess model performance.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/RegressionCoeffs.md b/site/tests/model_validation/statsmodels/RegressionCoeffs.md
deleted file mode 100644
index 64feb1ab21..0000000000
--- a/site/tests/model_validation/statsmodels/RegressionCoeffs.md
+++ /dev/null
@@ -1,44 +0,0 @@
-# RegressionCoeffs
-
-Assesses the significance and uncertainty of predictor variables in a regression model through visualization of
-coefficients and their 95% confidence intervals.
-
-### Purpose
-
-The `RegressionCoeffs` metric visualizes the estimated regression coefficients alongside their 95% confidence intervals,
-providing insights into the impact and significance of predictor variables on the response variable. This visualization
-helps to understand the variability and uncertainty in the model's estimates, aiding in the evaluation of the
-significance of each predictor.
-
-### Test Mechanism
-
-The function operates by extracting the estimated coefficients and their standard errors from the regression model.
-Using these, it calculates the confidence intervals at a 95% confidence level, which indicates the range within which
-the true coefficient value is expected to fall 95% of the time. The confidence intervals are computed using the
-Z-value associated with the 95% confidence level. The coefficients and their confidence intervals are then visualized
-in a bar plot. The x-axis represents the predictor variables, the y-axis represents the estimated coefficients, and
-the error bars depict the confidence intervals.
-
-### Signs of High Risk
-
-- The confidence interval for a coefficient contains the zero value, suggesting that the predictor may not significantly
-contribute to the model.
-- Multiple coefficients with confidence intervals that include zero, potentially indicating issues with model reliability.
-- Very wide confidence intervals, which may suggest high uncertainty in the coefficient estimates and potential model
-instability.
-
-### Strengths
-
-- Provides a clear visualization that allows for easy interpretation of the significance and impact of predictor
-variables.
-- Includes confidence intervals, which provide additional information about the uncertainty surrounding each coefficient
-estimate.
-
-### Limitations
-
-- The method assumes normality of residuals and independence of observations, assumptions that may not always hold true
-in practice.
-- It does not address issues related to multi-collinearity among predictor variables, which can affect the interpretation
-of coefficients.
-- This metric is limited to regression tasks using tabular data and is not applicable to other types of machine learning
-tasks or data structures.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/RegressionFeatureSignificance.md b/site/tests/model_validation/statsmodels/RegressionFeatureSignificance.md
deleted file mode 100644
index 6b82923047..0000000000
--- a/site/tests/model_validation/statsmodels/RegressionFeatureSignificance.md
+++ /dev/null
@@ -1,39 +0,0 @@
-# RegressionFeatureSignificance
-
-Assesses and visualizes the statistical significance of features in a regression model.
-
-### Purpose
-
-The Regression Feature Significance metric assesses the significance of each feature in a given regression
-model. It creates a visualization displaying p-values for every feature of the model, assisting model developers
-in understanding which features are most influential in their model.
-
-### Test Mechanism
-
-The test mechanism involves extracting the model's coefficients and p-values for each feature, and then plotting these
-values. The x-axis on the plot contains the p-values while the y-axis denotes the coefficients of each feature. A
-vertical red line is drawn at the threshold for p-value significance, which is 0.05 by default. Any features with
-p-values to the left of this line are considered statistically significant at the chosen level.
-
-### Signs of High Risk
-
-- Any feature with a high p-value (greater than the threshold) is considered a potential high risk, as it suggests
-the feature is not statistically significant and may not be reliably contributing to the model's predictions.
-- A high number of such features may indicate problems with the model validation, variable selection, and overall
-reliability of the model predictions.
-
-### Strengths
-
-- Helps identify the features that significantly contribute to a model's prediction, providing insights into the
-feature importance.
-- Provides tangible, easy-to-understand visualizations to interpret the feature significance.
-
-### Limitations
-
-- This metric assumes model features are independent, which may not always be the case. Multicollinearity (high
-correlation amongst predictors) can cause high variance and unreliable statistical tests of significance.
-- The p-value strategy for feature selection doesn't take into account the magnitude of the effect, focusing solely
-on whether the feature is likely non-zero.
-- This test is specific to regression models and wouldn't be suitable for other types of ML models.
-- P-value thresholds are somewhat arbitrary and do not always indicate practical significance, only statistical
-significance.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/RegressionModelForecastPlot.md b/site/tests/model_validation/statsmodels/RegressionModelForecastPlot.md
deleted file mode 100644
index d4b6b686ea..0000000000
--- a/site/tests/model_validation/statsmodels/RegressionModelForecastPlot.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# RegressionModelForecastPlot
-
-Generates plots to visually compare the forecasted outcomes of a regression model against actual observed values over
-a specified date range.
-
-### Purpose
-
-This metric is useful for time-series models or any model where the outcome changes over time, allowing direct
-comparison of predicted vs actual values. It can help identify overfitting or underfitting situations as well as
-general model performance.
-
-### Test Mechanism
-
-This test generates a plot with the x-axis representing the date ranging from the specified "start_date" to the
-"end_date", while the y-axis shows the value of the outcome variable. Two lines are plotted: one representing the
-forecasted values and the other representing the observed values. The "start_date" and "end_date" can be parameters
-of this test; if these parameters are not provided, they are set to the minimum and maximum date available in the
-dataset.
-
-### Signs of High Risk
-
-- High risk or failure signs could be deduced visually from the plots if the forecasted line significantly deviates
-from the observed line, indicating the model's predicted values are not matching actual outcomes.
-- A model that struggles to handle the edge conditions like maximum and minimum data points could also be
-considered a sign of risk.
-
-### Strengths
-
-- Visualization: The plot provides an intuitive and clear illustration of how well the forecast matches the actual
-values, making it straightforward even for non-technical stakeholders to interpret.
-- Flexibility: It allows comparison for multiple models and for specified time periods.
-- Model Evaluation: It can be useful in identifying overfitting or underfitting situations, as these will manifest
-as discrepancies between the forecasted and observed values.
-
-### Limitations
-
-- Interpretation Bias: Interpretation of the plot is subjective and can lead to different conclusions by different
-evaluators.
-- Lack of Precision: Visual representation might not provide precise values of the deviation.
-- Inapplicability: Limited to cases where the order of data points (time-series) matters, it might not be of much
-use in problems that are not related to time series prediction.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/RegressionModelForecastPlotLevels.md b/site/tests/model_validation/statsmodels/RegressionModelForecastPlotLevels.md
deleted file mode 100644
index d39e7a7df0..0000000000
--- a/site/tests/model_validation/statsmodels/RegressionModelForecastPlotLevels.md
+++ /dev/null
@@ -1,36 +0,0 @@
-# RegressionModelForecastPlotLevels
-
-Assesses the alignment between forecasted and observed values in regression models through visual plots.
-
-### Purpose
-
-This test aims to visually assess the performance of a regression model by comparing its forecasted values against
-the actual observed values for both the raw and transformed (integrated) data. This helps determine the accuracy
-of the model and can help identify overfitting or underfitting. The integration is applied to highlight the trend
-rather than the absolute level.
-
-### Test Mechanism
-
-This test generates two plots:
-
-- Raw data vs forecast
-- Transformed data vs forecast
-
-The transformed data is created by performing a cumulative sum on the raw data.
-
-### Signs of High Risk
-
-- Significant deviation between forecasted and observed values.
-- Patterns suggesting overfitting or underfitting.
-- Large discrepancies in the plotted forecasts, indicating potential issues with model generalizability and
-precision.
-
-### Strengths
-
-- Provides an intuitive, visual way to assess multiple regression models, aiding in easier interpretation and
-evaluation of forecast accuracy.
-
-### Limitations
-
-- Relies heavily on visual interpretation, which may vary between individuals.
-- Does not provide a numerical metric to quantify forecast accuracy, relying solely on visual assessment.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/RegressionModelSensitivityPlot.md b/site/tests/model_validation/statsmodels/RegressionModelSensitivityPlot.md
deleted file mode 100644
index 11bc5c3262..0000000000
--- a/site/tests/model_validation/statsmodels/RegressionModelSensitivityPlot.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# RegressionModelSensitivityPlot
-
-Assesses the sensitivity of a regression model to changes in independent variables by applying shocks and
-visualizing the impact.
-
-### Purpose
-
-The Regression Sensitivity Plot test is designed to perform sensitivity analysis on regression models. This test
-aims to measure the impact of slight changes (shocks) applied to individual variables on the system's outcome while
-keeping all other variables constant. By doing so, it analyzes the effects of each independent variable on the
-dependent variable within the regression model, helping identify significant risk factors that could substantially
-influence the model's output.
-
-### Test Mechanism
-
-This test operates by initially applying shocks of varying magnitudes, defined by specific parameters, to each of
-the model's features, one at a time. With all other variables held constant, a new prediction is made for each
-dataset subjected to shocks. Any changes in the model's predictions are directly attributed to the shocks applied.
-If the transformation parameter is set to "integrate," initial predictions and target values undergo transformation
-via an integration function before being plotted. Finally, a plot demonstrating observed values against predicted
-values for each model is generated, showcasing a distinct line graph illustrating predictions for each shock.
-
-### Signs of High Risk
-
-- Drastic alterations in model predictions due to minor shocks to an individual variable, indicating high
-sensitivity and potential over-dependence on that variable.
-- Unusually high or unpredictable shifts in response to shocks, suggesting potential model instability or
-overfitting.
-
-### Strengths
-
-- Helps identify variables that strongly influence model outcomes, aiding in understanding feature importance.
-- Generates visual plots, making results easily interpretable even to non-technical stakeholders.
-- Useful in identifying overfitting and detecting unstable models that react excessively to minor variable changes.
-
-### Limitations
-
-- Operates on the assumption that all other variables remain unchanged during the application of a shock, which may
-not reflect real-world interdependencies.
-- Best compatible with linear models and may not effectively evaluate the sensitivity of non-linear models.
-- Provides a visual representation without a numerical risk measure, potentially introducing subjectivity in
-interpretation.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/RegressionModelSummary.md b/site/tests/model_validation/statsmodels/RegressionModelSummary.md
deleted file mode 100644
index 37b6429080..0000000000
--- a/site/tests/model_validation/statsmodels/RegressionModelSummary.md
+++ /dev/null
@@ -1,32 +0,0 @@
-# RegressionModelSummary
-
-Evaluates regression model performance using metrics including R-Squared, Adjusted R-Squared, MSE, and RMSE.
-
-### Purpose
-
-The Regression Model Summary test evaluates the performance of regression models by measuring their predictive
-ability regarding dependent variables given changes in the independent variables. It uses conventional regression
-metrics such as R-Squared, Adjusted R-Squared, Mean Squared Error (MSE), and Root Mean Squared Error (RMSE) to
-assess the model's accuracy and fit.
-
-### Test Mechanism
-
-This test uses the sklearn library to calculate the R-Squared, Adjusted R-Squared, MSE, and RMSE. It outputs a
-table with the results of these metrics along with the feature columns used by the model.
-
-### Signs of High Risk
-
-- Low R-Squared and Adjusted R-Squared values.
-- High MSE and RMSE values.
-
-### Strengths
-
-- Offers an extensive evaluation of regression models by combining four key measures of model accuracy and fit.
-- Provides a comprehensive view of the model's performance.
-- Both the R-Squared and Adjusted R-Squared measures are readily interpretable.
-
-### Limitations
-
-- RMSE and MSE might be sensitive to outliers.
-- A high R-Squared or Adjusted R-Squared may not necessarily indicate a good model, especially in cases of
-overfitting.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/RegressionPermutationFeatureImportance.md b/site/tests/model_validation/statsmodels/RegressionPermutationFeatureImportance.md
deleted file mode 100644
index 3a7d1b7c40..0000000000
--- a/site/tests/model_validation/statsmodels/RegressionPermutationFeatureImportance.md
+++ /dev/null
@@ -1,36 +0,0 @@
-# RegressionPermutationFeatureImportance
-
-Assesses the significance of each feature in a model by evaluating the impact on model performance when feature
-values are randomly rearranged.
-
-### Purpose
-
-The primary purpose of this metric is to determine which features significantly impact the performance of a
-regression model developed using statsmodels. The metric measures how much the prediction accuracy deteriorates
-when each feature's values are permuted.
-
-### Test Mechanism
-
-This metric shuffles the values of each feature one at a time in the dataset, computes the model's performance
-after each permutation, and compares it to the baseline performance. A significant decrease in performance
-indicates the importance of the feature.
-
-### Signs of High Risk
-
-- Significant reliance on a feature that, when permuted, leads to a substantial decrease in performance, suggesting
-overfitting or high model dependency on that feature.
-- Features identified as unimportant despite known impacts from domain knowledge, suggesting potential issues in
-model training or data preprocessing.
-
-### Strengths
-
-- Directly assesses the impact of each feature on model performance, providing clear insights into model
-dependencies.
-- Model-agnostic within the scope of statsmodels, applicable to any regression model that outputs predictions.
-
-### Limitations
-
-- The metric is specific to statsmodels and cannot be used with other types of models without adaptation.
-- It does not capture interactions between features, which can lead to underestimating the importance of correlated
-features.
-- Assumes independence of features when calculating importance, which might not always hold true.
\ No newline at end of file
diff --git a/site/tests/model_validation/statsmodels/ScorecardHistogram.md b/site/tests/model_validation/statsmodels/ScorecardHistogram.md
deleted file mode 100644
index 8519a4573d..0000000000
--- a/site/tests/model_validation/statsmodels/ScorecardHistogram.md
+++ /dev/null
@@ -1,45 +0,0 @@
-# ScorecardHistogram
-
-The Scorecard Histogram test evaluates the distribution of credit scores between default and non-default instances,
-providing critical insights into the performance and generalizability of credit-risk models.
-
-### Purpose
-
-The Scorecard Histogram test metric provides a visual interpretation of the credit scores generated by a machine
-learning model for credit-risk classification tasks. It aims to compare the alignment of the model's scoring
-decisions with the actual outcomes of credit loan applications. It helps in identifying potential discrepancies
-between the model's predictions and real-world risk levels.
-
-### Test Mechanism
-
-This metric uses logistic regression to generate a histogram of credit scores for both default (negative class) and
-non-default (positive class) instances. Using both training and test datasets, the metric calculates the credit
-score of each instance with a scorecard method, considering the impact of different features on the likelihood of
-default. It includes the points to double the odds (PDO) scaling factor and predefined target score and odds settings.
-Histograms for training and test sets are computed and plotted separately to offer insights into the model's
-generalizability to unseen data.
-
-### Signs of High Risk
-
-- Discrepancies between the distributions of training and testing data, indicating a model's poor generalization
-ability
-- Skewed distributions favoring specific scores or classes, representing potential bias
-
-### Strengths
-
-- Provides a visual interpretation of the model's credit scoring system, enhancing comprehension of model behavior
-- Enables a direct comparison between actual and predicted scores for both training and testing data
-- Its intuitive visualization helps understand the model's ability to differentiate between positive and negative
-classes
-- Can unveil patterns or anomalies not easily discerned through numerical metrics alone
-
-### Limitations
-
-- Despite its value for visual interpretation, it doesn't quantify the performance of the model and therefore may
-lack precision for thorough model evaluation
-- The quality of input data can strongly influence the metric, as bias or noise in the data will affect both the
-score calculation and resultant histogram
-- Its specificity to credit scoring models limits its applicability across a wider variety of machine learning
-tasks and models
-- The metric's effectiveness is somewhat tied to the subjective interpretation of the analyst, relying on their
-judgment of the characteristics and implications of the plot.
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/CalibrationCurveDrift.md b/site/tests/ongoing_monitoring/CalibrationCurveDrift.md
deleted file mode 100644
index 3fa615e8df..0000000000
--- a/site/tests/ongoing_monitoring/CalibrationCurveDrift.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# CalibrationCurveDrift
-
-Evaluates changes in probability calibration between reference and monitoring datasets.
-
-### Purpose
-
-The Calibration Curve Drift test is designed to assess changes in the model's probability calibration
-over time. By comparing calibration curves between reference and monitoring datasets, this test helps
-identify whether the model's probability estimates remain reliable in production. This is crucial for
-understanding if the model's risk predictions maintain their intended interpretation and whether
-recalibration might be necessary.
-
-### Test Mechanism
-
-This test proceeds by generating calibration curves for both reference and monitoring datasets. For each
-dataset, it bins the predicted probabilities and calculates the actual fraction of positives within each
-bin. It then compares these values between datasets to identify significant shifts in calibration.
-The test quantifies drift as percentage changes in both mean predicted probabilities and actual fractions
-of positives per bin, providing both visual and numerical assessments of calibration stability.
-
-### Signs of High Risk
-
-- Large differences between reference and monitoring calibration curves
-- Systematic over-estimation or under-estimation in monitoring dataset
-- Significant drift percentages exceeding the threshold in multiple bins
-- Changes in calibration concentrated in specific probability ranges
-- Inconsistent drift patterns across the probability spectrum
-- Empty or sparse bins indicating insufficient data for reliable comparison
-
-### Strengths
-
-- Provides visual and quantitative assessment of calibration changes
-- Identifies specific probability ranges where calibration has shifted
-- Enables early detection of systematic prediction biases
-- Includes detailed bin-by-bin comparison of calibration metrics
-- Handles edge cases with insufficient data in certain bins
-- Supports both binary and probabilistic interpretation of results
-
-### Limitations
-
-- Requires sufficient data in each probability bin for reliable comparison
-- Sensitive to choice of number of bins and binning strategy
-- May not capture complex changes in probability distributions
-- Cannot directly suggest recalibration parameters
-- Limited to assessing probability calibration aspects
-- Results may be affected by class imbalance changes
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/ClassDiscriminationDrift.md b/site/tests/ongoing_monitoring/ClassDiscriminationDrift.md
deleted file mode 100644
index 6a81a93961..0000000000
--- a/site/tests/ongoing_monitoring/ClassDiscriminationDrift.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# ClassDiscriminationDrift
-
-Compares classification discrimination metrics between reference and monitoring datasets.
-
-### Purpose
-
-The Class Discrimination Drift test is designed to evaluate changes in the model's discriminative power
-over time. By comparing key discrimination metrics between reference and monitoring datasets, this test
-helps identify whether the model maintains its ability to separate classes in production. This is crucial
-for understanding if the model's predictive power remains stable and whether its decision boundaries
-continue to effectively distinguish between different classes.
-
-### Test Mechanism
-
-This test proceeds by calculating three key discrimination metrics for both reference and monitoring
-datasets: ROC AUC (Area Under the Curve), GINI coefficient, and KS (Kolmogorov-Smirnov) statistic.
-For binary classification, it computes all three metrics. For multiclass problems, it focuses on
-macro-averaged ROC AUC. The test quantifies drift as percentage changes in these metrics between
-datasets, providing a comprehensive assessment of discrimination stability.
-
-### Signs of High Risk
-
-- Large drifts in discrimination metrics exceeding the threshold
-- Significant drops in ROC AUC indicating reduced ranking ability
-- Decreased GINI coefficients showing diminished separation power
-- Reduced KS statistics suggesting weaker class distinction
-- Inconsistent changes across different metrics
-- Systematic degradation in discriminative performance
-
-### Strengths
-
-- Combines multiple complementary discrimination metrics
-- Handles both binary and multiclass classification
-- Provides clear quantitative drift assessment
-- Enables early detection of model degradation
-- Includes standardized drift threshold evaluation
-- Supports comprehensive performance monitoring
-
-### Limitations
-
-- Does not identify root causes of discrimination drift
-- May be sensitive to changes in class distribution
-- Cannot suggest optimal decision threshold adjustments
-- Limited to discrimination aspects of performance
-- Requires sufficient data for reliable metric calculation
-- May not capture subtle changes in decision boundaries
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/ClassImbalanceDrift.md b/site/tests/ongoing_monitoring/ClassImbalanceDrift.md
deleted file mode 100644
index 9523239d03..0000000000
--- a/site/tests/ongoing_monitoring/ClassImbalanceDrift.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# ClassImbalanceDrift
-
-Evaluates drift in class distribution between reference and monitoring datasets.
-
-### Purpose
-
-The Class Imbalance Drift test is designed to detect changes in the distribution of target classes
-over time. By comparing class proportions between reference and monitoring datasets, this test helps
-identify whether the population structure remains stable in production. This is crucial for
-understanding if the model continues to operate under similar class distribution assumptions and
-whether retraining might be necessary due to significant shifts in class balance.
-
-### Test Mechanism
-
-This test proceeds by calculating class percentages for both reference and monitoring datasets.
-It computes the proportion of each class and quantifies drift as the percentage difference in these
-proportions between datasets. The test provides both visual and numerical comparisons of class
-distributions, with special attention to changes that exceed the specified drift threshold.
-Population stability is assessed on a class-by-class basis.
-
-### Signs of High Risk
-
-- Large shifts in class proportions exceeding the threshold
-- Systematic changes affecting multiple classes
-- Appearance of new classes or disappearance of existing ones
-- Significant changes in minority class representation
-- Reversal of majority-minority class relationships
-- Unexpected changes in class ratios
-
-### Strengths
-
-- Provides clear visualization of distribution changes
-- Identifies specific classes experiencing drift
-- Enables early detection of population shifts
-- Includes standardized drift threshold evaluation
-- Supports both binary and multiclass problems
-- Maintains interpretable percentage-based metrics
-
-### Limitations
-
-- Does not account for feature distribution changes
-- Cannot identify root causes of class drift
-- May be sensitive to small sample sizes
-- Limited to target variable distribution only
-- Requires sufficient samples per class
-- May not capture subtle distribution changes
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/ClassificationAccuracyDrift.md b/site/tests/ongoing_monitoring/ClassificationAccuracyDrift.md
deleted file mode 100644
index a416c5d178..0000000000
--- a/site/tests/ongoing_monitoring/ClassificationAccuracyDrift.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# ClassificationAccuracyDrift
-
-Compares classification accuracy metrics between reference and monitoring datasets.
-
-### Purpose
-
-The Classification Accuracy Drift test is designed to evaluate changes in the model's predictive accuracy
-over time. By comparing key accuracy metrics between reference and monitoring datasets, this test helps
-identify whether the model maintains its performance levels in production. This is crucial for
-understanding if the model's predictions remain reliable and whether its overall effectiveness has
-degraded significantly.
-
-### Test Mechanism
-
-This test proceeds by calculating comprehensive accuracy metrics for both reference and monitoring
-datasets. It computes overall accuracy, per-label precision, recall, and F1 scores, as well as
-macro-averaged metrics. The test quantifies drift as percentage changes in these metrics between
-datasets, providing both granular and aggregate views of accuracy changes. Special attention is paid
-to per-label performance to identify class-specific degradation.
-
-### Signs of High Risk
-
-- Large drifts in accuracy metrics exceeding the threshold
-- Inconsistent changes across different labels
-- Significant drops in macro-averaged metrics
-- Systematic degradation in specific class performance
-- Unexpected improvements suggesting data quality issues
-- Divergent trends between precision and recall
-
-### Strengths
-
-- Provides comprehensive accuracy assessment
-- Identifies class-specific performance changes
-- Enables early detection of model degradation
-- Includes both per-label and macro-averaged perspectives
-- Supports multi-class classification evaluation
-- Maintains interpretable drift thresholds
-
-### Limitations
-
-- May be sensitive to class distribution changes
-- Does not account for prediction confidence
-- Cannot identify root causes of accuracy drift
-- Limited to accuracy-based metrics only
-- Requires sufficient samples per class
-- May not capture subtle performance changes
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/ConfusionMatrixDrift.md b/site/tests/ongoing_monitoring/ConfusionMatrixDrift.md
deleted file mode 100644
index cc38f3e5d1..0000000000
--- a/site/tests/ongoing_monitoring/ConfusionMatrixDrift.md
+++ /dev/null
@@ -1,46 +0,0 @@
-# ConfusionMatrixDrift
-
-Compares confusion matrix metrics between reference and monitoring datasets.
-
-### Purpose
-
-The Confusion Matrix Drift test is designed to evaluate changes in the model's error patterns
-over time. By comparing confusion matrix elements between reference and monitoring datasets, this
-test helps identify whether the model maintains consistent prediction behavior in production. This
-is crucial for understanding if the model's error patterns have shifted and whether specific types
-of misclassifications have become more prevalent.
-
-### Test Mechanism
-
-This test proceeds by generating confusion matrices for both reference and monitoring datasets.
-For binary classification, it tracks True Positives, True Negatives, False Positives, and False
-Negatives as percentages of total predictions. For multiclass problems, it analyzes per-class
-metrics including true positives and error rates. The test quantifies drift as percentage changes
-in these metrics between datasets, providing detailed insight into shifting prediction patterns.
-
-### Signs of High Risk
-
-- Large drifts in confusion matrix elements exceeding threshold
-- Systematic changes in false positive or false negative rates
-- Inconsistent changes across different classes
-- Significant shifts in error patterns for specific classes
-- Unexpected improvements in certain metrics
-- Divergent trends between different types of errors
-
-### Strengths
-
-- Provides detailed analysis of prediction behavior
-- Identifies specific types of prediction changes
-- Enables early detection of systematic errors
-- Includes comprehensive error pattern analysis
-- Supports both binary and multiclass problems
-- Maintains interpretable percentage-based metrics
-
-### Limitations
-
-- May be sensitive to class distribution changes
-- Cannot identify root causes of prediction drift
-- Requires sufficient samples for reliable comparison
-- Limited to hard predictions (not probabilities)
-- May not capture subtle changes in decision boundaries
-- Complex interpretation for multiclass problems
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/CumulativePredictionProbabilitiesDrift.md b/site/tests/ongoing_monitoring/CumulativePredictionProbabilitiesDrift.md
deleted file mode 100644
index 415bb204cf..0000000000
--- a/site/tests/ongoing_monitoring/CumulativePredictionProbabilitiesDrift.md
+++ /dev/null
@@ -1,47 +0,0 @@
-# CumulativePredictionProbabilitiesDrift
-
-Compares cumulative prediction probability distributions between reference and monitoring datasets.
-
-### Purpose
-
-The Cumulative Prediction Probabilities Drift test is designed to evaluate changes in the model's
-probability predictions over time. By comparing cumulative distribution functions of predicted
-probabilities between reference and monitoring datasets, this test helps identify whether the
-model's probability assignments remain stable in production. This is crucial for understanding if
-the model's risk assessment behavior has shifted and whether its probability calibration remains
-consistent.
-
-### Test Mechanism
-
-This test proceeds by generating cumulative distribution functions (CDFs) of predicted probabilities
-for both reference and monitoring datasets. For each class, it plots the cumulative proportion of
-predictions against probability values, enabling direct comparison of probability distributions.
-The test visualizes both the CDFs and their differences, providing insight into how probability
-assignments have shifted across the entire probability range.
-
-### Signs of High Risk
-
-- Large gaps between reference and monitoring CDFs
-- Systematic shifts in probability assignments
-- Concentration of differences in specific probability ranges
-- Changes in the shape of probability distributions
-- Unexpected patterns in cumulative differences
-- Significant shifts in probability thresholds
-
-### Strengths
-
-- Provides comprehensive view of probability changes
-- Identifies specific probability ranges with drift
-- Enables visualization of distribution differences
-- Supports analysis across multiple classes
-- Maintains interpretable probability scale
-- Captures subtle changes in probability assignments
-
-### Limitations
-
-- Does not provide single drift metric
-- May be complex to interpret for multiple classes
-- Cannot suggest probability recalibration
-- Requires visual inspection for assessment
-- Sensitive to sample size differences
-- May not capture class-specific calibration issues
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/FeatureDrift.md b/site/tests/ongoing_monitoring/FeatureDrift.md
deleted file mode 100644
index fb066b8326..0000000000
--- a/site/tests/ongoing_monitoring/FeatureDrift.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# FeatureDrift
-
-Evaluates changes in feature distribution over time to identify potential model drift.
-
-### Purpose
-
-The Feature Drift test aims to evaluate how much the distribution of features has shifted over time between two
-datasets, typically training and monitoring datasets. It uses the Population Stability Index (PSI) to quantify this
-change, providing insights into the model’s robustness and the necessity for retraining or feature engineering.
-
-### Test Mechanism
-
-This test calculates the PSI by:
-
-- Bucketing the distributions of each feature in both datasets.
-- Comparing the percentage of observations in each bucket between the two datasets.
-- Aggregating the differences across all buckets for each feature to produce the PSI score for that feature.
-
-The PSI score is interpreted as:
-
-- PSI < 0.1: No significant population change.
-- 0.1 <= PSI < 0.2: Moderate population change.
-- PSI >= 0.2: Significant population change.
-
-### Signs of High Risk
-
-- PSI >= 0.2 for any feature, indicating a significant distribution shift.
-- Consistently high PSI scores across multiple features.
-- Sudden spikes in PSI in recent monitoring data compared to historical data.
-
-### Strengths
-
-- Provides a quantitative measure of feature distribution changes.
-- Easily interpretable thresholds for decision-making.
-- Helps in early detection of data drift, prompting timely interventions.
-
-### Limitations
-
-- May not capture subtle or intricate changes in the data distribution.
-- Assumes that bucket thresholds (quantiles) adequately represent distribution shifts.
-- PSI score interpretation can be overly simplistic for complex datasets.
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/PredictionAcrossEachFeature.md b/site/tests/ongoing_monitoring/PredictionAcrossEachFeature.md
deleted file mode 100644
index a13f9551ff..0000000000
--- a/site/tests/ongoing_monitoring/PredictionAcrossEachFeature.md
+++ /dev/null
@@ -1,33 +0,0 @@
-# PredictionAcrossEachFeature
-
-Assesses differences in model predictions across individual features between reference and monitoring datasets
-through visual analysis.
-
-### Purpose
-
-The Prediction Across Each Feature test aims to visually compare model predictions for each feature between
-reference (training) and monitoring (production) datasets. It helps identify significant differences in prediction
-patterns for further investigation and ensures the model's consistency and stability over time.
-
-### Test Mechanism
-
-The test generates scatter plots for each feature, comparing prediction probabilities between the reference and
-monitoring datasets. Each plot consists of two subplots: one for reference data and one for monitoring data,
-enabling visual comparison of the model's predictive behavior.
-
-### Signs of High Risk
-
-- Significant discrepancies between the reference and monitoring subplots for the same feature.
-- Unexpected patterns or trends in monitoring data that were absent in reference data.
-
-### Strengths
-
-- Provides a clear visual representation of model performance across different features.
-- Facilitates easy identification of features where the model's predictions have diverged.
-- Enables quick detection of potential model performance issues in production.
-
-### Limitations
-
-- Interpretation of scatter plots can be subjective and may require expertise.
-- Visualizations do not provide quantitative metrics for objective evaluation.
-- May not capture all types of distribution changes or issues with the model's predictions.
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/PredictionCorrelation.md b/site/tests/ongoing_monitoring/PredictionCorrelation.md
deleted file mode 100644
index 46ea852942..0000000000
--- a/site/tests/ongoing_monitoring/PredictionCorrelation.md
+++ /dev/null
@@ -1,34 +0,0 @@
-# PredictionCorrelation
-
-Assesses correlation changes between model predictions from reference and monitoring datasets to detect potential
-target drift.
-
-### Purpose
-
-To evaluate the changes in correlation pairs between model predictions and features from reference and monitoring
-datasets. This helps in identifying significant shifts that may indicate target drift, potentially affecting model
-performance.
-
-### Test Mechanism
-
-This test calculates the correlation of each feature with model predictions for both reference and monitoring
-datasets. It then compares these correlations side-by-side using a bar plot and a correlation table. Significant
-changes in correlation pairs are highlighted to signal possible model drift.
-
-### Signs of High Risk
-
-- Significant changes in correlation pairs between the reference and monitoring predictions.
-- Notable differences in correlation values, indicating a possible shift in the relationship between features and
-the target variable.
-
-### Strengths
-
-- Provides visual identification of drift in feature relationships with model predictions.
-- Clear bar plot comparison aids in understanding model stability over time.
-- Enables early detection of target drift, facilitating timely interventions.
-
-### Limitations
-
-- Requires substantial reference and monitoring data for accurate comparison.
-- Correlation does not imply causation; other factors may influence changes.
-- Focuses solely on linear relationships, potentially missing non-linear interactions.
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/PredictionProbabilitiesHistogramDrift.md b/site/tests/ongoing_monitoring/PredictionProbabilitiesHistogramDrift.md
deleted file mode 100644
index 21c585141b..0000000000
--- a/site/tests/ongoing_monitoring/PredictionProbabilitiesHistogramDrift.md
+++ /dev/null
@@ -1,47 +0,0 @@
-# PredictionProbabilitiesHistogramDrift
-
-Compares prediction probability distributions between reference and monitoring datasets.
-
-### Purpose
-
-The Prediction Probabilities Histogram Drift test is designed to evaluate changes in the model's
-probability predictions over time. By comparing probability distributions between reference and
-monitoring datasets using histograms, this test helps identify whether the model's probability
-assignments have shifted in production. This is crucial for understanding if the model's risk
-assessment behavior remains consistent and whether its probability estimates maintain their
-original distribution patterns.
-
-### Test Mechanism
-
-This test proceeds by generating histograms of prediction probabilities for both reference and
-monitoring datasets. For each class, it analyzes the distribution shape, central tendency, and
-spread of probabilities. The test computes distribution moments (mean, variance, skewness,
-kurtosis) and quantifies their drift between datasets. Visual comparison of overlaid histograms
-provides immediate insight into distribution changes.
-
-### Signs of High Risk
-
-- Significant shifts in probability distribution shapes
-- Large drifts in distribution moments exceeding threshold
-- Appearance of new modes or peaks in monitoring data
-- Changes in the spread or concentration of probabilities
-- Systematic shifts in probability assignments
-- Unexpected changes in distribution characteristics
-
-### Strengths
-
-- Provides intuitive visualization of probability changes
-- Identifies specific changes in distribution shape
-- Enables quantitative assessment of distribution drift
-- Supports analysis across multiple classes
-- Includes comprehensive moment analysis
-- Maintains interpretable probability scale
-
-### Limitations
-
-- May be sensitive to binning choices
-- Requires sufficient samples for reliable histograms
-- Cannot suggest probability recalibration
-- Complex interpretation for multiple classes
-- May not capture subtle distribution changes
-- Limited to univariate probability analysis
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/PredictionQuantilesAcrossFeatures.md b/site/tests/ongoing_monitoring/PredictionQuantilesAcrossFeatures.md
deleted file mode 100644
index 36bd5ff060..0000000000
--- a/site/tests/ongoing_monitoring/PredictionQuantilesAcrossFeatures.md
+++ /dev/null
@@ -1,34 +0,0 @@
-# PredictionQuantilesAcrossFeatures
-
-Assesses differences in model prediction distributions across individual features between reference
-and monitoring datasets through quantile analysis.
-
-### Purpose
-
-This test aims to visualize how prediction distributions vary across feature values by showing
-quantile information between reference and monitoring datasets. It helps identify significant
-shifts in prediction patterns and potential areas of model instability.
-
-### Test Mechanism
-
-The test generates box plots for each feature, comparing prediction probability distributions
-between the reference and monitoring datasets. Each plot consists of two subplots showing the
-quantile distribution of predictions: one for reference data and one for monitoring data.
-
-### Signs of High Risk
-
-- Significant differences in prediction distributions between reference and monitoring data
-- Unexpected shifts in prediction quantiles across feature values
-- Large changes in prediction variability between datasets
-
-### Strengths
-
-- Provides clear visualization of prediction distribution changes
-- Shows outliers and variability in predictions across features
-- Enables quick identification of problematic feature ranges
-
-### Limitations
-
-- May not capture complex relationships between features and predictions
-- Quantile analysis may smooth over important individual predictions
-- Requires careful interpretation of distribution changes
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/ROCCurveDrift.md b/site/tests/ongoing_monitoring/ROCCurveDrift.md
deleted file mode 100644
index 8c556f72b6..0000000000
--- a/site/tests/ongoing_monitoring/ROCCurveDrift.md
+++ /dev/null
@@ -1,47 +0,0 @@
-# ROCCurveDrift
-
-Compares ROC curves between reference and monitoring datasets.
-
-### Purpose
-
-The ROC Curve Drift test is designed to evaluate changes in the model's discriminative ability
-over time. By comparing Receiver Operating Characteristic (ROC) curves between reference and
-monitoring datasets, this test helps identify whether the model maintains its ability to
-distinguish between classes across different decision thresholds. This is crucial for
-understanding if the model's trade-off between sensitivity and specificity remains stable
-in production.
-
-### Test Mechanism
-
-This test proceeds by generating ROC curves for both reference and monitoring datasets. For each
-dataset, it plots the True Positive Rate against the False Positive Rate across all possible
-classification thresholds. The test also computes AUC scores and visualizes the difference
-between ROC curves, providing both graphical and numerical assessments of discrimination
-stability. Special attention is paid to regions where curves diverge significantly.
-
-### Signs of High Risk
-
-- Large differences between reference and monitoring ROC curves
-- Significant drop in AUC score for monitoring dataset
-- Systematic differences in specific FPR regions
-- Changes in optimal operating points
-- Inconsistent performance across different thresholds
-- Unexpected crossovers between curves
-
-### Strengths
-
-- Provides comprehensive view of discriminative ability
-- Identifies specific threshold ranges with drift
-- Enables visualization of performance differences
-- Includes AUC comparison for overall assessment
-- Supports threshold-independent evaluation
-- Maintains interpretable performance metrics
-
-### Limitations
-
-- Limited to binary classification problems
-- May be sensitive to class distribution changes
-- Cannot suggest optimal threshold adjustments
-- Requires visual inspection for detailed analysis
-- Complex interpretation of curve differences
-- May not capture subtle performance changes
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/ScoreBandsDrift.md b/site/tests/ongoing_monitoring/ScoreBandsDrift.md
deleted file mode 100644
index 3f25439f8d..0000000000
--- a/site/tests/ongoing_monitoring/ScoreBandsDrift.md
+++ /dev/null
@@ -1,48 +0,0 @@
-# ScoreBandsDrift
-
-Analyzes drift in population distribution and default rates across score bands.
-
-### Purpose
-
-The Score Bands Drift test is designed to evaluate changes in score-based risk segmentation
-over time. By comparing population distribution and default rates across score bands between
-reference and monitoring datasets, this test helps identify whether the model's risk
-stratification remains stable in production. This is crucial for understanding if the model's
-scoring behavior maintains its intended risk separation and whether specific score ranges
-have experienced significant shifts.
-
-### Test Mechanism
-
-This test proceeds by segmenting scores into predefined bands and analyzing three key metrics
-across these bands: population distribution, predicted default rates, and observed default
-rates. For each band, it computes these metrics for both reference and monitoring datasets
-and quantifies drift as percentage changes. The test provides both detailed band-by-band
-comparisons and overall stability assessment, with special attention to bands showing
-significant drift.
-
-### Signs of High Risk
-
-- Large shifts in population distribution across bands
-- Significant changes in default rates within bands
-- Inconsistent drift patterns between adjacent bands
-- Divergence between predicted and observed rates
-- Systematic shifts in risk concentration
-- Empty or sparse score bands in monitoring data
-
-### Strengths
-
-- Provides comprehensive view of score-based drift
-- Identifies specific score ranges with instability
-- Enables comparison of multiple risk metrics
-- Includes both distribution and performance drift
-- Supports business-relevant score segmentation
-- Maintains interpretable drift thresholds
-
-### Limitations
-
-- Sensitive to choice of score band boundaries
-- Requires sufficient samples in each band
-- Cannot suggest optimal band adjustments
-- May not capture within-band distribution changes
-- Limited to predefined scoring metrics
-- Complex interpretation with multiple drift signals
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/ScorecardHistogramDrift.md b/site/tests/ongoing_monitoring/ScorecardHistogramDrift.md
deleted file mode 100644
index 95522724d1..0000000000
--- a/site/tests/ongoing_monitoring/ScorecardHistogramDrift.md
+++ /dev/null
@@ -1,47 +0,0 @@
-# ScorecardHistogramDrift
-
-Compares score distributions between reference and monitoring datasets for each class.
-
-### Purpose
-
-The Scorecard Histogram Drift test is designed to evaluate changes in the model's scoring
-patterns over time. By comparing score distributions between reference and monitoring datasets
-for each class, this test helps identify whether the model's scoring behavior remains stable
-in production. This is crucial for understanding if the model's risk assessment maintains
-consistent patterns and whether specific score ranges have experienced significant shifts
-in their distribution.
-
-### Test Mechanism
-
-This test proceeds by generating histograms of scores for each class in both reference and
-monitoring datasets. It analyzes distribution characteristics through multiple statistical
-moments: mean, variance, skewness, and kurtosis. The test quantifies drift as percentage
-changes in these moments between datasets, providing both visual and numerical assessments
-of distribution stability. Special attention is paid to class-specific distribution changes.
-
-### Signs of High Risk
-
-- Significant shifts in score distribution shapes
-- Large drifts in distribution moments exceeding threshold
-- Changes in the relative positioning of class distributions
-- Appearance of new modes or peaks in monitoring data
-- Unexpected changes in score spread or concentration
-- Systematic shifts in class-specific scoring patterns
-
-### Strengths
-
-- Provides class-specific distribution analysis
-- Identifies detailed changes in scoring patterns
-- Enables visual comparison of distributions
-- Includes comprehensive moment analysis
-- Supports multiple class evaluation
-- Maintains interpretable score scale
-
-### Limitations
-
-- Sensitive to binning choices in visualization
-- Requires sufficient samples per class
-- Cannot suggest score adjustments
-- May not capture subtle distribution changes
-- Complex interpretation with multiple classes
-- Limited to univariate score analysis
\ No newline at end of file
diff --git a/site/tests/ongoing_monitoring/TargetPredictionDistributionPlot.md b/site/tests/ongoing_monitoring/TargetPredictionDistributionPlot.md
deleted file mode 100644
index d05e1e7be4..0000000000
--- a/site/tests/ongoing_monitoring/TargetPredictionDistributionPlot.md
+++ /dev/null
@@ -1,33 +0,0 @@
-# TargetPredictionDistributionPlot
-
-Assesses differences in prediction distributions between a reference dataset and a monitoring dataset to identify
-potential data drift.
-
-### Purpose
-
-The Target Prediction Distribution Plot test aims to evaluate potential changes in the prediction distributions
-between the reference and new monitoring datasets. It seeks to identify underlying shifts in data characteristics
-that warrant further investigation.
-
-### Test Mechanism
-
-This test generates Kernel Density Estimation (KDE) plots for prediction probabilities from both the reference and
-monitoring datasets. By visually comparing the KDE plots, it assesses significant differences in the prediction
-distributions between the two datasets.
-
-### Signs of High Risk
-
-- Significant divergence between the distribution curves of reference and monitoring predictions.
-- Unusual shifts or bimodal distribution in the monitoring predictions compared to the reference predictions.
-
-### Strengths
-
-- Visual representation makes it easy to spot differences in prediction distributions.
-- Useful for identifying potential data drift or changes in underlying data characteristics.
-- Simple and efficient to implement using standard plotting libraries.
-
-### Limitations
-
-- Subjective interpretation of the visual plots.
-- Might not pinpoint the exact cause of distribution changes.
-- Less effective if the differences in distributions are subtle and not easily visible.
\ No newline at end of file
diff --git a/site/tests/plots/BoxPlot.md b/site/tests/plots/BoxPlot.md
deleted file mode 100644
index 6fe6449114..0000000000
--- a/site/tests/plots/BoxPlot.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# BoxPlot
-
-Generates customizable box plots for numerical features in a dataset with optional grouping using Plotly.
-
-### Purpose
-
-This test provides a flexible way to visualize the distribution of numerical features
-through interactive box plots, with optional grouping by categorical variables. Box plots are
-effective for identifying outliers, comparing distributions across groups, and
-understanding the spread and central tendency of the data.
-
-### Test Mechanism
-
-The test creates interactive box plots for specified numerical columns (or all numerical columns
-if none specified). It supports various customization options including:
-- Grouping by categorical variables
-- Customizable colors and styling
-- Outlier display options
-- Interactive hover information
-- Zoom and pan capabilities
-
-### Signs of High Risk
-
-- Presence of many outliers indicating data quality issues
-- Highly skewed distributions
-- Large differences in variance across groups
-- Unexpected patterns in grouped data
-
-### Strengths
-
-- Clear visualization of distribution statistics (median, quartiles, outliers)
-- Interactive Plotly plots with hover information and zoom capabilities
-- Effective for comparing distributions across groups
-- Handles missing values appropriately
-- Highly customizable appearance
-
-### Limitations
-
-- Limited to numerical features only
-- May not be suitable for continuous variables with many unique values
-- Visual interpretation may be subjective
-- Less effective with very large datasets
\ No newline at end of file
diff --git a/site/tests/plots/CorrelationHeatmap.md b/site/tests/plots/CorrelationHeatmap.md
deleted file mode 100644
index dda05391f7..0000000000
--- a/site/tests/plots/CorrelationHeatmap.md
+++ /dev/null
@@ -1,44 +0,0 @@
-# CorrelationHeatmap
-
-Generates customizable correlation heatmap plots for numerical features in a dataset using Plotly.
-
-### Purpose
-
-This test provides a flexible way to visualize correlations between numerical features
-in a dataset using interactive Plotly heatmaps. It supports different correlation methods
-and extensive customization options for the heatmap appearance, making it suitable for
-exploring feature relationships in data analysis.
-
-### Test Mechanism
-
-The test computes correlation coefficients between specified numerical columns
-(or all numerical columns if none specified) using the specified method.
-It then creates an interactive heatmap visualization with customizable appearance options including:
-- Different correlation methods (pearson, spearman, kendall)
-- Color schemes and annotations
-- Masking options for upper triangle
-- Threshold filtering for significant correlations
-- Interactive hover information
-
-### Signs of High Risk
-
-- Very high correlations (>0.9) between features indicating multicollinearity
-- Unexpected correlation patterns that contradict domain knowledge
-- Features with no correlation to any other variables
-- Strong correlations with the target variable that might indicate data leakage
-
-### Strengths
-
-- Supports multiple correlation methods
-- Interactive Plotly plots with hover information and zoom capabilities
-- Highly customizable visualization options
-- Can handle missing values appropriately
-- Provides clear visual representation of feature relationships
-- Optional thresholding to focus on significant correlations
-
-### Limitations
-
-- Limited to numerical features only
-- Cannot capture non-linear relationships effectively
-- May be difficult to interpret with many features
-- Correlation does not imply causation
\ No newline at end of file
diff --git a/site/tests/plots/HistogramPlot.md b/site/tests/plots/HistogramPlot.md
deleted file mode 100644
index 18c3d9e2dd..0000000000
--- a/site/tests/plots/HistogramPlot.md
+++ /dev/null
@@ -1,43 +0,0 @@
-# HistogramPlot
-
-Generates customizable histogram plots for numerical features in a dataset using Plotly.
-
-### Purpose
-
-This test provides a flexible way to visualize the distribution of numerical features in a dataset.
-It allows for extensive customization of the histogram appearance and behavior through parameters,
-making it suitable for various exploratory data analysis tasks.
-
-### Test Mechanism
-
-The test creates histogram plots for specified numerical columns (or all numerical columns if none specified).
-It supports various customization options including:
-- Number of bins or bin edges
-- Color and opacity
-- Kernel density estimation overlay
-- Logarithmic scaling
-- Normalization options
-- Configurable subplot layout (columns and spacing)
-
-### Signs of High Risk
-
-- Highly skewed distributions that may indicate data quality issues
-- Unexpected bimodal or multimodal distributions
-- Presence of extreme outliers
-- Empty or sparse distributions
-
-### Strengths
-
-- Highly customizable visualization options
-- Interactive Plotly plots with zoom, pan, and hover capabilities
-- Supports both single and multiple column analysis
-- Provides insights into data distribution patterns
-- Can handle different data types and scales
-- Configurable subplot layout for better visualization
-
-### Limitations
-
-- Limited to numerical features only
-- Visual interpretation may be subjective
-- May not be suitable for high-dimensional datasets
-- Performance may degrade with very large datasets
\ No newline at end of file
diff --git a/site/tests/plots/ViolinPlot.md b/site/tests/plots/ViolinPlot.md
deleted file mode 100644
index 55dc4f4f8b..0000000000
--- a/site/tests/plots/ViolinPlot.md
+++ /dev/null
@@ -1,36 +0,0 @@
-# ViolinPlot
-
-Generates interactive violin plots for numerical features using Plotly.
-
-### Purpose
-
-This test creates violin plots to visualize the distribution of numerical features,
-showing both the probability density and summary statistics. Violin plots combine
-aspects of box plots and kernel density estimation for rich distribution visualization.
-
-### Test Mechanism
-
-The test creates violin plots for specified numerical columns, with optional
-grouping by categorical variables. Each violin shows the distribution shape,
-quartiles, and median values.
-
-### Signs of High Risk
-
-- Multimodal distributions that might indicate mixed populations
-- Highly skewed distributions suggesting data quality issues
-- Large differences in distribution shapes across groups
-- Unusual distribution patterns that contradict domain expectations
-
-### Strengths
-
-- Shows detailed distribution shape information
-- Interactive Plotly visualization with hover details
-- Effective for comparing distributions across groups
-- Combines density estimation with quartile information
-
-### Limitations
-
-- Limited to numerical features only
-- Requires sufficient data points for meaningful density estimation
-- May not be suitable for discrete variables
-- Can be misleading with very small sample sizes
\ No newline at end of file
diff --git a/site/tests/prompt_validation/Bias.md b/site/tests/prompt_validation/Bias.md
deleted file mode 100644
index 044c9c292a..0000000000
--- a/site/tests/prompt_validation/Bias.md
+++ /dev/null
@@ -1,48 +0,0 @@
-# Bias
-
-Assesses potential bias in a Large Language Model by analyzing the distribution and order of exemplars in the
-prompt.
-
-### Purpose
-
-The Bias Evaluation test calculates if and how the order and distribution of exemplars (examples) in a few-shot
-learning prompt affect the output of a Large Language Model (LLM). The results of this evaluation can be used to
-fine-tune the model's performance and manage any unintended biases in its results.
-
-### Test Mechanism
-
-This test uses two checks:
-
-1. **Distribution of Exemplars:** The number of positive vs. negative examples in a prompt is varied. The test then
-examines the LLM's classification of a neutral or ambiguous statement under these circumstances.
-2. **Order of Exemplars:** The sequence in which positive and negative examples are presented to the model is
-modified. Their resultant effect on the LLM's response is studied.
-
-For each test case, the LLM grades the input prompt on a scale of 1 to 10. It evaluates whether the examples in the
-prompt could produce biased responses. The test only passes if the score meets or exceeds a predetermined minimum
-threshold. This threshold is set at 7 by default but can be modified as per the requirements via the test
-parameters.
-
-### Signs of High Risk
-
-- A skewed result favoring either positive or negative responses may suggest potential bias in the model. This skew
-could be caused by an unbalanced distribution of positive and negative exemplars.
-- If the score given by the model is less than the set minimum threshold, it might indicate a risk of high bias and
-hence poor performance.
-
-### Strengths
-
-- This test provides a quantitative measure of potential bias, offering clear guidelines for developers about
-whether their Large Language Model (LLM) contains significant bias.
-- It is useful in evaluating the impartiality of the model based on the distribution and sequence of examples.
-- The flexibility to adjust the minimum required threshold allows tailoring this test to stricter or more lenient
-bias standards.
-
-### Limitations
-
-- The test may not pick up on more subtle forms of bias or biases that are not directly related to the distribution
-or order of exemplars.
-- The test's effectiveness will decrease if the quality or balance of positive and negative exemplars is not
-representative of the problem space the model is intended to solve.
-- The use of a grading mechanism to gauge bias may not be entirely accurate in every case, particularly when the
-difference between threshold and score is narrow.
\ No newline at end of file
diff --git a/site/tests/prompt_validation/Clarity.md b/site/tests/prompt_validation/Clarity.md
deleted file mode 100644
index dbd1cc7213..0000000000
--- a/site/tests/prompt_validation/Clarity.md
+++ /dev/null
@@ -1,36 +0,0 @@
-# Clarity
-
-Evaluates and scores the clarity of prompts in a Large Language Model based on specified guidelines.
-
-### Purpose
-
-The Clarity evaluation metric is used to assess how clear the prompts of a Large Language Model (LLM) are. This
-assessment is particularly important because clear prompts assist the LLM in more accurately interpreting and
-responding to instructions.
-
-### Test Mechanism
-
-The evaluation uses an LLM to scrutinize the clarity of prompts, factoring in considerations such as the inclusion
-of relevant details, persona adoption, step-by-step instructions, usage of examples, and specification of desired
-output length. Each prompt is rated on a clarity scale of 1 to 10, and any prompt scoring at or above the preset
-threshold (default of 7) will be marked as clear. It is important to note that this threshold can be adjusted via
-test parameters, providing flexibility in the evaluation process.
-
-### Signs of High Risk
-
-- Prompts that consistently score below the clarity threshold
-- Repeated failure of prompts to adhere to guidelines for clarity, including detail inclusion, persona adoption,
-explicit step-by-step instructions, use of examples, and specification of output length
-
-### Strengths
-
-- Encourages the development of more effective prompts that aid the LLM in interpreting instructions accurately
-- Applies a quantifiable measure (a score from 1 to 10) to evaluate the clarity of prompts
-- Threshold for clarity is adjustable, allowing for flexible evaluation depending on the context
-
-### Limitations
-
-- Scoring system is subjective and relies on the AI’s interpretation of 'clarity
-- The test assumes that all required factors (detail inclusion, persona adoption, step-by-step instructions, use of
-examples, and specification of output length) contribute equally to clarity, which might not always be the case
-- The evaluation may not be as effective if used on non-textual models
\ No newline at end of file
diff --git a/site/tests/prompt_validation/Conciseness.md b/site/tests/prompt_validation/Conciseness.md
deleted file mode 100644
index 7855a3b6b8..0000000000
--- a/site/tests/prompt_validation/Conciseness.md
+++ /dev/null
@@ -1,36 +0,0 @@
-# Conciseness
-
-Analyzes and grades the conciseness of prompts provided to a Large Language Model.
-
-### Purpose
-
-The Conciseness Assessment is designed to evaluate the brevity and succinctness of prompts provided to a Language
-Learning Model (LLM). A concise prompt strikes a balance between offering clear instructions and eliminating
-redundant or unnecessary information, ensuring that the LLM receives relevant input without being overwhelmed.
-
-### Test Mechanism
-
-Using an LLM, this test conducts a conciseness analysis on input prompts. The analysis grades the prompt on a scale
-from 1 to 10, where the grade reflects how well the prompt delivers clear instructions without being verbose.
-Prompts that score equal to or above a predefined threshold (default set to 7) are deemed successfully concise.
-This threshold can be adjusted to meet specific requirements.
-
-### Signs of High Risk
-
-- Prompts that consistently score below the predefined threshold.
-- Prompts that are overly wordy or contain unnecessary information.
-- Prompts that create confusion or ambiguity due to excess or unnecessary information.
-
-### Strengths
-
-- Ensures clarity and effectiveness of the prompts.
-- Promotes brevity and preciseness in prompts without sacrificing essential information.
-- Useful for models like LLMs, where input prompt length and clarity greatly influence model performance.
-- Provides a quantifiable measure of prompt conciseness.
-
-### Limitations
-
-- The conciseness score is based on an AI's assessment, which might not fully capture human interpretation of
-conciseness.
-- The predefined threshold for conciseness could be subjective and might need adjustment based on application.
-- The test is dependent on the LLM’s understanding of conciseness, which might vary from model to model.
\ No newline at end of file
diff --git a/site/tests/prompt_validation/Delimitation.md b/site/tests/prompt_validation/Delimitation.md
deleted file mode 100644
index 13ab537236..0000000000
--- a/site/tests/prompt_validation/Delimitation.md
+++ /dev/null
@@ -1,37 +0,0 @@
-# Delimitation
-
-Evaluates the proper use of delimiters in prompts provided to Large Language Models.
-
-### Purpose
-
-The Delimitation Test aims to assess whether prompts provided to the Language Learning Model (LLM) correctly use
-delimiters to mark different sections of the input. Well-delimited prompts help simplify the interpretation process
-for the LLM, ensuring that the responses are precise and accurate.
-
-### Test Mechanism
-
-The test employs an LLM to examine prompts for appropriate use of delimiters such as triple quotation marks, XML
-tags, and section titles. Each prompt is assigned a score from 1 to 10 based on its delimitation integrity. Prompts
-with scores equal to or above the preset threshold (which is 7 by default, although it can be adjusted as
-necessary) pass the test.
-
-### Signs of High Risk
-
-- Prompts missing, improperly placed, or incorrectly used delimiters, leading to misinterpretation by the LLM.
-- High-risk scenarios with complex prompts involving multiple tasks or diverse data where correct delimitation is
-crucial.
-- Scores below the threshold, indicating a high risk.
-
-### Strengths
-
-- Ensures clarity in demarcating different components of given prompts.
-- Reduces ambiguity in understanding prompts, especially for complex tasks.
-- Provides a quantified insight into the appropriateness of delimiter usage, aiding continuous improvement.
-
-### Limitations
-
-- Only checks for the presence and placement of delimiters, not whether the correct delimiter type is used for the
-specific data or task.
-- May not fully reveal the impacts of poor delimitation on the LLM's final performance.
-- The preset score threshold may not be refined enough for complex tasks and prompts, requiring regular manual
-adjustment.
\ No newline at end of file
diff --git a/site/tests/prompt_validation/NegativeInstruction.md b/site/tests/prompt_validation/NegativeInstruction.md
deleted file mode 100644
index aec6b56e04..0000000000
--- a/site/tests/prompt_validation/NegativeInstruction.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# NegativeInstruction
-
-Evaluates and grades the use of affirmative, proactive language over negative instructions in LLM prompts.
-
-### Purpose
-
-The Negative Instruction test is utilized to scrutinize the prompts given to a Large Language Model (LLM). The
-objective is to ensure these prompts are expressed using proactive, affirmative language. The focus is on
-instructions indicating what needs to be done rather than what needs to be avoided, thereby guiding the LLM more
-efficiently towards the desired output.
-
-### Test Mechanism
-
-An LLM is employed to evaluate each prompt. The prompt is graded based on its use of positive instructions with
-scores ranging between 1-10. This grade reflects how effectively the prompt leverages affirmative language while
-shying away from negative or restrictive instructions. A prompt that attains a grade equal to or above a
-predetermined threshold (7 by default) is regarded as adhering effectively to the best practices of positive
-instruction. This threshold can be custom-tailored through the test parameters.
-
-### Signs of High Risk
-
-- Low score obtained from the LLM analysis, indicating heavy reliance on negative instructions in the prompts.
-- Failure to surpass the preset minimum threshold.
-- The LLM generates ambiguous or undesirable outputs as a consequence of the negative instructions used in the
-prompt.
-
-### Strengths
-
-- Encourages the usage of affirmative, proactive language in prompts, aiding in more accurate and advantageous
-model responses.
-- The test result provides a comprehensible score, helping to understand how well a prompt follows the positive
-instruction best practices.
-
-### Limitations
-
-- Despite an adequate score, a prompt could still be misleading or could lead to undesired responses due to factors
-not covered by this test.
-- The test necessitates an LLM for evaluation, which might not be available or feasible in certain scenarios.
-- A numeric scoring system, while straightforward, may oversimplify complex issues related to prompt designing and
-instruction clarity.
-- The effectiveness of the test hinges significantly on the predetermined threshold level, which can be subjective
-and may need to be adjusted according to specific use-cases.
\ No newline at end of file
diff --git a/site/tests/prompt_validation/Robustness.md b/site/tests/prompt_validation/Robustness.md
deleted file mode 100644
index c3219b553b..0000000000
--- a/site/tests/prompt_validation/Robustness.md
+++ /dev/null
@@ -1,40 +0,0 @@
-# Robustness
-
-Assesses the robustness of prompts provided to a Large Language Model under varying conditions and contexts. This test
-specifically measures the model's ability to generate correct classifications with the given prompt even when the
-inputs are edge cases or otherwise difficult to classify.
-
-### Purpose
-
-The Robustness test is meant to evaluate the resilience and reliability of prompts provided to a Language Learning
-Model (LLM). The aim of this test is to guarantee that the prompts consistently generate accurate and expected
-outputs, even in diverse or challenging scenarios. This test is only applicable to LLM-powered text classification
-tasks where the prompt has a single input variable.
-
-### Test Mechanism
-
-The Robustness test appraises prompts under various conditions, alterations, and contexts to ascertain their
-stability in producing consistent responses from the LLM. Factors evaluated include different phrasings, inclusion
-of potential distracting elements, and various input complexities. By default, the test generates 10 inputs for a
-prompt but can be adjusted according to test parameters.
-
-### Signs of High Risk
-
-- If the output from the tests diverges extensively from the expected results, this indicates high risk.
-- When the prompt doesn't give a consistent performance across various tests.
-- A high risk is indicated when the prompt is susceptible to breaking, especially when the output is expected to be
-of a specific type.
-
-### Strengths
-
-- The robustness test helps to ensure stable performance of the LLM prompts and lowers the chances of generating
-unexpected or off-target outputs.
-- This test is vital for applications where predictability and reliability of the LLM’s output are crucial.
-
-### Limitations
-
-- Currently, the test only supports single-variable prompts, which restricts its application to more complex models.
-- When there are too many target classes (over 10), the test is skipped, which can leave potential vulnerabilities
-unchecked in complex multi-class models.
-- The test may not account for all potential conditions or alterations that could show up in practical use
-scenarios.
\ No newline at end of file
diff --git a/site/tests/prompt_validation/Specificity.md b/site/tests/prompt_validation/Specificity.md
deleted file mode 100644
index 80780d71ea..0000000000
--- a/site/tests/prompt_validation/Specificity.md
+++ /dev/null
@@ -1,38 +0,0 @@
-# Specificity
-
-Evaluates and scores the specificity of prompts provided to a Large Language Model (LLM), based on clarity, detail,
-and relevance.
-
-### Purpose
-
-The Specificity Test evaluates the clarity, precision, and effectiveness of the prompts provided to a Language
-Model (LLM). It aims to ensure that the instructions embedded in a prompt are indisputably clear and relevant,
-thereby helping to remove ambiguity and steer the LLM towards desired outputs. This level of specificity
-significantly affects the accuracy and relevance of LLM outputs.
-
-### Test Mechanism
-
-The Specificity Test employs an LLM to grade each prompt based on clarity, detail, and relevance parameters within
-a specificity scale that extends from 1 to 10. On this scale, prompts scoring equal to or more than a predefined
-threshold (set to 7 by default) pass the evaluation, while those scoring below this threshold fail it. Users can
-adjust this threshold as per their requirements.
-
-### Signs of High Risk
-
-- Prompts scoring consistently below the established threshold
-- Vague or ambiguous prompts that do not provide clear direction to the LLM
-- Overly verbose prompts that may confuse the LLM instead of providing clear guidance
-
-### Strengths
-
-- Enables precise and clear communication with the LLM to achieve desired outputs
-- Serves as a crucial means to measure the effectiveness of prompts
-- Highly customizable, allowing users to set their threshold based on specific use cases
-
-### Limitations
-
-- This test doesn't consider the content comprehension capability of the LLM
-- High specificity score doesn't guarantee a high-quality response from the LLM, as the model's performance is also
-dependent on various other factors
-- Striking a balance between specificity and verbosity can be challenging, as overly detailed prompts might confuse
-or mislead the model
\ No newline at end of file
diff --git a/site/tests/stats/CorrelationAnalysis.md b/site/tests/stats/CorrelationAnalysis.md
deleted file mode 100644
index 9578f41faf..0000000000
--- a/site/tests/stats/CorrelationAnalysis.md
+++ /dev/null
@@ -1,41 +0,0 @@
-# CorrelationAnalysis
-
-Performs comprehensive correlation analysis with significance testing for numerical features.
-
-### Purpose
-
-This test conducts detailed correlation analysis between numerical features, including
-correlation coefficients, significance testing, and identification of significant
-relationships. It helps identify multicollinearity, feature relationships, and
-potential redundancies in the dataset.
-
-### Test Mechanism
-
-The test computes correlation coefficients using the specified method and performs
-statistical significance testing for each correlation pair. It provides:
-- Correlation matrix with significance indicators
-- List of significant correlations above threshold
-- Summary statistics about correlation patterns
-- Identification of highly correlated feature pairs
-
-### Signs of High Risk
-
-- Very high correlations (>0.9) indicating potential multicollinearity
-- Many significant correlations suggesting complex feature interactions
-- Features with no significant correlations to others (potential isolation)
-- Unexpected correlation patterns contradicting domain knowledge
-
-### Strengths
-
-- Provides statistical significance testing for correlations
-- Supports multiple correlation methods (Pearson, Spearman, Kendall)
-- Identifies potentially problematic high correlations
-- Filters results by minimum correlation threshold
-- Comprehensive summary of correlation patterns
-
-### Limitations
-
-- Limited to numerical features only
-- Cannot detect non-linear relationships (except with Spearman)
-- Significance testing assumes certain distributional properties
-- Correlation does not imply causation
\ No newline at end of file
diff --git a/site/tests/stats/DescriptiveStats.md b/site/tests/stats/DescriptiveStats.md
deleted file mode 100644
index aab7f36314..0000000000
--- a/site/tests/stats/DescriptiveStats.md
+++ /dev/null
@@ -1,42 +0,0 @@
-# DescriptiveStats
-
-Provides comprehensive descriptive statistics for numerical features in a dataset.
-
-### Purpose
-
-This test generates detailed descriptive statistics for numerical features, including
-basic statistics, distribution measures, confidence intervals, and normality tests.
-It provides a comprehensive overview of data characteristics essential for
-understanding data quality and distribution properties.
-
-### Test Mechanism
-
-The test computes various statistical measures for each numerical column:
-- Basic statistics: count, mean, median, std, min, max, quartiles
-- Distribution measures: skewness, kurtosis, coefficient of variation
-- Confidence intervals for the mean
-- Normality tests (Shapiro-Wilk for small samples, Anderson-Darling for larger)
-- Missing value analysis
-
-### Signs of High Risk
-
-- High skewness or kurtosis indicating non-normal distributions
-- Large coefficients of variation suggesting high data variability
-- Significant results in normality tests when normality is expected
-- High percentage of missing values
-- Extreme outliers based on IQR analysis
-
-### Strengths
-
-- Comprehensive statistical analysis in a single test
-- Includes advanced statistical measures beyond basic descriptives
-- Provides confidence intervals for uncertainty quantification
-- Handles missing values appropriately
-- Suitable for both exploratory and confirmatory analysis
-
-### Limitations
-
-- Limited to numerical features only
-- Normality tests may not be meaningful for all data types
-- Large datasets may make some tests computationally expensive
-- Interpretation requires statistical knowledge
\ No newline at end of file
diff --git a/site/tests/stats/NormalityTests.md b/site/tests/stats/NormalityTests.md
deleted file mode 100644
index 2cf3535e11..0000000000
--- a/site/tests/stats/NormalityTests.md
+++ /dev/null
@@ -1,34 +0,0 @@
-# NormalityTests
-
-Performs multiple normality tests on numerical features to assess distribution normality.
-
-### Purpose
-
-This test evaluates whether numerical features follow a normal distribution using
-various statistical tests. Understanding distribution normality is crucial for
-selecting appropriate statistical methods and model assumptions.
-
-### Test Mechanism
-
-The test applies multiple normality tests:
-- Shapiro-Wilk test: Best for small to medium samples
-- Anderson-Darling test: More sensitive to deviations in tails
-- Kolmogorov-Smirnov test: General goodness-of-fit test
-
-### Signs of High Risk
-
-- Multiple normality tests failing consistently
-- Very low p-values indicating strong evidence against normality
-- Conflicting results between different normality tests
-
-### Strengths
-
-- Multiple statistical tests for robust assessment
-- Clear pass/fail indicators for each test
-- Suitable for different sample sizes
-
-### Limitations
-
-- Limited to numerical features only
-- Some tests sensitive to sample size
-- Perfect normality is rare in real data
\ No newline at end of file
diff --git a/site/tests/stats/OutlierDetection.md b/site/tests/stats/OutlierDetection.md
deleted file mode 100644
index 06ddb93cb9..0000000000
--- a/site/tests/stats/OutlierDetection.md
+++ /dev/null
@@ -1,34 +0,0 @@
-# OutlierDetection
-
-Detects outliers in numerical features using multiple statistical methods.
-
-### Purpose
-
-This test identifies outliers in numerical features using various statistical
-methods including IQR, Z-score, and Isolation Forest. It provides comprehensive
-outlier detection to help identify data quality issues and potential anomalies.
-
-### Test Mechanism
-
-The test applies multiple outlier detection methods:
-- IQR method: Values beyond Q1 - 1.5*IQR or Q3 + 1.5*IQR
-- Z-score method: Values with |z-score| > threshold
-- Isolation Forest: ML-based anomaly detection
-
-### Signs of High Risk
-
-- High percentage of outliers indicating data quality issues
-- Inconsistent outlier detection across methods
-- Extreme outliers that significantly deviate from normal patterns
-
-### Strengths
-
-- Multiple detection methods for robust outlier identification
-- Customizable thresholds for different sensitivity levels
-- Clear summary of outlier patterns across features
-
-### Limitations
-
-- Limited to numerical features only
-- Some methods assume normal distributions
-- Threshold selection can be subjective
\ No newline at end of file
diff --git a/site/training/administrator-fundamentals/_invite-new-user.qmd b/site/training/administrator-fundamentals/_invite-new-user.qmd
index 104a05816f..6c999f1ed5 100644
--- a/site/training/administrator-fundamentals/_invite-new-user.qmd
+++ b/site/training/administrator-fundamentals/_invite-new-user.qmd
@@ -34,7 +34,7 @@ b. Then, confirm that the invitation has disappeared from Pending Invites and th
 :::: {.content-hidden unless-format="revealjs"}
 **Invite a new user**
 
-1. Enter in the details under Invite by Email:
+1. Enter the details under Invite by Email:
   - **Group** — The group you created earlier.
   - **Role** — The role you created earlier.
 2. Click **{{< fa envelope >}} Send Invite**.
diff --git a/site/training/administrator-fundamentals/onboarding-your-organization.qmd b/site/training/administrator-fundamentals/onboarding-your-organization.qmd
index be2041460c..140a167272 100644
--- a/site/training/administrator-fundamentals/onboarding-your-organization.qmd
+++ b/site/training/administrator-fundamentals/onboarding-your-organization.qmd
@@ -165,7 +165,7 @@ Get your organization ready for use by first defining business units and use cas
 :::
 
 1. Click **{{< fa plus >}} Add Business Unit** under Business Units.
-2. Enter in your **[business unit name]{.smallcaps}**.
+2. Enter your **[business unit name]{.smallcaps}**.
 3. Click **Add Business Unit** to save your changes.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
diff --git a/site/training/administrator-fundamentals/organizational-oversight-reporting.qmd b/site/training/administrator-fundamentals/organizational-oversight-reporting.qmd
index e7d106a638..728fc2488f 100644
--- a/site/training/administrator-fundamentals/organizational-oversight-reporting.qmd
+++ b/site/training/administrator-fundamentals/organizational-oversight-reporting.qmd
@@ -112,7 +112,48 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 
 :::: {.columns}
 ::: {.column width="30%" .pr4 .f2}
-Review workflows
+Review workflow executions
+
+::: {.f5 .nt2 .pl2 .mb4}
+(Scroll down for the full instructions.)
+:::
+
+::: {.tc}
+[Learn more ...](/guide/workflows/working-with-workflows.qmd#view-all-workflow-executions){.button target="_blank"}
+:::
+
+<br>Try it **live** on the next page. {{< fa hand-point-right >}}
+
+:::
+
+::: {.column width="70%" .bl .pl4 .f4}
+
+{{< include /guide/workflows/_view-workflow-executions.qmd >}}
+
+:::
+::::
+
+## {background-iframe="https://app.prod.validmind.ai/workflows" background-interactive="true" data-preload="yes"}
+
+:::: {.slideover--b .three-quarters .auto-collapse-10}
+::: {.tc}
+**View all workflow executions**
+:::
+
+- Use the buttons or keyboard shortcuts to control the timeline.
+- Use **{{< fa magnifying-glass >}} Search** to search the timeline.
+- Use **{{< fa filter >}} Filter** to filter the timeline.
+- Click on any listed workflow to review the details of that specific workflow.
+
+When you're done, click [{{< fa chevron-right >}}]() to continue.
+
+::::
+
+## {.scrollable}
+
+:::: {.columns}
+::: {.column width="30%" .pr4 .f2}
+Review workflows on records & artifacts
 
 ::: {.f5 .nt2 .pl2 .mb4}
 (Scroll down for the full instructions.)
@@ -266,7 +307,7 @@ Manage custom reports
 :::
 
 1. Click **{{< fa plus >}} Add Page**.
-2. On the Add New Page module, enter in the **[page name]{.smallcaps}** and the **[description]{.smallcaps}**.
+2. On the Add New Page module, enter the **[page name]{.smallcaps}** and the **[description]{.smallcaps}**.
 3. Click **Add New Page** to create your custom analytics page.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
@@ -282,7 +323,7 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 1. Click on the tab for the custom page you added previously.
 1. Click **{{< fa pencil >}} Edit Dashboard** and select **{{< fa pencil >}} Add Widget** then **{{< fa pencil >}} Add Visualization**.
-3. On the Add Visualization panel, enter in your **[title]{.smallcaps}**.
+3. On the Add Visualization panel, enter your **[title]{.smallcaps}**.
 4. Select a **[visualization type]{.smallcaps}**.
 5. Select a **[dataset]{.smallcaps}**.
 6. Select the visualization configuration options to apply to the dataset.
@@ -311,8 +352,8 @@ Organizational oversight & reporting
 ::: {.column width="70%" .bl .pl4 .f3}
 In this final module, you learned how to:
 
-- [x] Track updates on models
-- [x] Review workflows and workflow history on models
+- [x] Track updates on records
+- [x] Review workflows and workflow history
 - [x] Navigate the analytics dashboard
 - [x] Create custom report dashboards and visualizations
 
@@ -321,7 +362,7 @@ In this final module, you learned how to:
 
 ::: {.f2}
 <br>
-There is more that {{< var vm.product >}} can do to help you oversee models and unite your model risk management teams within one comprehensive tool:
+There is more that {{< var vm.product >}} can do to help you oversee records and unite your risk management teams within one comprehensive tool:
 :::
 
 ::: {.tc}
diff --git a/site/training/administrator-fundamentals/using-validmind-for-risk-management.qmd b/site/training/administrator-fundamentals/using-validmind-for-risk-management.qmd
index 9e99b6ee60..e1de109313 100644
--- a/site/training/administrator-fundamentals/using-validmind-for-risk-management.qmd
+++ b/site/training/administrator-fundamentals/using-validmind-for-risk-management.qmd
@@ -233,10 +233,10 @@ Configure custom workflows
 
 <br>Try it **live** on the next pages. {{< fa hand-point-right >}}
 
-::: {.f5 .pl3 .mt4 .pr3 .embed}
+<!-- ::: {.f5 .pl3 .mt4 .pr3 .embed}
 For more assistance configuring workflows, refer to our [Workflow configuration examples](/guide/workflows/workflow-configuration-examples.qmd){target="_blank"}.
 
-:::
+::: -->
 
 :::
 
@@ -278,7 +278,7 @@ To set up a new custom workflow, you'll need to complete these four steps in seq
 
 1. Click **{{< fa plus >}} Add Workflow**.
 2. Select **Inventory Record** under [workflow target]{.smallcaps}.
-3. Enter in a **[title]{.smallcaps}** and a **[description]{.smallcaps}** the workflow.
+3. Enter a **[title]{.smallcaps}** and a **[description]{.smallcaps}** for the workflow.
 4. Under [record type]{.smallcaps}, select **Model**.
 5. Under **[workflow start]{.smallcaps}**, select **Manually**.
 6. Under **[workflow expected duration]{.smallcaps}**, define the SLA for the workflow.
@@ -548,7 +548,7 @@ Add assessment questions
 2. Select the regulation or policy you added previously by clicking on it.
 3. Select the assessment you added previously by clicking on it.
 4. Click **{{< fa plus >}} Add Question** to create a new question.
-5. Enter in the **[questions]{.smallcaps}**.
+5. Enter the **[questions]{.smallcaps}**.
 6. Click **Add # Question(s)** to insert questions into the assessment.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
@@ -664,7 +664,7 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 Click on the name of the attestation you added previously to configure it:
 
 1. Click **{{< fa plus >}} Add Attestation Period** and add a period.
-    - Enter in the **[name]{.smallcaps}**, **[start date]{.smallcaps}**, and **[end date]{.smallcaps}**.
+    - Enter the **[name]{.smallcaps}**, **[start date]{.smallcaps}**, and **[end date]{.smallcaps}**.
     - Click **Add Period**.
 2. Under Relevant Attestation Fields, drag fields into the **Relevant Attestation Fields** column to display in model snapshots.
 3. Under Questionnaire Template, click the template area to edit, then click **Save** to apply your changes.
diff --git a/site/training/ai-governance/compliance-and-oversight.qmd b/site/training/ai-governance/compliance-and-oversight.qmd
index 55746c12d3..cdd98a94c4 100644
--- a/site/training/ai-governance/compliance-and-oversight.qmd
+++ b/site/training/ai-governance/compliance-and-oversight.qmd
@@ -66,7 +66,7 @@ Key governance regulations include:
 | Regulation | Jurisdiction | Focus |
 |------------|--------------|-------|
 | [EU AI Act](https://eur-lex.europa.eu/eli/reg/2024/1689){target="_blank"} | European Union | Risk-based AI regulation |
-| [SR 11-7](https://www.federalreserve.gov/supervisionreg/srletters/sr1107.htm){target="_blank"} | United States | Model risk management |
+| [SR 26-2](https://www.federalreserve.gov/supervisionreg/srletters/SR2602.htm){target="_blank"} | United States | Model risk management |
 | [SS1/23](https://www.bankofengland.co.uk/prudential-regulation/publication/2023/may/model-risk-management-principles-for-banks-ss){target="_blank"} | United Kingdom | MRM principles |
 | [E-23](https://www.osfi-bsif.gc.ca/en/guidance/guidance-library/guideline-e-23-model-risk-management-2027){target="_blank"} | Canada | Enterprise-wide MRM & AI/ML risk |
 :::
@@ -96,7 +96,7 @@ Use our implementation guides for:
 ::: {.f4 .pl3 .pt2}
 [[AI Governance<br>[[[EU AI ACT]{.green}]{.bubble}]{.f5}](/about/use-cases/ai-governance.qmd){target="_blank"}]{.button .shadow-5-ns .f4 .content-tile style="width: 100%;"}
 
-[[Model Risk Management<br>[[[SR 11-7]{.green}]{.bubble} [[SS1/23]{.green}]{.bubble} [[E-23]{.green}]{.bubble}]{.f5}](/about/use-cases/model-risk-management.qmd){target="_blank"}]{.button .shadow-5-ns .f4 .content-tile style="width: 100%;"}
+[[Model Risk Management<br>[[[SR 26-2]{.green}]{.bubble} [[SS1/23]{.green}]{.bubble} [[E-23]{.green}]{.bubble}]{.f5}](/about/use-cases/model-risk-management.qmd){target="_blank"}]{.button .shadow-5-ns .f4 .content-tile style="width: 100%;"}
 :::
 :::
 
@@ -126,7 +126,7 @@ Use our implementation guides for:
 
 - [AI governance](/about/use-cases/ai-governance.qmd){target="_blank" .button}
 - [EU AI Act](/about/use-cases/eu-ai-act.qmd){target="_blank" .button}
-- [SR 11-7](/about/use-cases/sr-11-7.qmd){target="_blank" .button}
+- [SR 26-2](/about/use-cases/sr-26-2.qmd){target="_blank" .button}
 - [SS1/23](/about/use-cases/ss1-23.qmd){target="_blank" .button}
 - [E-23](/about/use-cases/e-23.qmd){target="_blank" .button} -->
 
diff --git a/site/training/assets/slides.scss b/site/training/assets/slides.scss
index 9e8fa51958..16bc95f076 100644
--- a/site/training/assets/slides.scss
+++ b/site/training/assets/slides.scss
@@ -59,6 +59,15 @@ section.has-dark-background a:hover {
   color: #042426 !important; 
 }
 
+/* Quarto's revealjs theme forces <kbd> to the presentation root font size,
+   which makes keyboard keys render much larger than surrounding bullet/body text.
+   Scale kbd down to inherit from its container so it matches text contexts like .f4/.f5. */
+.reveal .slide kbd {
+  font-size: inherit;
+  padding: 0.15em 0.4em;
+  vertical-align: baseline;
+}
+
 .reveal .footer a {
   color: #DE257E !important;
 }
diff --git a/site/training/common-slides/_document-overview.qmd b/site/training/common-slides/_document-overview.qmd
index a89903f202..fea9b761a7 100644
--- a/site/training/common-slides/_document-overview.qmd
+++ b/site/training/common-slides/_document-overview.qmd
@@ -2,6 +2,7 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
+:::: {.content-visible when-format="revealjs" when-meta="includes.developer"}
 ## {.scrollable .center}
 
 :::: {.columns}
@@ -9,7 +10,7 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 **Document Overview**
 
 ::: {.tc}
-[Learn more...](/guide/validation/review-documentation.qmd){.button target="_blank"}
+[Learn more...](/guide/documentation/working-with-documentation.html#document-overview){.button target="_blank"}
 :::
 <br>
 
@@ -24,4 +25,35 @@ Try it **live** on the next page. {{< fa hand-point-right >}}
 {{< include /guide/documentation/_locate-document-overview.qmd >}}
 
 :::
+::::
+
+
+::::
+
+
+:::: {.content-visible when-format="revealjs" unless-meta="includes.developer"}
+## {.scrollable .center}
+
+:::: {.columns}
+::: {.column width="30%" .pr4 .f2}
+**Document Overview**
+
+::: {.tc}
+[Learn more...](/guide/validation/review-documentation.qmd#document-overview){.button target="_blank"}
+:::
+<br>
+
+Try it **live** on the next page. {{< fa hand-point-right >}}
+
+:::
+
+::: {.column width="70%" .bl .pl4 .f3}
+
+{{< include /guide/documentation/_document-overview.qmd >}}
+
+{{< include /guide/documentation/_locate-document-overview.qmd >}}
+
+:::
+::::
+
 ::::
\ No newline at end of file
diff --git a/site/training/common-slides/_get-your-code-snippet.qmd b/site/training/common-slides/_get-your-code-snippet.qmd
index cc7ca2d838..86abe88aad 100644
--- a/site/training/common-slides/_get-your-code-snippet.qmd
+++ b/site/training/common-slides/_get-your-code-snippet.qmd
@@ -12,6 +12,11 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 :::: {.content-visible when-format="revealjs" when-meta="includes.developer"}
 ## Get your code snippet
 
+::: {.f4}
+Initialize the {{< var validmind.developer >}} with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the {{< var validmind.platform >}} when you run the {{< var vm.developer >}}:
+
+:::
+
 :::: {.columns}
 
 ::: {.column width="80%"}
@@ -35,28 +40,27 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 ::: {.column width="20%" .f4}
 
 ::: {.f5}
-{{< var vm.product >}} generates a unique *code snippet* for each registered model to connect with your local environment:
-
 1. Select the name of your model you registered for this course to open up the model details page.
 2. On the left sidebar that appears for your model, click **Getting Started**.
 3. Select `Development` from the **[document]{.smallcaps}** drop-down menu.
 4. Click **Copy snippet to clipboard**.
 
-:::
-
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
-:::
-
-::::
-
-:::: {.tc .f6 .embed}
+::: {.pl2 .f6 .embed}
 **Can't load the {{< var validmind.platform >}}?**
 
 Make sure you're logged in and have refreshed the page in a Chromium-based web browser.
 
 :::
 
+:::
+
+:::
+
+::::
+
+
 ::::
 
 <!-- VISIBLE ONLY ON PAGES THAT **DO NOT** HAVE A CUSTOM METADATA TAG:
@@ -68,6 +72,11 @@ Make sure you're logged in and have refreshed the page in a Chromium-based web b
 :::: {.content-visible when-format="revealjs" unless-meta="includes.developer"}
 ## Get your code snippet
 
+::: {.f4}
+Initialize the {{< var validmind.developer >}} with the *code snippet* unique to each record per document, ensuring your test results are uploaded to the correct record and automatically populated in the right document in the {{< var validmind.platform >}} when you run the {{< var vm.developer >}}:
+
+:::
+
 :::: {.columns}
 
 ::: {.column width="80%"}
@@ -91,28 +100,27 @@ Make sure you're logged in and have refreshed the page in a Chromium-based web b
 ::: {.column width="20%" .f4}
 
 ::: {.f5}
-{{< var vm.product >}} generates a unique *code snippet* for each registered model to connect with your local environment:
-
 1. Select the name of your model you registered for this course to open up the model details page.
 2. On the left sidebar that appears for your model, click **Getting Started**.
 3. Select `Validation` from the **[document]{.smallcaps}** drop-down menu.
 4. Click **Copy snippet to clipboard**.
 
-:::
-
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
-:::
-
-::::
-
-:::: {.tc .f6 .embed}
+::: {.pl2 .f6 .embed}
 **Can't load the {{< var validmind.platform >}}?**
 
 Make sure you're logged in and have refreshed the page in a Chromium-based web browser.
 
 :::
 
+:::
+
+:::
+
+::::
+
+
 ::::
 
 
diff --git a/site/training/common-slides/_register-sample-model.qmd b/site/training/common-slides/_register-sample-model.qmd
index 2963746d15..7a7c5349e1 100644
--- a/site/training/common-slides/_register-sample-model.qmd
+++ b/site/training/common-slides/_register-sample-model.qmd
@@ -9,8 +9,8 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 ::: {.slideover--r .three-quarters .auto-collapse-10}
 **Register a sample model**
 
-1. Enter in some details for your sample model, then click **Next {{< fa angle-right >}}**.
-2. Select your own name under the **[model owner]{.smallcaps}** drop-down.
+1. Enter some details for your sample model, then click **Next {{< fa angle-right >}}**.
+2. Select your own name under the **[record owner]{.smallcaps}** drop-down.
 3. Click **Register Model** to add the model to your inventory.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
@@ -28,8 +28,8 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 ::: {.slideover--r .three-quarters .auto-collapse-10}
 **Register a sample model**
 
-1. Enter in some details for your sample model, then click **Next {{< fa angle-right >}}**.
-2. Select your own name under the **[model owner]{.smallcaps}** drop-down — don't worry, we'll adjust these permissions next for validation.
+1. Enter some details for your sample model, then click **Next {{< fa angle-right >}}**.
+2. Select your own name under the **[record owner]{.smallcaps}** drop-down — don't worry, we'll adjust these permissions next for validation.
 3. Click **Register Model** to add the model to your inventory.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
diff --git a/site/training/common-slides/_review-model-activity.qmd b/site/training/common-slides/_review-model-activity.qmd
index 134da303d6..8f7b98133e 100644
--- a/site/training/common-slides/_review-model-activity.qmd
+++ b/site/training/common-slides/_review-model-activity.qmd
@@ -6,12 +6,12 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
 :::: {.slideover--b .auto-collapse-10}
 ::: {.tc}
-**Review record activity**
+**Review model activity**
 :::
 
-1. Select the name of your record you registered for this course to open up the recird details page.
-2. In the left sidebar that appears for your record, click **{{< fa wifi >}} Activity**.
-3. Confirm activity logged on the record reflects your activities from this training course.
+1. Select the name of your model you registered for this course to open up the model details page.
+2. In the left sidebar that appears for your model, click **{{< fa wifi >}} Activity**.
+3. Confirm activity logged on the model reflects your activities from this training course.
 4. (Optional) Filter the activity by category or specific values to narrow down results.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
diff --git a/site/training/common-slides/_submit-for-approval.qmd b/site/training/common-slides/_submit-for-approval.qmd
index 80e4472566..fbc2f44bf0 100644
--- a/site/training/common-slides/_submit-for-approval.qmd
+++ b/site/training/common-slides/_submit-for-approval.qmd
@@ -9,8 +9,8 @@ SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 **Submit for approval**
 :::
 
-1. Select the name of your record you registered for this course to open up the record details page.
-2. On the landing page of your record, locate the [active workflows]{.smallcaps} section and the workflow you'd like to transition.
+1. Select the name of your model you registered for this course to open up the model details page.
+2. On the landing page of your model, locate the [active workflows]{.smallcaps} section and the workflow you'd like to transition.
 3. If an action is available to your role, you'll see it listed under that workflow:
     - Click **{{< fa arrow-right >}}** to open up the transition panel for your selected action. This arrow will be followed by the action name.
     - Enter your **[notes]{.smallcaps}** and any other additional inventory fields then click **Submit**.
diff --git a/site/training/common-slides/_validmind-test-repository.qmd b/site/training/common-slides/_validmind-test-repository.qmd
index ab758f54db..e2ab46b5d8 100644
--- a/site/training/common-slides/_validmind-test-repository.qmd
+++ b/site/training/common-slides/_validmind-test-repository.qmd
@@ -2,12 +2,12 @@
 Refer to the LICENSE file in the root of this repository for details.
 SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial -->
 
-## {background-iframe="/developer/test-descriptions.html" background-interactive="true" data-preload="yes"}
+## {background-iframe="/developer/how-to/test-sandbox.html" background-interactive="true" data-preload="yes"}
 
 :::: {.slideover--l .three-quarters .auto-collapse-5}
 **{{< var vm.product >}} test repository**
 
-{{< var vm.product >}} provides a wealth out-of-the-box of tests to help you ensure that your model is being built appropriately.
+{{< var vm.product >}} provides a wealth of out-of-the-box tests to help you ensure that your record (model) is being built appropriately.
 
 In this module, you'll become familiar with the individual tests available in {{< var vm.product >}}, as well as how to run them and change parameters as necessary.
 
diff --git a/site/training/developer-fundamentals/developer-fundamentals-register.qmd b/site/training/developer-fundamentals/developer-fundamentals-register.qmd
index 9cc70cb7df..ca0a84e2f3 100644
--- a/site/training/developer-fundamentals/developer-fundamentals-register.qmd
+++ b/site/training/developer-fundamentals/developer-fundamentals-register.qmd
@@ -17,34 +17,34 @@ listing:
     table-hover: true
     image-align: left
     contents:
-    - path: using-validmind-for-model-development.html
-      title: "Using {{< var vm.product >}} for Model Development"
+    - path: using-validmind-for-development.html
+      title: "Using {{< var vm.product >}} for Development"
       subtitle: "Module 1"
-      description: "{{< fa check >}} Register a model in the {{< var validmind.platform >}} <br> {{< fa check >}} Install the {{< var validmind.developer >}} in your environment <br> {{< fa check >}} Connect to your registered model <br> {{< fa check >}} Preview your model's documentation template"
+      description: "{{< fa check >}} Register a record (model) in the {{< var validmind.platform >}} <br> {{< fa check >}} Install the {{< var validmind.developer >}} in your environment <br> {{< fa check >}} Connect to your registered model <br> {{< fa check >}} Preview your documentation template"
       reading-time: "15"
       author: "{{< var vm.product >}}"
     - path: learning-to-run-tests.html
       title: "Learning to Run Tests"
       subtitle: "Module 2"
-      description: "{{< fa check >}} Identify relevant tests to run from {{< var vm.product >}}'s test vault <br> {{< fa check >}} Initialize datasets & models for use with the {{< var validmind.developer >}} <br> {{< fa check >}} Run and log out-of-the-box tests for new and existing models <br> {{< fa check >}} Insert test results into your model's documentation"
+      description: "{{< fa check >}} Identify relevant tests to run from {{< var vm.product >}}'s test vault <br> {{< fa check >}} Initialize ValidMind objects for use with the {{< var vm.developer >}} <br> {{< fa check >}} Run and log out-of-the-box tests <br> {{< fa check >}} Insert test results into your documentation"
       reading-time: "45"
       author: "{{< var vm.product >}}"
     - path: implementing-custom-tests.html
       title: "Implementing Custom Tests"
       subtitle: "Module 3"
-      description: "{{< fa check >}} Implement, run, and log custom inline and reusable tests <br> {{< fa check >}} Refresh your template to include inserted test-driven blocks <br> {{< fa check >}} Configure your template to include custom tests"
+      description: "{{< fa check >}} Implement, run, and log custom inline and reusable tests <br> {{< fa check >}} Refresh template to include inserted test-driven blocks <br> {{< fa check >}} Configure template to include custom tests"
       reading-time: "60"
       author: "{{< var vm.product >}}"
-    - path: finalizing-model-documentation.html
-      title: "Finalizing Model Documentation"
+    - path: finalizing-documentation.html
+      title: "Finalizing Documentation"
       subtitle: "Module 4"
-      description: "{{< fa check >}} Refine your model documentation <br> {{< fa check >}} Submit your model documentation for approval <br> {{< fa check >}} Track changes and other updates to your model"
+      description: "{{< fa check >}} Refine your documentation <br> {{< fa check >}} Submit your documentation for approval <br> {{< fa check >}} Track changes and other updates to your record (model)"
       reading-time: "30"
       author: "{{< var vm.product >}}"
     fields: [title, subtitle, description, reading-time]
 ---
 
-Learn how to use {{< var vm.product >}} as a **developer** to generate model documentation, automate testing, and track your model's progress through the model lifecycle.
+Learn how to use {{< var vm.product >}} as a **developer** to generate documentation, automate testing, and track your record's progress throughout its entire lifecycle.
 
 ::: {.column-margin}
 {{< include /training/_compatibility.qmd >}}
diff --git a/site/training/developer-fundamentals/finalizing-model-documentation.qmd b/site/training/developer-fundamentals/finalizing-documentation.qmd
similarity index 75%
rename from site/training/developer-fundamentals/finalizing-model-documentation.qmd
rename to site/training/developer-fundamentals/finalizing-documentation.qmd
index 7f5723f1e8..ddfc6a166c 100644
--- a/site/training/developer-fundamentals/finalizing-model-documentation.qmd
+++ b/site/training/developer-fundamentals/finalizing-documentation.qmd
@@ -2,8 +2,10 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Finalizing <br>Model Documentation"
+title: "Finalizing <br>Documentation"
 subtitle: "Developer Fundamentals — Module 4 of 4<br><br>_Click [{{< fa chevron-right >}}](#learning-objectives) to start_"
+aliases:
+  - /training/developer-fundamentals/finalizing-model-documentation.html
 lightbox: true
 format:
   revealjs:
@@ -26,7 +28,7 @@ format:
       - slideover
   html:
   # Change this to the file name prepended by a _ to get around the global HTML output settings required by _metadata.yml
-    output-file: _finalizing-model-documentation.html
+    output-file: _finalizing-documentation.html
     search: false
 title-slide-attributes:
   data-background-color: "#083E44"
@@ -34,11 +36,12 @@ title-slide-attributes:
 skip_preview: true
 includes:
   developer: true
+  pdf-context: true
 ---
 
 # Learning objectives {.center}
 
-_"As a **developer** who has logged tests with the {{< var validmind.developer >}} to the {{< var validmind.platform >}}, I want to refine my model's documentation, submit my model documentation for approval, and track changes and other updates to my model."_
+_"As a **developer** who has logged tests with the {{< var validmind.developer >}} to the {{< var validmind.platform >}}, I want to refine my documentation, submit my documentation for approval, and track changes and other updates to my record (model)."_
 
 ::: {.tc}
 <br>
@@ -51,10 +54,10 @@ This final module is part of a four-part series:
 ## Module 4 — Contents {.center}
 
 ::: {.f2}
-1. [Refine model documentation](#refine-model-documentation)
+1. [Refine documentation](#refine-documentation)
 3. [Submit documentation for approval](#submit-documentation-for-approval)
 4. [Collaborate with others](#collaborate-with-others)
-5. [Track record activity](#track-model-activity)
+5. [Track activity](#track-activity)
 6. [View analytics](#view-analytics)
 
 :::
@@ -76,7 +79,7 @@ To continue, you need to have been [onboarded](developer-fundamentals-register.q
 :::: {.columns}
 ::: {.column width="30%"}
 ::: {.tc}
-[Module 1](using-validmind-for-model-development.html){.button target="_blank"}
+[Module 1](using-validmind-for-development.html){.button target="_blank"}
 :::
 
 :::
@@ -104,7 +107,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 
 :::
 
-# Refine model documentation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Refine documentation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 ## {.scrollable .center}
 
@@ -136,9 +139,9 @@ From the {{< var validmind.platform >}}:
 
 1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
 
-2. Select the name of your record you registered for this course to open up the record details page.
+2. Select the name of your model you registered for this course to open up the model details page.
 
-3. In the left sidebar that appears for your record, click **Development** under {{< fa file >}} Documents.
+3. In the left sidebar that appears for your model, click **Development** under {{< fa file >}} Documents.
 
 {{< include /guide/documentation/_view-test-result-metadata.qmd >}}
 
@@ -153,8 +156,8 @@ From the {{< var validmind.platform >}}:
 **Review documented test results**
 :::
 
-1. Select the name of your record you registered for this course to open up the record details page.
-2. On the left sidebar that appears for your record, click **Development** under {{< fa file >}} Documents.
+1. Select the name of your model you registered for this course to open up the model details page.
+2. On the left sidebar that appears for your model, click **Development** under {{< fa file >}} Documents.
 3. Click into any section of the documentation to review the test results logged via the {{< var validmind.developer >}}. <br>For example:
     - **2.3 Correlations and Interactions**
     - **3.2 Model Evaluation**
@@ -196,11 +199,11 @@ You can also use the content editing toolbar to revise the description of test r
 
 For example:
 
-1. Within your model documentation, locate the Data Preparation section and click on **2.3 Correlations and Interactions** to expand that section.
+1. Within your documentation, click on **2.3 Correlations and Interactions** to expand that section.
 
 2. Click on the text to edit the description for our individually inserted `HighPearsonCorrelation:balanced_raw_dataset` test:
 
-  ![Editor for a test result description](/notebooks/tutorials/model_development/high-pearson-correlation-block.png){fig-alt="Screenshot showing the editor for a test result description" .screenshot}
+  ![Editor for a test result description](/notebooks/tutorials/development/high-pearson-correlation-block.png){fig-alt="Screenshot showing the editor for a test result description" .screenshot}
 
 :::
 
@@ -215,8 +218,8 @@ For example:
 **Add & edit content blocks**
 :::
 
-1. Select the name of your record you registered for this course to open up the record details page.
-2. On the left sidebar that appears for your record, click **Development** under {{< fa file >}} Documents.
+1. Select the name of your model you registered for this course to open up the model details page.
+2. On the left sidebar that appears for your model, click **Development** under {{< fa file >}} Documents.
 3. Click into any section of the documentation to add and edit a content block.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
@@ -226,7 +229,7 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 {{< include /training/common-slides/_document-checker.qmd >}}
 
 <br>
-Learn how to **use the {{< var vm.checker >}} to review model documentation** on the next page. {{< fa hand-point-right >}}
+Learn how to **use the {{< var vm.checker >}} to review documentation** on the next page. {{< fa hand-point-right >}}
 
 ## {.scrollable}
 
@@ -257,8 +260,8 @@ Use the {{< var vm.checker >}}
 **Check your documentation**
 :::
 
-1. Select the name of your record you registered for this course to open up the record details page.
-2. On the left sidebar that appears for your record, click **Development** under {{< fa file >}} Documents.
+1. Select the name of your model you registered for this course to open up the model details page.
+2. On the left sidebar that appears for your model, click **Development** under {{< fa file >}} Documents.
 3. Locate the {{< var vm.checker >}} box on the right and click **{{< fa check >}} Check Document**.
 4. Select a **[regulation]{.smallcaps}** and an associated **[assessment]{.smallcaps}** from the drop-down menus to to check your document against.
 5. Scroll to the bottom and click **Check Document**.
@@ -312,8 +315,8 @@ Comment threads
 **Comment on documentation**
 :::
 
-1. Select the name of your record you registered for this course to open up the record details page.
-2. On the left sidebar that appears for your record, click **Development** under {{< fa file >}} Documents.
+1. Select the name of your model you registered for this course to open up the model details page.
+2. On the left sidebar that appears for your model, click **Development** under {{< fa file >}} Documents.
 3. **In the content block you added earlier**: Post a comment, reply to it, and then resolve the thread.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
@@ -321,7 +324,7 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 ::::
 
 
-# Track record activity {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Track activity {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 {{< include /training/common-slides/_track-changes-updates.qmd >}}
 
@@ -331,15 +334,15 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 ## {background-iframe="https://app.prod.validmind.ai/analytics" background-interactive="true" data-preload="yes"}
 
-:::: {.slideover--l .three-quarters .auto-collapse-10}
+:::: {.slideover--r .three-quarters .auto-collapse-10}
 **Welcome to {{< fa square-poll-vertical >}} Analytics**
 
-Here, you can find executive summaries, track information on models, artifacts, and more.
+Under analytics, you can find executive summaries, track information on records (models), artifacts, and more.
 
 For example:
 
-1. Click **Models** to review reports on models.
-3. Click into any widget to review the models reported by that widget.
+1. Select **Models** to review reports on models.
+2. Click into any widget to review the models reported by that widget.
 
 When you're done exploring, click [{{< fa chevron-right >}}]() to continue.
 
@@ -351,7 +354,7 @@ When you're done exploring, click [{{< fa chevron-right >}}]() to continue.
 
 :::: {.columns}
 ::: {.column width="30%" .pr4 .f2}
-Finalizing model documentation
+Finalizing documentation
 
 
 ::: {.f3}
@@ -365,9 +368,9 @@ Finalizing model documentation
 In this final module, you learned how to:
 
 - [x] View logged test result metadata
-- [x] Add or edit content blocks in your model documentation
-- [x] Submit your model documentation for approval
-- [x] Collaborate with other stakeholders on your model
+- [x] Add or edit content blocks in your documentation
+- [x] Submit your documentation for approval
+- [x] Collaborate with other stakeholders
 - [x] Track updates on your model
 - [x] Navigate the analytics dashboard
 
@@ -376,10 +379,11 @@ In this final module, you learned how to:
 
 ::: {.f3}
 <br>
-There is more that {{< var vm.product >}} can do to help you create model documentation, from using your own template to code samples you can adapt for your own use case:
+There is more that {{< var vm.product >}} can do to help you create documentation, from using your own template to code samples you can adapt for your own use case:
+<br><br>
 :::
 
 ::: {.tc}
-[All model documentation guides](/guide/guides.qmd#model-documentation){.button target="_blank"}
+[All documentation guides](/guide/guides.qmd#documentation){.button target="_blank"}
 
 :::
\ No newline at end of file
diff --git a/site/training/developer-fundamentals/implementing-custom-tests.qmd b/site/training/developer-fundamentals/implementing-custom-tests.qmd
index e4d2750093..278a6aa0e9 100644
--- a/site/training/developer-fundamentals/implementing-custom-tests.qmd
+++ b/site/training/developer-fundamentals/implementing-custom-tests.qmd
@@ -53,7 +53,7 @@ This third module is part of a four-part series:
 :::: {.columns .f3}
 ::: {.column width="50%" .mt4 .pr4}
 ### Introduction
-- [{{< var vm.product >}} for model development](#validmind-for-model-development)
+- [{{< var vm.product >}} for development](#validmind-for-development)
 :::
 
 :::
@@ -72,7 +72,7 @@ This third module is part of a four-part series:
 ### Section 2
 
 - [Include custom test results](#include-custom-test-results)
-- [Configure the model's documentation template](#configure-documentation-templates)
+- [Configure your documentation template](#configure-documentation-templates)
 :::
 
 ::::
@@ -97,7 +97,7 @@ To continue, you need to have been [onboarded](developer-fundamentals-register.q
 :::: {.columns}
 ::: {.column width="60%"}
 ::: {.tc}
-[Using {{< var vm.product >}} for Model Development](using-validmind-for-model-development.html){.button target="_blank"}
+[Using {{< var vm.product >}} for Development](using-validmind-for-development.html){.button target="_blank"}
 :::
 
 :::
@@ -120,7 +120,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 
 <!-- USING THE VARIABLE IN THE HEADING MESSES UP THE PAGE ANCHOR -->
 
-# ValidMind for model development {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# ValidMind for development {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 ## {.scrollable .center}
 
@@ -129,7 +129,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 Jupyter Notebook series
 
 ::: {.f3}
-When you run these notebooks, they will generate a draft of model documentation and upload it to {{< var vm.product >}}, complete with supporting test results.
+When you run these notebooks, they will generate a draft of documentation and upload it to {{< var vm.product >}}, complete with supporting test results.
 
 ::: {.f5 .nt2 .pl2 .mb4}
 <br>
@@ -142,14 +142,14 @@ You will need to have already completed notebooks **1** and **2** during the fir
 :::
 
 ::: {.column width="70%" .bl .pl4 .f3}
-#### {{< var vm.product >}} for model development
+#### {{< var vm.product >}} for development
 
-Our series of four introductory notebooks for model developers include sample code and how-to information to get you started with {{< var vm.product >}}:
+Our series of four introductory notebooks for developers includes sample code and how-to information to get you started with {{< var vm.product >}}:
 
-1 — [Set up the {{< var validmind.developer >}}](/notebooks/tutorials/model_development/1-set_up_validmind.ipynb){target="_blank"}<br>
-2 — [Start the model development process](/notebooks/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}<br>
-3 — [Integrate custom tests](/notebooks/tutorials/model_development/3-integrate_custom_tests.ipynb){target="_blank"}<br>
-4 — [Finalize testing and documentation](/notebooks/tutorials/model_development/4-finalize_testing_documentation.ipynb){target="_blank"}<br>
+1 — [Set up the {{< var validmind.developer >}}](/notebooks/tutorials/development/1-set_up_validmind.ipynb){target="_blank"}<br>
+2 — [Start the development process](/notebooks/tutorials/development/2-start_development_process.ipynb){target="_blank"}<br>
+3 — [Integrate custom tests](/notebooks/tutorials/development/3-integrate_custom_tests.ipynb){target="_blank"}<br>
+4 — [Finalize testing and documentation](/notebooks/tutorials/development/4-finalize_testing_documentation.ipynb){target="_blank"}<br>
 <br>
 
 ::: {.f4 .pl3 .pr3 .embed}
@@ -163,7 +163,7 @@ Let's continue our journey with **Section 1** on the next page. {{< fa hand-poin
 
 # Section 1 {background-color="#083E44" background-image="/assets/img/about-us-esphere.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/3-integrate_custom_tests.html" background-interactive="yes" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/3-integrate_custom_tests.html" background-interactive="yes" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **3 — Integrate custom tests**
@@ -176,14 +176,14 @@ This is the third notebook in our introductory series, which will walk you throu
 
 {{< include /training/common-slides/_get-your-code-snippet.qmd >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/3-integrate_custom_tests.html#initialize-the-validmind-library" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/3-integrate_custom_tests.html#initialize-the-validmind-library" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Connect to your model**
 
 With your code snippet copied to your clipboard:
 
-1. Open **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/3-integrate_custom_tests.ipynb){target="_blank"}
+1. Open **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/3-integrate_custom_tests.ipynb){target="_blank"}
 2. Run all the cells under the **Setting up** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -211,28 +211,28 @@ Let's implement a custom *inline test* that calculates the confusion matrix for
 :::
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/3-integrate_custom_tests.html#create-a-confusion-matrix-plot" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/3-integrate_custom_tests.html#create-a-confusion-matrix-plot" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Create a custom test**
 
 The [`@vm.test` wrapper](/validmind/validmind.qmd#test){target="_blank"} allows you to create a reusable test:
 
-1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/3-integrate_custom_tests.ipynb){target="_blank"}
+1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/3-integrate_custom_tests.ipynb){target="_blank"}
 2. Run all the cells in the following section under Implementing a custom inline test: **Create a confusion matrix plot**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/3-integrate_custom_tests.html#add-parameters-to-custom-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/3-integrate_custom_tests.html#add-parameters-to-custom-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Adjust your custom test**
 
 Custom tests can take parameters just like any other function:
 
-1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/3-integrate_custom_tests.ipynb){target="_blank"}
+1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/3-integrate_custom_tests.ipynb){target="_blank"}
 2. Run all the cells in the following sections under Implementing a custom inline test:
     - **Add parameters to custom tests**
     - **Pass parameters to custom tests**
@@ -241,21 +241,21 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/3-integrate_custom_tests.html#log-the-confusion-matrix-results" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/3-integrate_custom_tests.html#log-the-confusion-matrix-results" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Log your custom test**
 
 Use the [`.log()` method](/validmind/validmind/vm_models.qmd#log){target="_blank"} to send the results of your custom test to the {{< var validmind.platform >}}:
 
-1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/3-integrate_custom_tests.ipynb){target="_blank"}
+1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/3-integrate_custom_tests.ipynb){target="_blank"}
 2. Run the cell in the following section under Implementing a custom inline test: **Log the confusion matrix results**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-# Use external test providers {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Use external <br>test providers {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 ## {.scrollable .center}
 
@@ -270,50 +270,50 @@ Reusable custom tests
 ::: {.column width="70%" .bl .pl4 .f3}
 #### External test providers
 
-Creating inline custom tests with a function is a great way to customize your model documentation.
+Creating inline custom tests with a function is a great way to customize your documentation.
 
-- However, sometimes you may want to reuse the same set of tests across multiple models and share them with others in your organization.
+- However, sometimes you may want to reuse the same set of tests across multiple records (models) and share them with others in your organization.
 - In this case, you can create an external custom test provider that will allow you to load custom tests from a local folder or a Git repository.
 
 :::
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/3-integrate_custom_tests.html#create-custom-tests-folder" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/3-integrate_custom_tests.html#create-custom-tests-folder" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Create custom tests folder**
 
 Create a new folder that will contain reusable custom tests from your existing inline tests:
 
-1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/3-integrate_custom_tests.ipynb){target="_blank"}
+1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/3-integrate_custom_tests.ipynb){target="_blank"}
 2. Run the cell under the following Using external test providers section: **Create custom tests folder**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/3-integrate_custom_tests.html#save-an-inline-test" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/3-integrate_custom_tests.html#save-an-inline-test" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Save inline test**
 
 The `@vm.test` decorator also includes a convenience method that allows you to save the test to a Python file at a specified path:
 
-1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/3-integrate_custom_tests.ipynb){target="_blank"}
+1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/3-integrate_custom_tests.ipynb){target="_blank"}
 2. Run all the cells under the Using external test providers section: **Save an inline test**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/3-integrate_custom_tests.html#register-a-local-test-provider" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/3-integrate_custom_tests.html#register-a-local-test-provider" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Register local test provider**
 
 Next, let's initialize a test provider that will tell the {{< var validmind.developer >}} where to find your saved custom tests:
 
-1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/3-integrate_custom_tests.ipynb){target="_blank"}
+1. Continue with **3 — Integrate custom tests**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/3-integrate_custom_tests.ipynb){target="_blank"}
 2. Run all the cells under the Using external test providers section: **Register a local test provider**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -331,7 +331,7 @@ Custom test results
 :::
 
 ::: {.tc}
-[Learn more ...](/notebooks/EXECUTED/model_development/3-integrate_custom_tests.ipynb#add-test-results-to-documentation){.button target="_blank"}
+[Learn more ...](/notebooks/EXECUTED/development/3-integrate_custom_tests.ipynb#add-test-results-to-documentation){.button target="_blank"}
 
 :::
 
@@ -340,7 +340,7 @@ Custom test results
 :::
 
 ::: {.column width="70%" .bl .pl4 .f4}
-#### Add test results to model documentation
+#### Add test results to documentation
 
 With the custom test results logged, let's head to the model we connected to at the beginning of this notebook and insert our test results into the documentation:
 
@@ -348,7 +348,7 @@ With the custom test results logged, let's head to the model we connected to at
 
 2. In the left sidebar that appears for your model, click **Development** under {{< fa file >}} Documents.
 
-3. Locate the Data Preparation section and click on **3.2 Model Evaluation** to expand that section.
+3. Click on **3.2 Model Evaluation** to expand that section.
 
 4. Hover under the Pearson Correlation Matrix content block until a horizontal line with a **{{< fa plus >}}** button appears, indicating that you can insert a new block.
 
@@ -357,7 +357,7 @@ With the custom test results logged, let's head to the model we connected to at
     - Click on **Custom** under [test-driven]{.smallcaps} in the left sidebar.
     - Select the two custom `ConfusionMatrix` tests you logged previously:
 
-    ![The ConfusionMatrix tests selected](/notebooks/tutorials/model_development/selecting-confusion-matrix-test.png){fig-alt="Screenshot showing the ConfusionMatrix tests selected" .screenshot}
+    ![The ConfusionMatrix tests selected](/notebooks/tutorials/development/selecting-confusion-matrix-test.png){fig-alt="Screenshot showing the ConfusionMatrix tests selected" .screenshot}
 
 6. Finally, click **Insert 2 Test Results to Document** to add the test results to the documentation.
 
@@ -376,7 +376,7 @@ With the custom test results logged, let's head to the model we connected to at
 
 1. Select the name of your model you registered for this course to open up the model details page.
 2. In the left sidebar that appears for your model, click **Development** under {{< fa file >}} Documents.
-3. Locate the Data Preparation section and click on **3.2 Model Evaluation** to expand that section.
+3. Click on **3.2 Model Evaluation** to expand that section.
 4. Hover under the Pearson Correlation Matrix content block until a horizontal line with a **{{< fa plus >}}** button appears, indicating that you can insert a new block.
 5. Click **{{< fa plus >}}** and then select **Test-Driven Block** under [from library]{.smallcaps}:
     - Click on **Custom** under [test-driven]{.smallcaps} in the left sidebar.
@@ -389,12 +389,12 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 # Section 2 {background-color="#083E44" background-image="/assets/img/about-us-esphere.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/4-finalize_testing_documentation.html" background-interactive="yes" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/4-finalize_testing_documentation.html" background-interactive="yes" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **4 — Finalize testing and documentation**
 
-This is the final notebook in our introductory series, which will walk you through wrapping custom test results into your documentation, as well as how to update the configuration for the entire model documentation template to suit your needs.
+This is the final notebook in our introductory series, which will walk you through wrapping custom test results into your documentation, as well as how to update the configuration for the entire documentation template to suit your needs.
 
 **Scroll through this notebook** to explore. When you are done, click [{{< fa chevron-right >}}]() to continue.
 
@@ -402,44 +402,44 @@ This is the final notebook in our introductory series, which will walk you throu
 
 {{< include /training/common-slides/_retrieve-your-code-snippet.qmd >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/4-finalize_testing_documentation.html#initialize-the-validmind-library" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/4-finalize_testing_documentation.html#initialize-the-validmind-library" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Connect to your model**
 
 With your code snippet copied to your clipboard:
 
-1. Open **4 — Finalize testing and documentation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/4-finalize_testing_documentation.ipynb){target="_blank"}
+1. Open **4 — Finalize testing and documentation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/4-finalize_testing_documentation.ipynb){target="_blank"}
 2. Run all the cells under the **Setting up** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-# Include custom test results {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Include custom <br>test results {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/4-finalize_testing_documentation.html#reconnect-to-validmind" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/4-finalize_testing_documentation.html#reconnect-to-validmind" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Reconnect to {{< var vm.product >}}**
 
 After you insert test-driven blocks, changes should persist and become available every time you call the [`preview_template()` function](/validmind/validmind.qmd#preview_template){target="_blank"}:
 
-1. Continue with **4 — Finalize testing and documentation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/4-finalize_testing_documentation.ipynb){target="_blank"}
+1. Continue with **4 — Finalize testing and documentation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/4-finalize_testing_documentation.ipynb){target="_blank"}
 2. Run all the cells under the **Reconnect to {{< var vm.product >}}** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/4-finalize_testing_documentation.html#include-custom-test-results" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/4-finalize_testing_documentation.html#include-custom-test-results" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Log custom test results**
 
 Now that your custom test IDs are part of your template, you can now run tests for an entire section and all additional custom tests will be loaded:
 
-1. Continue with **4 — Finalize testing and documentation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/4-finalize_testing_documentation.ipynb){target="_blank"}
+1. Continue with **4 — Finalize testing and documentation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/4-finalize_testing_documentation.ipynb){target="_blank"}
 2. Run the cell under the **Include custom test results** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -453,7 +453,7 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 
 :::: {.columns}
 ::: {.column width="30%" .pr4 .f2}
-Documentation template configuration
+Configuring documentation template tests
 
 ::: {.tc}
 [Learn more ...](/validmind/validmind/vm_models.qmd#get_default_config){.button target="_blank"}
@@ -475,27 +475,27 @@ The utility function `vm.get_test_suite().get_default_config()` will return the
 :::
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/4-finalize_testing_documentation.html#documentation-template-configuration" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/4-finalize_testing_documentation.html#configuring-documentation-template-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Retrieve default configuration**
 
-1. Continue with **4 — Finalize testing and documentation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/4-finalize_testing_documentation.ipynb){target="_blank"}
-2. Run the first cell under the **Documentation template configuration** section.
+1. Continue with **4 — Finalize testing and documentation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/4-finalize_testing_documentation.ipynb){target="_blank"}
+2. Run the first two cells under the **Configuring documentation template tests** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/4-finalize_testing_documentation.html#update-the-config" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/4-finalize_testing_documentation.html#run-updated-documentation-section-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
-**Update template configuration**
+**Run updated documentation section tests**
 
 The default configuration does not assign any inputs to a test, but you can assign inputs to individual tests as needed:
 
-1. Continue with **4 — Finalize testing and documentation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/4-finalize_testing_documentation.ipynb){target="_blank"}
-2. Run the all the cells under the following Documentation template configuration section: **Update the config**
+1. Continue with **4 — Finalize testing and documentation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/4-finalize_testing_documentation.ipynb){target="_blank"}
+2. Run all the cells under the following Configuring documentation template tests section: **Run updated documentation section tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
@@ -518,15 +518,15 @@ In this third module, you learned how to:
 - [x] Implement, run, and log custom inline tests
 - [x] Register external test providers for reusable custom tests
 - [x] Include custom test results in your documentation template
-- [x] Configure your model's documentation template
+- [x] Configure your documentation template
 
 :::
 ::::
 
 ::: {.tc}
 <br>
-Continue your model development journey with:
+Continue your development journey with:
 <br><br>
 <!-- IMPORTANT: USE THE .HTML PATH AND NOT THE .QMD PATH FOR THE REVEALJS OUTPUT -->
-[Finalizing Model Documentation](finalizing-model-documentation.html){.button target="_blank"}
+[Finalizing Documentation](finalizing-documentation.html){.button target="_blank"}
 :::
\ No newline at end of file
diff --git a/site/training/developer-fundamentals/learning-to-run-tests.qmd b/site/training/developer-fundamentals/learning-to-run-tests.qmd
index 55426a2661..c720e5c9b5 100644
--- a/site/training/developer-fundamentals/learning-to-run-tests.qmd
+++ b/site/training/developer-fundamentals/learning-to-run-tests.qmd
@@ -38,7 +38,7 @@ includes:
 
 # Learning objectives {.center}
 
-_"As a **developer** who has registered a model with {{< var vm.product >}}, I want to identify relevant tests to run from {{< var vm.product >}}'s test repository, run and log tests for my model, and insert the test results into my model's documentation."_
+_"As a **developer** who has registered a record (model) with {{< var vm.product >}}, I want to identify relevant tests to run from {{< var vm.product >}}'s test repository, run and log tests, and insert the test results into my documentation."_
 
 ::: {.tc}
 <br>
@@ -51,7 +51,7 @@ This second module is part of a four-part series:
 ## Module 2 — Contents {.center}
 
 ::: {.f2}
-1. [{{< var vm.product >}} for model development](#validmind-for-model-development)
+1. [{{< var vm.product >}} for development](#validmind-for-development)
 2. [Explore ValidMind tests](#explore-validmind-tests)
 3. [Run tests with the {{< var validmind.developer >}}](#run-validmind-tests)
 4. [Log tests to the {{< var validmind.platform >}}](#log-validmind-tests)
@@ -73,7 +73,7 @@ To continue, you need to have been [onboarded](developer-fundamentals-register.q
 
 ::: {.tc}
 <!-- IMPORTANT: USE THE .HTML PATH AND NOT THE .QMD PATH FOR THE REVEALJS OUTPUT -->
-[Using {{< var vm.product >}} for Model Development](using-validmind-for-model-development.html){.button target="_blank"}
+[Using {{< var vm.product >}} for Development](using-validmind-for-development.html){.button target="_blank"}
 :::
 
 :::: {.tc .mt5 .f2 .embed}
@@ -87,7 +87,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 
 <!-- USING THE VARIABLE IN THE HEADING MESSES UP THE PAGE ANCHOR -->
 
-# ValidMind for model development {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# ValidMind for development {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 ## {.scrollable .center}
 
@@ -96,7 +96,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 Jupyter Notebook series
 
 ::: {.f3}
-When you run these notebooks, they will generate a draft of model documentation and upload it to {{< var vm.product >}}, complete with supporting test results.
+When you run these notebooks, they will generate a draft of documentation and upload it to {{< var vm.product >}}, complete with supporting test results.
 
 ::: {.f5 .nt2 .pl2 .mb4}
 <br>
@@ -107,31 +107,31 @@ You will need to have already completed **1 — Set up the {{< var validmind.dev
 :::
 
 ::: {.column width="70%" .bl .pl4 .f3}
-#### {{< var vm.product >}} for model development
+#### {{< var vm.product >}} for development
 
-Our series of four introductory notebooks for model developers include sample code and how-to information to get you started with {{< var vm.product >}}:
+Our series of four introductory notebooks for developers includes sample code and how-to information to get you started with {{< var vm.product >}}:
 
-1 — [Set up the {{< var validmind.developer >}}](/notebooks/tutorials/model_development/1-set_up_validmind.ipynb){target="_blank"}<br>
-2 — [Start the model development process](/notebooks/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}<br>
-3 — [Integrate custom tests](/notebooks/tutorials/model_development/3-integrate_custom_tests.ipynb){target="_blank"}<br>
-4 — [Finalize testing and documentation](/notebooks/tutorials/model_development/4-finalize_testing_documentation.ipynb){target="_blank"}<br>
+1 — [Set up the {{< var validmind.developer >}}](/notebooks/tutorials/development/1-set_up_validmind.ipynb){target="_blank"}<br>
+2 — [Start the development process](/notebooks/tutorials/development/2-start_development_process.ipynb){target="_blank"}<br>
+3 — [Integrate custom tests](/notebooks/tutorials/development/3-integrate_custom_tests.ipynb){target="_blank"}<br>
+4 — [Finalize testing and documentation](/notebooks/tutorials/development/4-finalize_testing_documentation.ipynb){target="_blank"}<br>
 <br>
 
 ::: {.f4 .pl3 .pr3 .embed}
-In this second module, we'll run through **2 — Start the model development process** together. 
+In this second module, we'll run through **2 — Start the development process** together.
 :::
 
 :::
 ::::
 
-Let's continue our journey with **2 — Start the model development process** on the next page. {{< fa hand-point-right >}}
+Let's continue our journey with **2 — Start the development process** on the next page. {{< fa hand-point-right >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html" background-interactive="yes" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html" background-interactive="yes" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
-**2 — Start the model development process**
+**2 — Start the development process**
 
-During this course, we'll run through these notebooks together, and at the end of your learning journey you'll have a fully documented sample model ready for review.
+During this course, we'll run through these notebooks together, and at the end of your learning journey you'll have a fully documented sample record (model) ready for review.
 
 For now, **scroll through this notebook** to explore. When you are done, click [{{< fa chevron-right >}}]() to continue.
 
@@ -145,14 +145,14 @@ For now, **scroll through this notebook** to explore. When you are done, click [
 
 {{< include /training/common-slides/_get-your-code-snippet.qmd >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#initialize-the-validmind-library" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#initialize-the-validmind-library" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Connect to your model**
 
 With your code snippet copied to your clipboard:
 
-1. Open **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
+1. Open **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
 2. Run the following cells in the Setting up section:
     - **Initialize the {{< var validmind.developer >}}**
     - **Import sample dataset**
@@ -161,29 +161,29 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#identify-qualitative-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#identify-qualitative-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Identify qualitative tests**
 
-Next, we'll use the [`list_tests()` function](/notebooks/EXECUTED/model_development/1-set_up_validmind.ipynb#explore-available-tests){target="_blank"} to pinpoint tests we want to run:
+Next, we'll use the [`list_tests()` function](/notebooks/EXECUTED/development/1-set_up_validmind.ipynb#explore-available-tests){target="_blank"} to pinpoint tests we want to run:
 
-1. Continue with **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
 2. Run all the cells under the Setting up section: **Identify qualitative tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#initialize-the-validmind-datasets" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#initialize-the-validmind-dataset" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Initialize {{< var vm.product >}} datasets**
 
 Then, we'll use the [`init_dataset()` function](/validmind/validmind.qmd#init_dataset){target="_blank"} to connect the sample data with a {{< var vm.product >}} `Dataset` object in preparation for running tests:
 
-1. Continue with **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
-2. Run the following cell in the Setting up section: **Initialize the {{< var vm.product >}} datasets**
+1. Continue with **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
+2. Run the following cell in the Setting up section: **Initialize the {{< var vm.product >}} dataset**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
@@ -193,28 +193,28 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 
 # Run ValidMind tests {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#run-tabular-data-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#run-tabular-data-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Run tabular data tests**
 
 You run individual tests by calling the [`run_test()` function](/validmind/validmind/tests.qmd#run_test){target="_blank"} provided by the `validmind.tests` module:
 
-1. Continue with **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
 2. Run all the cells under the Running tests section: **Run tabular data tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#utilize-test-output" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#utilize-test-output" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Utilize test output**
 
 You can utilize the output from a ValidMind test for further use, for example, if you want to remove highly correlated features:
 
-1. Continue with **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
 2. Run all the cells under the Running tests section: **Utilize test output**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -243,33 +243,33 @@ Document test results
 Every test result returned by the `run_test()` function has a `.log()` method that can be used to send the test results to the {{< var validmind.platform >}}:
 
 - When using `run_documentation_tests()`, documentation sections will be automatically populated with the results of all tests registered in the documentation template.
-- When logging individual test results to the platform, you'll need to manually add those results to the desired section of the model documentation.
+- When logging individual test results to the platform, you'll need to manually add those results to the desired section of the documentation.
 
 :::
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#run-and-log-multiple-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#run-and-log-multiple-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Run & log multiple tests**
 
 The [`run_documentation_tests()` function](/validmind/validmind.qmd#run_documentation_tests){target="_blank"} allows you to run multiple tests at once and automatically log the results to your documentation:
 
-1. Continue with **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
 2. Run the following cell in the Documenting results section: **Run and log multiple tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#run-and-log-an-individual-test" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#run-and-log-an-individual-test" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Run & log an individual test**
 
 Next, we'll run an individual test and log the result to the {{< var validmind.platform >}}:
 
-1. Continue with **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
 2. Run the following cell in the Running tests section: **Run and log an individual test**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -283,7 +283,7 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 Work with test results
 
 ::: {.tc}
-[Learn more ...](/notebooks/EXECUTED/model_development/2-start_development_process.ipynb#add-individual-test-results-to-model-documentation){.button target="_blank"}
+[Learn more ...](/notebooks/EXECUTED/development/2-start_development_process.ipynb#add-individual-test-results-to-documentation){.button target="_blank"}
 
 :::
 
@@ -305,9 +305,9 @@ Work with test results
 **Insert a test-driven block**
 :::
 
-1. Select the name of your record you registered for this course to open up the record details page.
-2. In the left sidebar that appears for your record, click **Development** under {{< fa file >}} Documents.
-3. Locate the Data Preparation section and click on **2.3 Correlations and Interactions** to expand that section.
+1. Select the name of your model you registered for this course to open up the model details page.
+2. In the left sidebar that appears for your model, click **Development** under {{< fa file >}} Documents.
+3. Click on **2.3 Correlations and Interactions** to expand that section.
 4. Hover under the Pearson Correlation Matrix content block until a horizontal line with a **{{< fa plus >}}** button appears, indicating that you can insert a new block.
 5. Click **{{< fa plus >}}** and then select **Test-Driven Block** under [from library]{.smallcaps}:
     - Click on **VM Library** under [test-driven]{.smallcaps} in the left sidebar.
@@ -325,7 +325,7 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 :::: {.columns}
 ::: {.column width="50%" .pr4 .f2}
-Model testing with {{< var vm.product >}}
+Testing with {{< var vm.product >}}
 
 :::
 
@@ -337,7 +337,7 @@ Try it **live** on the next pages. {{< fa hand-point-right >}}
 
 ::: {.f3}
 <br>
-So far, we’ve focused on the data assessment and pre-processing that usually occurs prior to any models being built. Now, let’s instead assume we have already built a model and we want to incorporate some model results into our documentation:
+So far, we’ve focused on the data assessment and pre-processing that usually occurs prior to any records (models) being built. Now, let’s instead assume we have already built a model and we want to incorporate some results into our documentation:
 
 ::: {.panel-tabset .f4}
 
@@ -360,57 +360,60 @@ In this next example, we’ll focus on running the tests within the Model Develo
 
 :::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#train-simple-logistic-regression-model" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#train-simple-logistic-regression-model" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Train your model**
 
 Using {{< var vm.product >}} tests, we'll train a simple logistic regression model on our dataset and evaluate its performance:
 
-1. Continue with **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
-2. Run all the cells under the Model testing section: **Train simple logistic regression model**
+1. Continue with **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
+2. Run all the cells under the Running model evaluation tests section: **Train simple logistic regression model**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#initialize-model-evaluation-objects" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#initialize-validmind-datasets" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
-**Initialize a model object**
+**Initialize ValidMind objects**
 
 Use the `init_dataset()` and [`init_model()` functions](/validmind/validmind.qmd#init_model){target="_blank"} to initialize these objects:
 
-1. Continue with **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
-2. Run the cell under the following Model testing section: **Initialize model evaluation objects**
+1. Continue with **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
+2. Run the cells under the following Running model evaluation tests sections:
+
+    - **Initialize {{< var vm.product >}} datasets**
+    - **Initialize a {{< var vm.product >}} model**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#assign-predictions" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#assign-predictions" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Assign predictions**
 
 Use the [`assign_predictions()` method](/validmind/validmind/vm_models.qmd#assign_predictions){target="_blank"} from the `Dataset` object to link existing predictions to any number of models:
 
-1. Continue with **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
-2. Run the cell under the following Model testing section: **Assign predictions**
+1. Continue with **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
+2. Run the following cell under the Running model evaluation tests section: **Assign predictions**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_development/2-start_development_process.html#run-the-model-evaluation-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/2-start_development_process.html#run-the-model-evaluation-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Run the model evaluation tests**
 
 Finally, we'll run only the tests within the Model Development section of the model documentation:
 
-1. Continue with **2 — Start the model development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}
-2. Run the cell under the following Model testing section: **Run the model evaluation tests**
+1. Continue with **2 — Start the development process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/2-start_development_process.ipynb){target="_blank"}
+2. Run the cell under the Running model evaluation tests section: **Run the model evaluation tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
@@ -433,14 +436,14 @@ In this second module, you learned how to:
 - [x] Initialize {{< var vm.product >}} `Dataset` and `Model` objects
 - [x] Run out-of-the-box tests with the {{< var validmind.developer >}}
 - [x] Log test results to the {{< var validmind.platform >}}
-- [x] Insert logged test results into your model's documentation
+- [x] Insert logged test results into your documentation
 
 :::
 ::::
 
 ::: {.tc}
 <br>
-Continue your model development journey with:
+Continue your development journey with:
 <br><br>
 <!-- IMPORTANT: USE THE .HTML PATH AND NOT THE .QMD PATH FOR THE REVEALJS OUTPUT -->
 [Implementing Custom Tests](implementing-custom-tests.html){.button target="_blank"}
diff --git a/site/training/developer-fundamentals/using-validmind-for-model-development.qmd b/site/training/developer-fundamentals/using-validmind-for-development.qmd
similarity index 64%
rename from site/training/developer-fundamentals/using-validmind-for-model-development.qmd
rename to site/training/developer-fundamentals/using-validmind-for-development.qmd
index dda1c92849..ef4bf79cca 100644
--- a/site/training/developer-fundamentals/using-validmind-for-model-development.qmd
+++ b/site/training/developer-fundamentals/using-validmind-for-development.qmd
@@ -2,7 +2,9 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Using {{< var vm.product >}} <br>for Model Development"
+title: "Using {{< var vm.product >}} <br>for Development"
+aliases:
+  - /training/developer-fundamentals/using-validmind-for-model-development.html
 subtitle: "Developer Fundamentals — Module 1 of 4<br><br>_Click [{{< fa chevron-right >}}](#learning-objectives) to start_"
 lightbox: true
 format:
@@ -26,7 +28,7 @@ format:
       - slideover
   html:
   # Change this to the file name prepended by a _ to get around the global HTML output settings required by _metadata.yml
-    output-file: _using-validmind-for-model-development.html
+    output-file: _using-validmind-for-development.html
     search: false
 title-slide-attributes:
   data-background-color: "#083E44"
@@ -38,7 +40,7 @@ includes:
 
 # Learning objectives {.center}
 
-_"As a **developer** who is new to {{< var vm.product >}}, I want to learn how to register a model in the {{< var validmind.platform >}}, install the {{< var validmind.developer >}} in my local environment, and preview my model's documentation template."_
+_"As a **developer** who is new to {{< var vm.product >}}, I want to learn how to register a record (model) in the {{< var validmind.platform >}}, install the {{< var validmind.developer >}} in my local environment, and preview my documentation template."_
 
 ::: {.tc}
 <br>
@@ -51,10 +53,10 @@ This first module is part of a four-part series:
 ## Module 1 — Contents {.center}
 
 ::: {.f2}
-1. [{{< var vm.product >}} for model development](#validmind-for-model-development)
-2. [Register a model in the {{< var validmind.platform >}}](#register-a-model)
+1. [{{< var vm.product >}} for development](#validmind-for-development)
+2. [Register a record (model) in the {{< var validmind.platform >}}](#register-a-model)
 3. [Install the {{< var validmind.developer >}}](#install-the-validmind-library)
-4. [Preview your model's documentation template](#preview-model-documentation)
+4. [Preview your documentation template](#preview-documentation-template)
 
 :::
 
@@ -83,7 +85,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 
 <!-- USING THE VARIABLE IN THE HEADING MESSES UP THE PAGE ANCHOR -->
 
-# ValidMind for model development {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# ValidMind for development {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 ## {.scrollable .center}
 
@@ -92,20 +94,20 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 Jupyter Notebook series
 
 ::: {.f3}
-When you run these notebooks, they will generate a draft of model documentation and upload it to {{< var vm.product >}}, complete with supporting test results.
+When you run these notebooks, they will generate a draft of documentation and upload it to {{< var vm.product >}}, complete with supporting test results.
 
 :::
 :::
 
 ::: {.column width="70%" .bl .pl4 .f3}
-#### {{< var vm.product >}} for model development
+#### {{< var vm.product >}} for development
 
-Our series of four introductory notebooks for model developers include sample code and how-to information to get you started with {{< var vm.product >}}:
+Our series of four introductory notebooks for developers includes sample code and how-to information to get you started with {{< var vm.product >}}:
 
-1 — [Set up the {{< var validmind.developer >}}](/notebooks/tutorials/model_development/1-set_up_validmind.ipynb){target="_blank"}<br>
-2 — [Start the model development process](/notebooks/tutorials/model_development/2-start_development_process.ipynb){target="_blank"}<br>
-3 — [Integrate custom tests](/notebooks/tutorials/model_development/3-integrate_custom_tests.ipynb){target="_blank"}<br>
-4 — [Finalize testing and documentation](/notebooks/tutorials/model_development/4-finalize_testing_documentation.ipynb){target="_blank"}<br>
+1 — [Set up the {{< var validmind.developer >}}](/notebooks/tutorials/development/1-set_up_validmind.ipynb){target="_blank"}<br>
+2 — [Start the development process](/notebooks/tutorials/development/2-start_development_process.ipynb){target="_blank"}<br>
+3 — [Integrate custom tests](/notebooks/tutorials/development/3-integrate_custom_tests.ipynb){target="_blank"}<br>
+4 — [Finalize testing and documentation](/notebooks/tutorials/development/4-finalize_testing_documentation.ipynb){target="_blank"}<br>
 <br>
 
 ::: {.f4 .pl3 .pr3 .embed}
@@ -119,13 +121,13 @@ In this first module, we'll run through **1 — Set up the {{< var validmind.dev
 
 Let's start our journey with **1 — Set up the {{< var validmind.developer >}}** on the next page. {{< fa hand-point-right >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/1-set_up_validmind.html" background-interactive="yes" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/1-set_up_validmind.html" background-interactive="yes" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 
 **1 — Set up the {{< var validmind.developer >}}**
 
-During this course, we'll run through these notebooks together, and at the end of your learning journey you'll have a fully documented sample model ready for review.
+During this course, we'll run through these notebooks together, and at the end of your learning journey you'll have a fully documented sample record (model) ready for review.
 
 For now, **scroll through this notebook** to explore. When you are done, click [{{< fa chevron-right >}}]() to continue.
 
@@ -140,9 +142,9 @@ For now, **scroll through this notebook** to explore. When you are done, click [
 
 From here, you can:
 
-- Keep track of your models in the customizable inventory ...
-- Review and edit model documentation generated via the {{< var validmind.developer >}} ...
-- Collaborate with model validators to get your model approved ...
+- Keep track of your records (models) in the customizable inventory ...
+- Review and edit documentation generated via the {{< var validmind.developer >}} ...
+- Collaborate with validators to get your records approved ...
 - ... and much more!
 
 ::: {.embed}
@@ -161,13 +163,13 @@ When you're done exploring, click [{{< fa chevron-right >}}]() to continue.
 :::: {.slideover--r}
 **Welcome to the {{< fa cubes >}} Inventory**
 
-Use the model inventory to track comprehensive details for all your models throughout the model lifecycle. The model inventory is customizable and extensible, with a layout that can be configured to suit your needs.
+Use the inventory to track comprehensive details for all your records (models) throughout their lifecycles. The inventory is customizable and extensible, with a layout that can be configured to suit your needs.
 
 ::: {.f6 .pl3 .pr3 .embed}
-To start the documentation process, a model must already be registered in the model inventory via the **Register Model** modal.
+To start the documentation process, a record must already be registered in the inventory.
 :::
 
-**Let's register a model together** on the next page. {{< fa hand-point-right >}}
+**Let's register a model-type record together** on the next page. {{< fa hand-point-right >}}
 
 ::::
 
@@ -180,49 +182,52 @@ To start the documentation process, a model must already be registered in the mo
 **Apply a documentation template**
 :::
 
-Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier.
+Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier.
 
 1. Click on the name of the model you registered earlier.
 2. In the left sidebar that appears for your model, click **{{< fa file >}} Documents** and select **Development**.
 3. Under [create document]{.smallcaps}, select `Binary classification` from the **[template]{.smallcaps}** drop-down menu.
 4. Click **Use Template** to apply the template.
 
+::: {.f2 .embed}
+If you cannot locate your Development document, make sure Development-type documents are enabled for model records and create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents){target="_blank"})
+
+:::
+
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
 <!-- USING THE VARIABLE IN THE HEADING MESSES UP THE PAGE ANCHOR -->
 
-# Install the ValidMind Library {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Install the <br>ValidMind Library {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 {{< include /training/common-slides/_get-your-code-snippet.qmd >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/1-set_up_validmind.html#install-the-validmind-library" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/1-set_up_validmind.html#setting-up" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Install & initialize the {{< var validmind.developer >}}**
 
 With your code snippet copied to your clipboard:
 
-1. Open **1 — Set up the {{< var validmind.developer >}}**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/1-set_up_validmind.ipynb){target="_blank"}
-2. Run all the cells in the sections under **Initializing the {{< var validmind.developer >}}**.
+1. Open **1 — Set up the {{< var validmind.developer >}}**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/1-set_up_validmind.ipynb){target="_blank"}
+2. Run all the cells in the sections under **Setting up**.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-<!-- USING THE VARIABLE IN THE HEADING MESSES UP THE PAGE ANCHOR -->
-
-# Preview model documentation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Preview documentation template {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/1-set_up_validmind.html#preview-the-documentation-template" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/1-set_up_validmind.html#getting-to-know-validmind" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
-**Preview the documentation template**
+**Get to know {{< var vm.product >}}**
 
-You can preview your model's documentation template right from the {{< var validmind.developer >}}:
+You can preview your model's documentation template right from the {{< var validmind.developer >}}, as well as explore available tests without leaving your development environment:
 
-1. Continue with **1 — Set up the {{< var validmind.developer >}}**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_development/1-set_up_validmind.ipynb){target="_blank"}
+1. Continue with **1 — Set up the {{< var validmind.developer >}}**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/development/1-set_up_validmind.ipynb){target="_blank"}
 2.  Run all the cells in the sections under **Getting to know ValidMind**.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -254,24 +259,24 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 :::: {.columns}
 ::: {.column width="30%" .pr4 .f2}
-Using {{< var vm.product >}} for model development
+Using {{< var vm.product >}} for development
 
 :::
 
 ::: {.column width="70%" .bl .pl4 .f3}
 In this first module, you learned how to:
 
-- [x] Register a model in the {{< var validmind.platform >}}
+- [x] Register a record (model) in the {{< var validmind.platform >}}
 - [x] Install the {{< var validmind.developer >}} in your environment
 - [x] Connect to your registered model in the {{< var validmind.platform >}}
-- [x] Preview and verify your model's documentation template
+- [x] Preview and verify your documentation template
 
 :::
 ::::
 
 ::: {.tc}
 <br>
-Continue your model development journey with:
+Continue your development journey with:
 <br><br>
 <!-- IMPORTANT: USE THE .HTML PATH AND NOT THE .QMD PATH FOR THE REVEALJS OUTPUT -->
 [Learning to Run Tests](learning-to-run-tests.html){.button target="_blank"}
diff --git a/site/training/program/learning-paths.qmd b/site/training/program/learning-paths.qmd
index cb3a24e2e8..7d469a3128 100644
--- a/site/training/program/learning-paths.qmd
+++ b/site/training/program/learning-paths.qmd
@@ -80,7 +80,7 @@ Learn how to use {{< var vm.product >}} as an **administrator** to onboard your
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-80-ns}
-Learn how to use {{< var vm.product >}} as a **developer** to generate model documentation, automate testing, and track your model's progress through the model lifecycle.
+Learn how to use {{< var vm.product >}} as a **developer** to generate documentation, automate testing, and track your record's progress throughout its entire lifecycle.
 
 :::
 
@@ -95,21 +95,21 @@ Learn how to use {{< var vm.product >}} as a **developer** to generate model doc
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-50-ns}
-#### <sup>Module 1</sup><br> Using {{< var vm.product >}} for Model Development
+#### <sup>Module 1</sup><br> Using {{< var vm.product >}} for Development
 
-- Register a model in the {{< var validmind.platform >}}
+- Register a record (model) in the {{< var validmind.platform >}}
 - Install the {{< var validmind.developer >}} in your environment
 - Connect to your registered model
-- Preview your model's documentation template
+- Preview your documentation template
 :::
 
 ::: {.w-50-ns}
 #### <sup>Module 2</sup><br> Learning to Run Tests
 
 - Identify relevant tests to run from {{< var vm.product >}}'s test vault
-- Initialize datasets & models for use with the {{< var validmind.developer >}}
-- Run and log out-of-the-box tests for new and existing models
-- Insert test results into your model's documentation
+- Initialize ValidMind objects for use with the {{< var validmind.developer >}}
+- Run and log out-of-the-box tests
+- Insert test results into your documentation
 :::
 
 ::::
@@ -120,16 +120,16 @@ Learn how to use {{< var vm.product >}} as a **developer** to generate model doc
 #### <sup>Module 3</sup><br> Implementing Custom Tests
 
 - Implement, run, and log custom inline and reusable tests
-- Refresh your template to include inserted test-driven blocks
-- Configure your template to include custom tests
+- Refresh template to include inserted test-driven blocks
+- Configure template to include custom tests
 :::
 
 ::: {.w-50-ns}
-#### <sup>Module 4</sup><br> Finalizing Model Documentation
+#### <sup>Module 4</sup><br> Finalizing Documentation
 
-- Refine your model documentation
-- Submit your model documentation for approval
-- Track changes and other updates to your model
+- Refine your documentation
+- Submit your documentation for approval
+- Track changes and other updates to your record (model)
 :::
 
 ::::
@@ -140,7 +140,7 @@ Learn how to use {{< var vm.product >}} as a **developer** to generate model doc
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-80-ns}
-Learn how to use {{< var vm.product >}} as a **validator** to generate validation reports, automate testing, and collaborate with your model development team.
+Learn how to use {{< var vm.product >}} as a **validator** to generate validation reports, automate testing, and collaborate with your development team.
 
 :::
 
@@ -155,12 +155,12 @@ Learn how to use {{< var vm.product >}} as a **validator** to generate validatio
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-50-ns}
-#### <sup>Module 1</sup><br> Using {{< var vm.product >}} for Model Validation
+#### <sup>Module 1</sup><br> Using {{< var vm.product >}} for Validation
 
 - Install the {{< var validmind.developer >}} in your environment
-- Connect to a champion model as a validator
-- Preview the model's validation report template
-- Review submitted model documentation
+- Connect to a champion record (model) as a validator
+- Preview the validation report template
+- Review submitted documentation
 
 :::
 
@@ -170,7 +170,7 @@ Learn how to use {{< var vm.product >}} as a **validator** to generate validatio
 - Identify relevant tests to run from {{< var vm.product >}}'s test vault
 - Initialize datasets for use with the {{< var validmind.developer >}}
 - Run and log out-of-the-box tests on your datasets
-- Insert test results into your model’s validation report
+- Insert test results into your validation report
 
 :::
 
@@ -179,11 +179,11 @@ Learn how to use {{< var vm.product >}} as a **validator** to generate validatio
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-50-ns}
-#### <sup>Module 3</sup><br> Developing Challenger Models
+#### <sup>Module 3</sup><br> Developing Potential Challengers
 
-- Initialize models for use with the {{< var validmind.developer >}}
-- Run and log out-of-the box and custom tests for your models
-- Use the results of tests to log model artifacts (findings)
+- Initialize records (models) for use with the {{< var validmind.developer >}}
+- Run and log out-of-the-box and custom tests
+- Use the results of tests to log artifacts (findings)
 
 :::
 
@@ -192,7 +192,7 @@ Learn how to use {{< var vm.product >}} as a **validator** to generate validatio
 
 - Make qualitative edits to your validation report
 - Submit your validation report for approval
-- Track artifact resolution and other updates to your model
+- Track artifact resolution and other updates to your record (model)
 
 :::
 
@@ -204,7 +204,7 @@ Learn how to use {{< var vm.product >}} as a **validator** to generate validatio
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-80-ns}
-Learn how to use {{< var vm.product >}} as a developer managing the **ongoing monitoring** of your models with ongoing monitoring plans, scheduled monitoring runs, and tracked metrics over time.
+Learn how to use {{< var vm.product >}} as a developer managing the **ongoing monitoring** of your records (models) with ongoing monitoring plans, scheduled monitoring runs, and tracked metrics over time.
 
 :::
 
@@ -247,8 +247,8 @@ Learn how to use {{< var vm.product >}} as a developer managing the **ongoing mo
 ::: {.w-50-ns}
 #### <sup>Module 1</sup><br> Using {{< var vm.product >}} for Ongoing Monitoring
 
-- How monitoring integrates with model documentation <!-- {{< fa x >}} -->
-- Enable monitoring for a model <!-- {{< fa check >}} -->
+- How monitoring integrates with documentation <!-- {{< fa x >}} -->
+- Enable monitoring for a record (model) <!-- {{< fa check >}} -->
 - Preview the monitoring template <!-- {{< fa check >}} -->
 :::
 
@@ -256,7 +256,7 @@ Learn how to use {{< var vm.product >}} as a developer managing the **ongoing mo
 #### <sup>Module 2</sup><br> Setting Up Monitoring
 
 - Load the reference and monitoring datasets <!-- {{< fa check >}} -->
-- Load the production model <!-- {{< fa check >}} -->
+- Load the production record (model) <!-- {{< fa check >}} -->
 - Initialize datasets and a model object <!-- {{< fa check >}} -->
 - Assign predictions to the datasets <!-- {{< fa check >}} -->
 :::
@@ -270,7 +270,7 @@ Learn how to use {{< var vm.product >}} as a developer managing the **ongoing mo
 
 - Run the ongoing monitoring tests <!-- {{< fa check >}} -->
 - Conduct target and feature drift testing <!-- {{< fa check >}} -->
-- Model performance monitoring tests <!-- {{< fa check >}} -->
+- Performance monitoring tests <!-- {{< fa check >}} -->
 - How to schedule quarterly or monthly monitoring runs <!-- {{< fa x >}} -->
 :::
 
@@ -314,7 +314,7 @@ As a solutions architect who is new to {{< var vm.product >}}, learn how to set
 #### Module 1: TBD
 
 - Notebooks that show running tests, test suites, single-function documentation
-- LaTex formulas in JSON templates
+- LaTeX formulas in JSON templates
 ::: -->
 
 
@@ -391,7 +391,7 @@ Take a guided tour of {{< var vm.product >}} and discover how the platform helps
 #### <sup>Section 6</sup><br> Risk Insights & Regulatory Alignment
 
 - Use AI-powered document checker for compliance
-- Align with regulatory frameworks like SR 11-7, SS1/23, E-23, and EU AI Act
+- Align with regulatory frameworks like SR 26-2, SS1/23, E-23, and EU AI Act
 - Generate risk assessments with recommendations
 :::
 
diff --git a/site/training/program/program-overview.qmd b/site/training/program/program-overview.qmd
index eea7b05cc4..2f4b25b7f0 100644
--- a/site/training/program/program-overview.qmd
+++ b/site/training/program/program-overview.qmd
@@ -43,7 +43,7 @@ Our training program is built on three pillars:
 - Accelerate time-to-value with structured learning paths
 - Build internal expertise across key roles
 - Maintain compliance with industry standards
-- Scale model risk management capabilities efficiently
+- Scale risk management capabilities efficiently
 
 ::: {.column-margin}
 ::: {#learning-paths}
@@ -52,10 +52,10 @@ Our training program is built on three pillars:
 
 ### Role-based expertise
 
-Our training develops competency across your entire model risk management team:
+Our training develops competency across your entire risk management team:
 
-- **Model developers** master efficient documentation and testing
-- **Model validators** learn systematic validation approaches
+- **Developers** master efficient documentation and testing
+- **Validators** learn systematic validation approaches
 - **Governance administrators** implement robust oversight processes
 
 ## Options for every organization
diff --git a/site/training/program/training-faq.qmd b/site/training/program/training-faq.qmd
index 033b2d631b..dafcbb16f3 100644
--- a/site/training/program/training-faq.qmd
+++ b/site/training/program/training-faq.qmd
@@ -10,12 +10,12 @@ Here's what we have been asked about {{< var vm.product >}} during training sess
 
 ## Answers by topic
 
-### Model inventory
+### Inventory
 
-:::: {.flex .flex-wrap .justify-around} 
+:::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-60-ns .nb3 .pr2}
-- How do I configure the model inventory?
+- How do I configure the inventory?
 :::
 
 ::: {.w-40-ns .nb3 .pl2}
@@ -27,7 +27,7 @@ Here's what we have been asked about {{< var vm.product >}} during training sess
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-60-ns .nb3 .pr2}
-- How do I add model inventory fields?
+- How do I add inventory fields?
 :::
 
 ::: {.w-40-ns .nb3 .pl2}
@@ -86,7 +86,7 @@ Here's what we have been asked about {{< var vm.product >}} during training sess
 
 ::::
 
-### Workflows for model lifecycle management
+### Workflows for lifecycle management
 
 :::: {.flex .flex-wrap .justify-around}
 
@@ -145,7 +145,7 @@ Here's what we have been asked about {{< var vm.product >}} during training sess
 :::
 
 ::: {.w-40-ns .nb3 .pl2}
-[{{< fa graduation-cap >}} training](/training/developer-fundamentals/implementing-custom-tests.html#/configure-documentation-templates){.button-small} [{{< fa book-open >}} docs](/notebooks/tutorials/model_development/4-finalize_testing_documentation.ipynb#documentation-template-configuration){.button-small}
+[{{< fa graduation-cap >}} training](/training/developer-fundamentals/implementing-custom-tests.html#/configure-documentation-templates){.button-small} [{{< fa book-open >}} docs](/notebooks/tutorials/development/4-finalize_testing_documentation.ipynb#configuring-documentation-template-tests){.button-small}
 :::
 
 ::::
@@ -162,16 +162,16 @@ Here's what we have been asked about {{< var vm.product >}} during training sess
 
 ::::
 
-### Model documentation
+### Documentation
 
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-60-ns .nb3 .pr2}
-- How do I register a model with existing template?
+- How do I register a record (model) with an existing template?
 :::
 
 ::: {.w-40-ns .nb3 .pl2}
-[{{< fa graduation-cap >}} training](/training/developer-fundamentals/using-validmind-for-model-development.html#/register-a-model){.button-small} [{{< fa book-open >}} docs](/guide/inventory/register-records-in-inventory.qmd){.button-small}
+[{{< fa graduation-cap >}} training](/training/developer-fundamentals/using-validmind-for-development.html#/register-a-model){.button-small} [{{< fa book-open >}} docs](/guide/inventory/register-records-in-inventory.qmd){.button-small}
 :::
 
 ::::
@@ -179,11 +179,11 @@ Here's what we have been asked about {{< var vm.product >}} during training sess
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-60-ns .nb3 .pr2}
-- How do I generate documentation for models?
+- How do I generate documentation for records (models)?
 :::
 
 ::: {.w-40-ns .nb3 .pl2}
-[{{< fa graduation-cap >}} training](/training/developer-fundamentals/learning-to-run-tests.html#/section-8){.button-small} [{{< fa book-open >}} docs](/notebooks/quickstart/quickstart_model_documentation.ipynb){.button-small}
+[{{< fa graduation-cap >}} training](/training/developer-fundamentals/learning-to-run-tests.html#/section-8){.button-small} [{{< fa book-open >}} docs](/notebooks/quickstart/quickstart_documentation.ipynb){.button-small}
 :::
 
 ::::
@@ -191,16 +191,16 @@ Here's what we have been asked about {{< var vm.product >}} during training sess
 :::: {.flex .flex-wrap .justify-around}
 
 ::: {.w-60-ns .nb3 .pr2}
-- How do I submit my model documentation for validation?
+- How do I submit my documentation for validation?
 :::
 
 ::: {.w-40-ns .nb3 .pl2}
-[{{< fa graduation-cap >}} training](/training/developer-fundamentals/finalizing-model-documentation.html#/submit-documentation-for-approval){.button-small} [{{< fa book-open >}} docs](/guide/documentation/submit-documents.qmd){.button-small}
+[{{< fa graduation-cap >}} training](/training/developer-fundamentals/finalizing-documentation.html#/submit-documentation-for-approval){.button-small} [{{< fa book-open >}} docs](/guide/documentation/submit-documents.qmd){.button-small}
 :::
 
 ::::
 
-### Model testing
+### Testing
 
 :::: {.flex .flex-wrap .justify-around}
 
@@ -226,7 +226,7 @@ Here's what we have been asked about {{< var vm.product >}} during training sess
 
 ::::
 
-### Model validation
+### Validation
 
 :::: {.flex .flex-wrap .justify-around}
 
diff --git a/site/training/risk-governance-fundamentals.qmd/risk-governance-fundamentals.qmd b/site/training/risk-governance-fundamentals.qmd/risk-governance-fundamentals.qmd
index 5a9603f32c..09e285d038 100644
--- a/site/training/risk-governance-fundamentals.qmd/risk-governance-fundamentals.qmd
+++ b/site/training/risk-governance-fundamentals.qmd/risk-governance-fundamentals.qmd
@@ -85,7 +85,7 @@ Get overviews for validation activities and risk exposure.
 TBD. 
 
 ::: {.tc}
-[Learn more ...](/about/overview-model-risk-management.qmd){.button target="_blank"}
+[Learn more ...](/about/use-cases/model-risk-management.qmd){.button target="_blank"}
 :::
 
 Or, find your next learning resource on [{{< var validmind.training >}}](/training/training.qmd).
diff --git a/site/training/training-templates/course-slides.qmd b/site/training/training-templates/course-slides.qmd
index 7115456efc..3fc38f03b5 100644
--- a/site/training/training-templates/course-slides.qmd
+++ b/site/training/training-templates/course-slides.qmd
@@ -157,7 +157,7 @@ Speaking of important information in callouts ... if you update the extension, *
 
 # iFrame embed bottom {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/1-set_up_validmind.html" background-interactive="yes" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/development/1-set_up_validmind.html" background-interactive="yes" data-preload="yes"}
 
 :::: {.slideover--b}
 **This is a collapsible bottom-aligned modal (`slideover--b`) on top of a rendered site file.**
@@ -195,7 +195,7 @@ The box will also automatically scroll once past a certain length (a percentage
 
 # iFrame embed top {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_development/1-set_up_validmind.html" background-interactive="yes" data-preload="yes"} 
+## {background-iframe="/notebooks/EXECUTED/development/1-set_up_validmind.html" background-interactive="yes" data-preload="yes"} 
 
 :::: {.slideover--t .auto-collapse-10}
 **This is a collapsible top-aligned modal (`slideover--t`) on top of a rendered site file.**
diff --git a/site/training/training.qmd b/site/training/training.qmd
index 6c88aa65e6..8e8e3365de 100644
--- a/site/training/training.qmd
+++ b/site/training/training.qmd
@@ -56,33 +56,51 @@ listing:
     table-hover: true
     image-align: left
     contents:
-    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/quickstart/quickstart_model_documentation.ipynb
-      title: "Quickstart for model documentation"
+    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/quickstart/quickstart_documentation.ipynb
+      title: "Quickstart for documentation"
       subtitle: "Open notebook in JupyterHub {{< fa chevron-right >}}"
-      description: "Gets you started with the basic process of documenting models with {{< var vm.product >}}, from the {{< var vm.developer >}} to the {{< var vm.platform >}}."
+      description: "Gets you started with the basic process of documenting records such as models with {{< var vm.product >}}, from the {{< var vm.developer >}} to the {{< var vm.platform >}}."
       categories: ["[Demo] Customer Churn Model"]
       reading-time: "20"
+    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/quickstart/quickstart_validation.ipynb
+      title: "Quickstart for validation"
+      subtitle: "Open notebook in JupyterHub {{< fa chevron-right >}}"
+      description: "Gets you started with the basic process of validating records such as models with {{< var vm.product >}}, from the {{< var vm.developer >}} to the {{< var vm.platform >}}."
+      categories: ["[Demo] Customer Churn Model"]
+      reading-time: "45"
       author: "{{< var vm.product >}}"
-    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/tutorials/model_development/101-set_up_validmind.ipynb
-      title: "{{< var vm.product >}} for model development (4-part series)"
+    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/tutorials/development/1-set_up_validmind.ipynb
+      title: "{{< var vm.product >}} for development (4-part series)"
       subtitle: "Open series in JupyterHub {{< fa chevron-right >}}"
-      description: "Learn how the end-to-end documentation process works based on common scenarios you encounter in model development settings."
+      description: "Learn how the end-to-end documentation process works based on common scenarios you encounter in development settings."
       categories: ["[Demo] Customer Churn Model"]
       reading-time: "60"
+    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/tutorials/validation/1-set_up_validmind_for_validation.ipynb
+      title: "{{< var vm.product >}} for validation (4-part series)"
+      subtitle: "Open series in JupyterHub {{< fa chevron-right >}}"
+      description: "Learn how the end-to-end challenge process works based on common scenarios you encounter in validation settings."
+      categories: ["[Demo] Customer Churn Model"]
+      reading-time: "120"
       author: "{{< var vm.product >}}"
-    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/code_samples/credit_risk/application_scorecard_demo.ipynb
-      title: "Document an application scorecard model"
+    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/use_cases/credit_risk/document_excel_application_scorecard_demo.ipynb
+      title: "Document an Excel-based application scorecard model"
+      subtitle: "Open notebook in JupyterHub {{< fa chevron-right >}}"
+      description: "Guides you through building and documenting an application scorecard model built with Excel using the Lending Club sample dataset from Kaggle."
+      categories: ["[Demo] Credit Risk Model"]
+      reading-time: "60"
+    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/use_cases/validation/validate_application_scorecard_demo.ipynb
+      title: "Validate an application scorecard model"
       subtitle: "Open notebook in JupyterHub {{< fa chevron-right >}}"
-      description: "Guides you through building and documenting an application scorecard model using the Lending Club sample dataset from Kaggle."
+      description: "Guides you through validating an application scorecard model using the Lending Club sample dataset from Kaggle."
       categories: ["[Demo] Credit Risk Model"]
-      reading-time: "30"
+      reading-time: "120"
       author: "{{< var vm.product >}}"
-    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/code_samples/nlp_and_llm/foundation_models_integration_demo.ipynb
-      title: "Prompt validation for large language models (LLMs)"
+    - path: https://jupyterhub.validmind.ai/hub/user-redirect/lab/tree/agents/document_agentic_ai.ipynb
+      title: "Document an agentic AI system"
       subtitle: "Open notebook in JupyterHub {{< fa chevron-right >}}"
-      description: "Run and document prompt validation tests for a large language model (LLM) specialized in sentiment analysis for financial news."
-      categories: ["[Demo] Foundation Model - Text Sentiment Analysis"]
-      reading-time: "15"
+      description: "Guides you through building and documenting an agentic AI system with the ValidMind Library."
+      categories: ["[Demo] LangGraph-based Banking Agent"]
+      reading-time: "90"
       author: "{{< var vm.product >}}"
 ---
 
@@ -156,15 +174,15 @@ Gain **practical experience** and discover what the platform has to offer with o
 ::: {.attn}
 ## ![](/favicon.svg){height=30px} Learn by doing
 
-Our training environment mimics a production environment and includes comprehensive resources such as notebooks with sample code you can run, sample models registered in the model inventory, and draft documentation and validation reports.
+Our training environment mimics a production environment and includes comprehensive resources such as notebooks with sample code you can run, sample records (models) registered in the inventory, and draft documentation and validation reports.
 
-Most of our model documentation features are available for you to test in the training environment, including automated model testing and documentation, preparing model validation reports, and large language model (LLM) support. 
+Most of our documentation features are available for you to test in the training environment, including automated testing and documentation, preparing validation reports, and large language model (LLM) support.
 
-These features provide a rich context for testing and evaluation, using models and datasets provided by {{< var vm.product >}} and hosted in our own environment. 
+These features provide a rich context for testing and evaluation, using records and datasets provided by {{< var vm.product >}} and hosted in our own environment.
 
-### Sample models
+### Sample records
 
-Sample models registered in the model inventory include:
+Sample model-type records registered in the inventory include:
 
 - Housing prices prediction model
 - Credit risk scorecard model
@@ -172,11 +190,11 @@ Sample models registered in the model inventory include:
 - Interest rate time series forecasting model
 - Large language model (LLM) demo application
 
-Please note that we make updates to the models and datasets available in the training environment from time to time to provide you with our latest features. 
+Please note that we make updates to the models and datasets available in the training environment from time to time to provide you with our latest features.
 
-### Sample notebooks 
+### Sample notebooks
 
-Each interactive notebook includes the sample code needed to test and document a model provided in the {{< var validmind.platform >}}: 
+Each interactive notebook includes the sample code needed to test and document a model provided in the {{< var validmind.platform >}}:
 
 :::{#sample-notebooks}
 :::
diff --git a/site/training/validator-fundamentals/developing-challenger-models.qmd b/site/training/validator-fundamentals/developing-potential-challengers.qmd
similarity index 64%
rename from site/training/validator-fundamentals/developing-challenger-models.qmd
rename to site/training/validator-fundamentals/developing-potential-challengers.qmd
index 8ffa13ebbb..7625b6b481 100644
--- a/site/training/validator-fundamentals/developing-challenger-models.qmd
+++ b/site/training/validator-fundamentals/developing-potential-challengers.qmd
@@ -2,8 +2,10 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Developing <br>Challenger Models"
+title: "Developing <br>Potential Challengers"
 subtitle: "Validator Fundamentals — Module 3 of 4<br><br>_Click [{{< fa chevron-right >}}](#learning-objectives) to start_"
+aliases:
+  - /training/validator-fundamentals/developing-challenger-models.html
 lightbox: true
 format:
   revealjs:
@@ -26,7 +28,7 @@ format:
       - slideover
   html:
   # Change this to the file name prepended by a _ to get around the global HTML output settings required by _metadata.yml
-    output-file: _developing-challenger-models.html
+    output-file: _developing-potential-challengers.html
     search: false
 title-slide-attributes:
   data-background-color: "#083E44"
@@ -36,7 +38,7 @@ skip_preview: true
 
 # Learning objectives {.center}
 
-_"As a **validator** who has already run and logged data quality tests with {{< var vm.product >}}, I want to next run both out-of-the-box and custom model evaluation tests for the champion model and a potential challenger model, and use the results of my testing to log model artifacts (findings)."_
+_"As a **validator** who has already run and logged data quality tests with {{< var vm.product >}}, I want to next run both out-of-the-box and custom evaluation tests for the champion and a potential challenger, and use the results of my testing to log artifacts (findings)."_
 
 ::: {.tc}
 <br>
@@ -51,7 +53,7 @@ This third module is part of a four-part series:
 :::: {.columns .f3}
 ::: {.column width="50%" .mt4 .pr4}
 ### Introduction
-- [{{< var vm.product >}} for model validation](#validmind-for-model-validation)
+- [{{< var vm.product >}} for validation](#validmind-for-validation)
 :::
 
 :::
@@ -95,7 +97,7 @@ To continue, you need to have been [onboarded](validator-fundamentals-register.q
 :::: {.columns}
 ::: {.column width="60%"}
 ::: {.tc}
-[Using {{< var vm.product >}} for Model Validation](using-validmind-for-model-validation.html){.button target="_blank"}
+[Using {{< var vm.product >}} for Validation](using-validmind-for-validation.html){.button target="_blank"}
 :::
 
 :::
@@ -118,7 +120,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 
 <!-- USING THE VARIABLE IN THE HEADING MESSES UP THE PAGE ANCHOR -->
 
-# ValidMind for model validation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# ValidMind for validation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 ## {.scrollable .center}
 
@@ -127,7 +129,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 Jupyter Notebook series
 
 ::: {.f3}
-These notebooks walk you through how to validate a model using {{< var vm.product >}}, complete with supporting test results attached as evidence to your validation report.
+These notebooks walk you through how to validate a record (model) using {{< var vm.product >}}, complete with supporting test results attached as evidence to your validation report.
 
 ::: {.f5 .nt2 .pl2 .mb4}
 <br>
@@ -140,14 +142,14 @@ You will need to have already completed notebooks **1** and **2** during the fir
 :::
 
 ::: {.column width="70%" .bl .pl4 .f3}
-#### {{< var vm.product >}} for model validation
+#### {{< var vm.product >}} for validation
 
-Our series of four introductory notebooks for model validators include sample code and how-to information to get you started with {{< var vm.product >}}:
+Our series of four introductory notebooks for validators includes sample code and how-to information to get you started with {{< var vm.product >}}:
 
-1 — [Set up the {{< var validmind.developer >}} for validation](/notebooks/tutorials/model_validation/1-set_up_validmind_for_validation.ipynb){target="_blank"}<br>
-2 — [Start the model validation process](/notebooks/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}<br>
-3 — [Developing a potential challenger model](/notebooks/tutorials/model_validation/3-developing_challenger_model.ipynb){target="_blank"}<br>
-4 — [Finalize testing and reporting](/notebooks/tutorials/model_validation/4-finalize_validation_reporting.ipynb){target="_blank"}<br>
+1 — [Set up the {{< var validmind.developer >}} for validation](/notebooks/tutorials/validation/1-set_up_validmind_for_validation.ipynb){target="_blank"}<br>
+2 — [Start the validation process](/notebooks/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}<br>
+3 — [Developing a potential challenger](/notebooks/tutorials/validation/3-developing_potential_challenger.ipynb){target="_blank"}<br>
+4 — [Finalize testing and reporting](/notebooks/tutorials/validation/4-finalize_validation_reporting.ipynb){target="_blank"}<br>
 <br>
 
 ::: {.f4 .pl3 .pr3 .embed}
@@ -161,12 +163,12 @@ Let's continue our journey with **Section 1** on the next page. {{< fa hand-poin
 
 # Section 1 {background-color="#083E44" background-image="/assets/img/about-us-esphere.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/3-developing_challenger_model.html" background-interactive="yes" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/3-developing_potential_challenger.html" background-interactive="yes" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
-**3 — Developing a potential challenger model**
+**3 — Developing a potential challenger**
 
-This is the third notebook in our introductory series, which will walk you through how to evaluate your champion model against a potential challenger with {{< var vm.product >}}.
+This is the third notebook in our introductory series, which will walk you through how to evaluate your champion against a potential challenger with {{< var vm.product >}}.
 
 **Scroll through this notebook** to explore. When you are done, click [{{< fa chevron-right >}}]() to continue.
 
@@ -174,41 +176,41 @@ This is the third notebook in our introductory series, which will walk you throu
 
 {{< include /training/common-slides/_get-your-code-snippet.qmd >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/3-developing_challenger_model.html#initialize-the-validmind-library" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/3-developing_potential_challenger.html#initialize-the-validmind-library" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Connect to your model**
 
 With your code snippet copied to your clipboard:
 
-1. Open **3 — Developing a potential challenger model**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/3-developing_challenger_model.ipynb){target="_blank"}
+1. Open **3 — Developing a potential challenger**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/3-developing_potential_challenger.ipynb){target="_blank"}
 2. Run all the cells under the **Setting up** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/3-developing_challenger_model.html#import-the-champion-model" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/3-developing_potential_challenger.html#import-the-champion-model" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Import the champion model**
 
 Next, let's import the champion model submitted by the model development team in the format of a `.pkl` file for evaluation:
 
-1. Continue with **3 — Developing a potential challenger model**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/3-developing_challenger_model.ipynb){target="_blank"}
+1. Continue with **3 — Developing a potential challenger**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/3-developing_potential_challenger.ipynb){target="_blank"}
 2. Run the cell under the **Import the champion model** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-# Train a challenger model {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Train a <br>challenger model {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 ## {.scrollable .center}
 
 :::: {.columns}
 ::: {.column width="60%" .pr4 .f2}
-Champion vs. challenger models
+Champion vs. challengers
 
 :::
 
@@ -221,7 +223,7 @@ Try it **live** on the next pages. {{< fa hand-point-right >}}
 
 ::: {.f4}
 
-We're curious how an alternate model compares to our champion model, so let's train a challenger model as a basis for our testing:
+We're curious how an alternate record (model) compares to our champion, so let's train a challenger as a basis for our testing:
 
 ::: {.panel-tabset}
 
@@ -240,35 +242,35 @@ We're curious how an alternate model compares to our champion model, so let's tr
 
 :::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/3-developing_challenger_model.html#training-a-potential-challenger-model" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/3-developing_potential_challenger.html#training-a-potential-challenger-model" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Random forest classification model**
 
 Let's train our potential challenger model:
 
-1. Continue with **3 — Developing a potential challenger model**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/3-developing_challenger_model.ipynb){target="_blank"}
+1. Continue with **3 — Developing a potential challenger**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/3-developing_potential_challenger.ipynb){target="_blank"}
 2. Run the cell under the following Training a potential challenger model section: **Random forest classification model**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/3-developing_challenger_model.html#initializing-the-model-objects" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/3-developing_potential_challenger.html#initialize-the-validmind-models" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
-**Initialize the model objects**
+**Initialize the ValidMind models**
 
 In addition to the initialized datasets, you'll also need to initialize a ValidMind model object (`vm_model`) that can be passed to other functions for analysis and tests on the data for each of our two models using [the `vm.init_model()` method](/validmind/validmind.qmd#init_model){target="_blank"}:
 
-1. Continue with **3 — Developing a potential challenger model**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/3-developing_challenger_model.ipynb){target="_blank"}
-2. Run all the cells under the section **Initializing the model objects**.
+1. Continue with **3 — Developing a potential challenger**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/3-developing_potential_challenger.ipynb){target="_blank"}
+2. Run all the cells under the section **Initialize the ValidMind models**.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-# Run model evaluation tests {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Run model <br>evaluation tests {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 ## {.scrollable .center}
 
@@ -287,7 +289,7 @@ Try it **live** on the next pages. {{< fa hand-point-right >}}
 
 ::: {.f4}
 
-With everything ready for us, let's run the rest of our validation tests. We'll focus on comprehensive testing around model performance of both the champion and challenger models going forward as we've already verified the data quality of the datasets used to train the champion model:
+With everything ready for us, let's run the rest of our validation tests. We'll focus on comprehensive testing around the performance of both the champion and the challenger going forward, as we've already verified the data quality of the datasets used to train the champion:
 
 ::: {.panel-tabset}
 
@@ -308,14 +310,14 @@ Finally, we want to verify the relative influence of different input features on
 
 :::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/3-developing_challenger_model.html#run-model-performance-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/3-developing_potential_challenger.html#run-model-performance-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Run model performance tests**
 
 Use the [`list_tests()` function](/validmind/validmind/tests.qmd#list_tests){target="_blank"} to identify all the model performance tests for classification:
 
-1. Continue with **3 — Developing a potential challenger model**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/3-developing_challenger_model.ipynb){target="_blank"}
+1. Continue with **3 — Developing a potential challenger**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/3-developing_potential_challenger.ipynb){target="_blank"}
 2. Run all the cells under the Running model evaluation tests section: **Run model performance tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -333,7 +335,7 @@ Log an artifact (finding)
 :::
 
 ::: {.tc}
-[Learn more ...](/notebooks/EXECUTED/model_validation/3-developing_challenger_model.html#log-an-artifact){.button target="_blank"}
+[Learn more ...](/guide/validation/assess-compliance.qmd#link-artifacts-to-reports){.button target="_blank"}
 
 :::
 
@@ -361,39 +363,40 @@ As we can observe from the output in our notebook, our champion model doesn't pa
 
 1. Select the name of your model you registered for this course to open up the model details page.
 2. In the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
-3. Locate the Data Preparation section and click on **2.2.2. Model Performance** to expand that section.
-4. Under the Model Performance Metrics section, locate Artifacts then click **Link Artifact to Report** and select **Validation Issue**.
-5. Click **{{< fa plus >}} Add Validation Issue** to add a validation issue type artifact.
-6. Enter in the details for your validation issue and click **Save**.
-7. Select the validation issue you just added to link to your validation report.
-8. Click **Update Linked Artifacts** to insert your validation issue.
+3. Click on **2.2.2. Model Performance** to expand that section.
+4. Under the Model Performance Metrics guideline, click to expand the **Artifacts** panel.
+5. Click **{{< fa link >}} Link Artifact** and select **Validation Issue** as the type of artifact.
+6. Click **{{< fa plus >}} Add Validation Issue** and enter the details for your validation issue.
+7. Click **Add Validation Issue** to submit the validation issue.
+8. Select the validation issue you just added to link to your validation report.
+9. Click **Update Linked Artifacts** to insert your validation issue.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/3-developing_challenger_model.html#run-diagnostic-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/3-developing_potential_challenger.html#run-diagnostic-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Run diagnostic tests**
 
 This time, use `list_tests()` to identify all the model diagnosis tests for classification:
 
-1. Continue with **3 — Developing a potential challenger model**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/3-developing_challenger_model.ipynb){target="_blank"}
+1. Continue with **3 — Developing a potential challenger**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/3-developing_potential_challenger.ipynb){target="_blank"}
 2. Run all the cells under the Running model evaluation tests section: **Run diagnostic tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/3-developing_challenger_model.html#run-feature-importance-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/3-developing_potential_challenger.html#run-feature-importance-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Run feature importance tests**
 
 Use `list_tests()` again to identify all the feature importance tests for classification:
 
-1. Continue with **3 — Developing a potential challenger model**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/3-developing_challenger_model.ipynb){target="_blank"}
+1. Continue with **3 — Developing a potential challenger**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/3-developing_potential_challenger.ipynb){target="_blank"}
 2. Run all the cells under the Running model evaluation tests section: **Run feature importance tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -402,7 +405,7 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 
 # Section 2 {background-color="#083E44" background-image="/assets/img/about-us-esphere.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/4-finalize_validation_reporting.html" background-interactive="yes" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/4-finalize_validation_reporting.html" background-interactive="yes" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **4 — Finalize testing and reporting**
@@ -415,14 +418,14 @@ This is the final notebook in our introductory series, which will walk you throu
 
 {{< include /training/common-slides/_retrieve-your-code-snippet.qmd >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/4-finalize_validation_reporting.html#initialize-the-validmind-library" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/4-finalize_validation_reporting.html#initialize-the-validmind-library" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Connect to your model**
 
 With your code snippet copied to your clipboard:
 
-1. Open **4 — Finalize testing and validation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/4-finalize_validation_reporting.ipynb){target="_blank"}
+1. Open **4 — Finalize testing and reporting**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/4-finalize_validation_reporting.ipynb){target="_blank"}
 2. Run all the cells under the **Setting up** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -445,33 +448,33 @@ Custom tests
 Let's implement a *custom test* that calculates a confusion matrix:
 
 - You'll note that the custom test function is just a regular Python function that can include and require any Python library as you see fit.
-- In a usual model validation situation, you would load a saved custom test provided by the model development team. In the following section, we'll have you implement the same custom test and make it available for reuse, to familiarize you with the processes.
+- In a usual validation situation, you would load a saved custom test provided by the development team. In the following section, we'll have you implement the same custom test and make it available for reuse, to familiarize you with the processes.
 
 :::
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/4-finalize_validation_reporting.html#implement-a-custom-inline-test" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/4-finalize_validation_reporting.html#implement-a-custom-inline-test" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Implement a custom inline test**
 
 An *inline test* refers to a test written and executed within the same environment as the code being tested — in the following example, right in our Jupyter Notebook —  without requiring a separate test file or framework:
 
-1. Continue with **4 — Finalize testing and validation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/4-finalize_validation_reporting.ipynb){target="_blank"}
+1. Continue with **4 — Finalize testing and reporting**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/4-finalize_validation_reporting.ipynb){target="_blank"}
 2. Run all the cells in the following sections under Implementing custom tests: **Implement a custom inline test**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/4-finalize_validation_reporting.html#use-external-test-providers" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/4-finalize_validation_reporting.html#use-external-test-providers" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Use external test providers**
 
 Sometimes you may want to reuse the same set of custom tests across multiple models and share them with others in your organization, like the model development team would have done with you in this example workflow featured in this series of notebooks:
 
-1. Continue with **4 — Finalize testing and validation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/4-finalize_validation_reporting.ipynb){target="_blank"}
+1. Continue with **4 — Finalize testing and reporting**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/4-finalize_validation_reporting.ipynb){target="_blank"}
 2. Run all the cells in the following sections under Implementing custom tests: **Use external test providers**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -480,14 +483,14 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 
 # Verify test runs {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/4-finalize_validation_reporting.html#verify-test-runs" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/4-finalize_validation_reporting.html#verify-test-runs" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Verify model development testing**
 
 Our final task is to verify that all the tests provided by the model development team were run and reported accurately:
 
-1. Continue with **4 — Finalize testing and validation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/4-finalize_validation_reporting.ipynb){target="_blank"}
+1. Continue with **4 — Finalize testing and reporting**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/4-finalize_validation_reporting.ipynb){target="_blank"}
 2. Run all the cells under the **Verify test runs** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -500,7 +503,7 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 
 :::: {.columns}
 ::: {.column width="30%" .pr4 .f2}
-Developing challenger models
+Developing potential challengers
 
 :::
 
@@ -511,14 +514,14 @@ In this third module, you learned how to:
 - [x] Log an artifact within your validation report
 - [x] Implement, run, and log custom inline tests
 - [x] Register external test providers for reusable custom tests
-- [x] Verify testing done by model development using {{< var vm.product >}}
+- [x] Verify testing done by development using {{< var vm.product >}}
 
 :::
 ::::
 
 ::: {.tc}
 <br>
-Continue your model development journey with:
+Continue your validation journey with:
 <br><br>
 <!-- IMPORTANT: USE THE .HTML PATH AND NOT THE .QMD PATH FOR THE REVEALJS OUTPUT -->
 [Finalizing Validation Reports](finalizing-validation-reports.html){.button target="_blank"}
diff --git a/site/training/validator-fundamentals/finalizing-validation-reports.qmd b/site/training/validator-fundamentals/finalizing-validation-reports.qmd
index 76b9ff22f9..83efc88156 100644
--- a/site/training/validator-fundamentals/finalizing-validation-reports.qmd
+++ b/site/training/validator-fundamentals/finalizing-validation-reports.qmd
@@ -36,7 +36,7 @@ skip_preview: true
 
 # Learning objectives {.center}
 
-_"As a **validator** who has logged validation tests with the {{< var validmind.developer >}} to the {{< var validmind.platform >}}, I want to refine my model's validation report, submit my validation report for approval, and track artifact (finding) resolution and other updates to my model."_
+_"As a **validator** who has logged validation tests with the {{< var validmind.developer >}} to the {{< var validmind.platform >}}, I want to refine my validation report, submit my validation report for approval, and track artifact (finding) resolution and other updates."_
 
 ::: {.tc}
 <br>
@@ -64,7 +64,7 @@ This final module is part of a four-part series:
 ### Section 2
 
 - [Collaborate with others](#collaborate-with-others)
-- [Track record activity](#track-record-activity)
+- [Track activity](#track-activity)
 - [View analytics](#view-analytics)
 
 :::
@@ -88,7 +88,7 @@ To continue, you need to have been [onboarded](validator-fundamentals-register.q
 :::: {.columns}
 ::: {.column width="30%"}
 ::: {.tc}
-[Module 1](using-validmind-for-model-validation.html){.button target="_blank"}
+[Module 1](using-validmind-for-validation.html){.button target="_blank"}
 :::
 
 :::
@@ -101,7 +101,7 @@ To continue, you need to have been [onboarded](validator-fundamentals-register.q
 
 ::: {.column width="30%"}
 ::: {.tc}
-[Module 3](developing-challenger-models.html){.button target="_blank"}
+[Module 3](developing-potential-challengers.html){.button target="_blank"}
 :::
 
 :::
@@ -171,7 +171,7 @@ For example:
 
 3. Edit the description for our individually inserted `ClassImbalance:raw_dataset_preprocessed` test:
 
-  ![Editor for a test result description](/notebooks/tutorials/model_validation/class-imbalance-results-detail.png){fig-alt="Screenshot showing the editor for a test result description" .screenshot}
+  ![Editor for a test result description](/notebooks/tutorials/validation/class-imbalance-results-detail.png){fig-alt="Screenshot showing the editor for a test result description" .screenshot}
 
 :::
 
@@ -185,8 +185,8 @@ For example:
 **Add & edit content blocks**
 :::
 
-1. Select the name of your record you registered for this course to open up the record details page.
-2. On the left sidebar that appears for your record, click **Validation** under {{< fa file >}} Documents.
+1. Select the name of your model you registered for this course to open up the model details page.
+2. On the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
 3. Click on **1. Executive Summary** to add and edit a content block.
 4. Click on **2.2.1. Data Quality** to edit the description for the linked Class Imbalance Assessment test results.
 
@@ -198,43 +198,38 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 :::: {.columns}
 ::: {.column width="30%" .pr4 .f2}
-Assess model compliance
-
-::: {.f5 .nt2 .pl2 .mb4}
-(Scroll down for the full instructions.)
-:::
+Automatically map & assess evidence
 
 ::: {.tc}
-[Learn more ...](/guide/validation/assess-compliance.qmd#provide-compliance-assessments){.button target="_blank"}
-
+[Learn more ...](/guide/validation/map-and-assess-evidence.qmd){.button target="_blank"}
 :::
 
-<br>Try it **live** on the next page. {{< fa hand-point-right >}}
 :::
 
-::: {.column width="70%" .bl .pl4 .f4}
-
-::: {.panel-tabset}
+::: {.column width="70%" .bl .pl4 .f3}
 
-### Add risk assessment notes
+{{< include /guide/validation/_how-does-mapping-assessment-work.qmd >}}
 
-1. From the **{{< fa cubes >}} Inventory** in the {{< var validmind.platform >}}, go to the model you connected to earlier.
-
-2. In the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
+:::
+::::
 
-3. Click on **2.2.1. Data Quality** to expand that section and locate the Class Imbalance Assessment sub-section.
+## {.scrollable}
 
-4. Click under **Risk Assessment Notes** to edit the content block using the content editing toolbar.
+:::: {.columns}
+::: {.column width="30%" .pr4 .f2}
+Automatically map evidence
 
-    For example, use **{{< fa diamond >}} <sup>[beta]{.smallcaps}</sup> (Generate Text with AI)** to create a draft summarizing the contents of the Class Imbalance Assessment sub-section.
+::: {.f5 .nt2 .pl2 .mb4}
+(Scroll down for the full instructions.)
+:::
 
-      ![Sample compliance assessment](class-imbalance-assessment.png){width=90% fig-alt="A screenshot showing a sample compliance assessment" .screenshot}
 
-### Provide compliance assessments
+<br>Try it **live** on the next page. {{< fa hand-point-right >}}
+:::
 
-{{< include /guide/validation/_provide-compliance-assessments.qmd >}}
+::: {.column width="70%" .bl .pl4 .f4}
 
-:::
+{{< include /guide/validation/_map-evidence-to-guidelines.qmd >}}
 
 :::
 ::::
@@ -243,27 +238,30 @@ Assess model compliance
 
 :::: {.slideover--b .auto-collapse-10}
 ::: {.tc}
-**Add your compliance assessments**
+**Map evidence to a guideline**
+:::
+
+:::: {.mt2 .f2 .embed}
+Please note that test results and content blocks must be present on your model's associated default Development document for Developer Evidence to be automatically mapped to your validation report.
+
 :::
 
 1. Select the name of your model you registered for this course to open up the model details page.
 2. On the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
-3. Click on **2.2.1. Data Quality** to assess compliance for the Class Imbalance Assessment sub-section.
+3. Click on **2.2.2. Model Performance** to expand that section.
+4. Under the Model Performance Metrics guideline, locate Evidence then click **{{< fa wand-magic-sparkles >}} Map Evidence**.
+5. Configure the mapping options, then click **Map Evidence** to run the AI mapping.
+6. Review and approve the mapped evidence.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 :::
 
-{{< include /training/common-slides/_document-checker.qmd >}}
-
-<br>
-Learn how to **use the {{< var vm.checker >}} to review validation reports** on the next page. {{< fa hand-point-right >}}
-
 ## {.scrollable}
 
 :::: {.columns}
 ::: {.column width="30%" .pr4 .f2}
-Use the {{< var vm.checker >}}
+Automatically assess evidence
 
 ::: {.f5 .nt2 .pl2 .mb4}
 (Scroll down for the full instructions.)
@@ -275,29 +273,33 @@ Use the {{< var vm.checker >}}
 
 ::: {.column width="70%" .bl .pl4 .f4}
 
-{{< include /guide/documentation/_check-documents.qmd >}}
+{{< include /guide/validation/_assess-evidence-for-compliance.qmd >}}
 
 :::
-
 ::::
 
 ## {background-iframe="https://app.prod.validmind.ai/model-inventory" background-interactive="true" data-preload="yes"}
 
 :::: {.slideover--b .auto-collapse-10}
 ::: {.tc}
-**Check your validation report**
+**Assess mapped evidence for compliance**
+:::
+
+:::: {.mt2 .f2 .embed}
+Please note that evidence must already be mapped to be assessed automatically on your validation report.
+
 :::
 
 1. Select the name of your model you registered for this course to open up the model details page.
 2. On the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
-3. Locate {{< fa file-circle-check >}} Check Document on the right and click to expand the menu, then click **{{< fa check >}} Check Document**.
-4. Select a **[regulation]{.smallcaps}** and an associated **[assessment]{.smallcaps}** from the drop-down menus to to check your report against.
-5. Scroll to the bottom and click **Check Validation Document**.
-6. After the {{< var vm.checker >}} has completed its analysis, expand individual questions or click **Expand All** to look through the observations.
+3. Click on **2.2.2. Model Performance** to expand that section.
+4. Under the Model Performance Metrics guideline, click **{{< fa wand-magic-sparkles >}} Assess Evidence** under the Evidence Assessment panel.
+5. Review and approve the evidence assessment.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
-::::
+:::
+
 
 # Manage artifacts {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
@@ -324,25 +326,58 @@ Try it **live** on the next pages. {{< fa hand-point-right >}}
 
 ::: {.column width="70%" .bl .pl4 .f4}
 
-Along with adding artifacts directly via validation reports, you can also add artifacts during your review of model documentation:
+1. In the left sidebar, click **{{< fa cubes >}} Inventory**.
+
+2. Select a record or [find your record by applying a filter or searching for it](/guide/inventory/working-with-the-inventory.qmd#search-filter-and-sort-records){target="_blank"}.
+
+3. Add additional artifacts from your validation report, or during your review of documentation:
+
+::: {.panel-tabset}
+
+### Autogenerate validation issues on reports
+
+{{< include /guide/validation/_autogenerate-validation-issues.qmd >}}
+
+### Add artifacts on documentation
+
+Along with adding artifacts via validation reports, you can also add artifacts during your review of documentation:
 
 {{< include /guide/validation/_add-artifacts-on-documentation.qmd >}}
 
+:::
+
 :::
 ::::
 
 ## {background-iframe="https://app.prod.validmind.ai/model-inventory" background-interactive="true" data-preload="yes"}
 
+:::: {.slideover--b .auto-collapse-10}
+::: {.tc}
+**Autogenerate validation issues**
+
+:::
+
+1. Select the name of your model you registered for this course to open up the model details page.
+2. On the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
+3. Click on **2.2.2. Model Performance** to expand that section.
+4. Under the Model Performance Metrics guideline, locate Artifacts then click **{{< fa wand-magic-sparkles >}} Suggest Validation Issues**.
+5. Approve or reject any suggested validation issues.
+
+When you're done, click [{{< fa chevron-right >}}]() to continue.
+
+:::
+
+## {background-iframe="https://app.prod.validmind.ai/model-inventory" background-interactive="true" data-preload="yes"}
+
 :::: {.slideover--b .auto-collapse-10}
 ::: {.tc}
 **Add an artifact on documentation**
 
-<!-- **Add an artifact via overview** -->
 :::
 
 1. Select the name of your model you registered for this course to open up the model details page.
 2. On the left sidebar that appears for your model, click **Development** under {{< fa file >}} Documents.
-3. Click **{{< fa plus >}} Add Model Artifact** to add an artifact from the overview.
+3. Click **{{< fa plus >}} Add Artifact** to add an artifact from the overview.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
@@ -429,7 +464,98 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 :::
 
-# Submit report for approval {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Submit report <br>for approval {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+
+## {.scrollable}
+
+:::: {.columns}
+::: {.column width="30%" .pr4 .f2}
+Assigning compliance assessments
+
+::: {.f5 .nt2 .pl2 .mb4}
+(Scroll down for the full instructions.)
+:::
+
+::: {.tc}
+[Learn more ...](/guide/validation/assess-compliance.qmd#assign-compliance-assessments){.button target="_blank"}
+
+:::
+
+:::: {.pa3 .mt3 .f5 .embed}
+**Assessment options available for selection depend on configuration for individual validation report templates.**
+
+Your organization can customize these options to match its own assessment framework, or choose to remove them from templates entirely.
+
+:::
+
+Try it **live** on the next page. {{< fa hand-point-right >}}
+:::
+
+::: {.column width="70%" .bl .pl4 .f4}
+{{< include /guide/validation/_assign-compliance-assessments.qmd >}}
+
+:::
+::::
+
+## {background-iframe="https://app.prod.validmind.ai/model-inventory" background-interactive="true" data-preload="yes"}
+
+:::: {.slideover--b .auto-collapse-10}
+::: {.tc}
+**Assign your compliance assessments**
+:::
+
+1. Select the name of your model you registered for this course to open up the model details page.
+2. On the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
+3. Click on **2.2.2. Model Performance** to assign the compliance assessment for the Model Performance Metrics guideline.
+
+When you're done, click [{{< fa chevron-right >}}]() to continue.
+
+:::
+
+{{< include /training/common-slides/_document-checker.qmd >}}
+
+<br>
+Learn how to **use the {{< var vm.checker >}} to review validation reports** on the next page. {{< fa hand-point-right >}}
+
+## {.scrollable}
+
+:::: {.columns}
+::: {.column width="30%" .pr4 .f2}
+Use the {{< var vm.checker >}}
+
+::: {.f5 .nt2 .pl2 .mb4}
+(Scroll down for the full instructions.)
+:::
+
+
+<br>Try it **live** on the next page. {{< fa hand-point-right >}}
+:::
+
+::: {.column width="70%" .bl .pl4 .f4}
+
+{{< include /guide/documentation/_check-documents.qmd >}}
+
+:::
+
+::::
+
+## {background-iframe="https://app.prod.validmind.ai/model-inventory" background-interactive="true" data-preload="yes"}
+
+:::: {.slideover--b .auto-collapse-10}
+::: {.tc}
+**Check your validation report**
+:::
+
+1. Select the name of your model you registered for this course to open up the model details page.
+2. On the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
+3. Locate {{< fa file-circle-check >}} Check Document on the right and click to expand the menu, then click **{{< fa check >}} Check Document**.
+4. Select a **[regulation]{.smallcaps}** and an associated **[assessment]{.smallcaps}** from the drop-down menus to check your report against.
+5. Scroll to the bottom and click **Check Validation Document**.
+6. After the {{< var vm.checker >}} has completed its analysis, expand individual questions or click **Expand All** to look through the observations.
+
+When you're done, click [{{< fa chevron-right >}}]() to continue.
+
+::::
 
 {{< include /training/common-slides/_work-with-workflows.qmd >}}
 
@@ -458,7 +584,7 @@ Comment threads
 
 {{< include /guide/documentation/_comment-activity.qmd >}}
 
-Have a question about the model? Collaborate with your developer right in the model documentation:
+Have a question about the record? Collaborate with your developer right in the documentation:
 
 ::: {.panel-tabset}
 
@@ -477,8 +603,8 @@ Have a question about the model? Collaborate with your developer right in the mo
 **Comment on a text block**
 :::
 
-1. Select the name of your record you registered for this course to open up the record details page.
-2. On the left sidebar that appears for your record, click **Validation** under {{< fa file >}} Documents.
+1. Select the name of your model you registered for this course to open up the model details page.
+2. On the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
 3. **In the content block you added earlier**: Post a comment, reply to it, and then resolve the thread.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
@@ -486,7 +612,7 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 ::::
 
 
-# Track record activity {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Track activity {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 {{< include /training/common-slides/_track-changes-updates.qmd >}}
 
@@ -494,17 +620,17 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 # View analytics {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
-## {background-iframe="https://app.prod.validmind.ai/analytics" background-interactive="true" data-preload="yes"}
+## {background-iframe="https://app.prod.validmind.ai" background-interactive="true" data-preload="yes"}
 
-:::: {.slideover--l .three-quarters .auto-collapse-10}
+:::: {.slideover--r .three-quarters .auto-collapse-10}
 **Welcome to {{< fa square-poll-vertical >}} Analytics**
 
-Here, you can find executive summaries, track information on models, artifacts, and more.
+Under analytics, you can find executive summaries, track information on records (models), artifacts, and more.
 
 For example:
 
-1. Click **Validation Issues** to review reports on validation issues.
-3. Click into any widget to review the validation issues reported by that widget.
+1. Select **Validation Issues** to review reports on validation issues.
+2. Click into any widget to review the validation issues reported by that widget.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
@@ -530,10 +656,10 @@ Finalizing validation reports
 In this final module, you learned how to:
 
 - [x] Add or edit content blocks in your validation report
-- [x] Assess the compliance of a model within your validation report
+- [x] Assess the compliance of a record (model) within your validation report
 - [x] Manage artifacts via multiple methods
 - [x] Submit your validation report for approval
-- [x] Collaborate with other stakeholders on your model
+- [x] Collaborate with other stakeholders
 - [x] Track updates on your model
 - [x] Navigate the analytics dashboard
 :::
@@ -541,10 +667,11 @@ In this final module, you learned how to:
 
 ::: {.f3}
 <br>
-There is more that {{< var vm.product >}} can do to help you validate models, from using your own template to code samples you can adapt for your own use case:
+There is more that {{< var vm.product >}} can do to help you validate records, from using your own template to code samples you can adapt for your own use case:
+<br><br>
 :::
 
 ::: {.tc}
-[All model validation guides](/guide/guides.qmd#validation){.button target="_blank"}
+[All validation guides](/guide/guides.qmd#validation){.button target="_blank"}
 
 :::
\ No newline at end of file
diff --git a/site/training/validator-fundamentals/running-data-quality-tests.qmd b/site/training/validator-fundamentals/running-data-quality-tests.qmd
index 7db2c28985..1108595116 100644
--- a/site/training/validator-fundamentals/running-data-quality-tests.qmd
+++ b/site/training/validator-fundamentals/running-data-quality-tests.qmd
@@ -36,7 +36,7 @@ skip_preview: true
 
 # Learning objectives {.center}
 
-_"As a **validator** who has connected to a champion model via the {{< var validmind.developer >}}, I want to identify relevant tests to run from {{< var vm.product >}}'s test repository, run and log data quality tests, and insert the test results into my model's validation report."_
+_"As a **validator** who has connected to a champion via the {{< var validmind.developer >}}, I want to identify relevant tests to run from {{< var vm.product >}}'s test repository, run and log data quality tests, and insert the test results into my validation report."_
 
 ::: {.tc}
 <br>
@@ -49,7 +49,7 @@ This second module is part of a four-part series:
 ## Module 2 — Contents {.center}
 
 ::: {.f2}
-1. [{{< var vm.product >}} for model validation](#validmind-for-model-validation)
+1. [{{< var vm.product >}} for validation](#validmind-for-validation)
 2. [Explore ValidMind tests](#explore-validmind-tests)
 3. [Run tests with the {{< var validmind.developer >}}](#run-validmind-tests)
 4. [Log tests to the {{< var validmind.platform >}}](#log-validmind-tests)
@@ -71,7 +71,7 @@ To continue, you need to have been [onboarded](validator-fundamentals-register.q
 
 ::: {.tc}
 <!-- IMPORTANT: USE THE .HTML PATH AND NOT THE .QMD PATH FOR THE REVEALJS OUTPUT -->
-[Using {{< var vm.product >}} for Model Validation](using-validmind-for-model-validation.html){.button target="_blank"}
+[Using {{< var vm.product >}} for Validation](using-validmind-for-validation.html){.button target="_blank"}
 :::
 
 :::: {.tc .mt5 .f2 .embed}
@@ -85,7 +85,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 
 <!-- USING THE VARIABLE IN THE HEADING MESSES UP THE PAGE ANCHOR -->
 
-# ValidMind for model validation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# ValidMind for validation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 ## {.scrollable .center}
 
@@ -94,7 +94,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 Jupyter Notebook series
 
 ::: {.f3}
-These notebooks walk you through how to validate a model using {{< var vm.product >}}, complete with supporting test results attached as evidence to your validation report.
+These notebooks walk you through how to validate a record (model) using {{< var vm.product >}}, complete with supporting test results attached as evidence to your validation report.
 
 ::: {.f5 .nt2 .pl2 .mb4}
 <br>
@@ -105,30 +105,30 @@ You will need to have already completed **1 — Set up the {{< var validmind.dev
 :::
 
 ::: {.column width="70%" .bl .pl4 .f3}
-#### {{< var vm.product >}} for model validation
+#### {{< var vm.product >}} for validation
 
-Our series of four introductory notebooks for model validators include sample code and how-to information to get you started with {{< var vm.product >}}:
+Our series of four introductory notebooks for validators includes sample code and how-to information to get you started with {{< var vm.product >}}:
 
-1 — [Set up the {{< var validmind.developer >}} for validation](/notebooks/tutorials/model_validation/1-set_up_validmind_for_validation.ipynb){target="_blank"}<br>
-2 — [Start the model validation process](/notebooks/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}<br>
-3 — [Developing a potential challenger model](/notebooks/tutorials/model_validation/3-developing_challenger_model.ipynb){target="_blank"}<br>
-4 — [Finalize testing and reporting](/notebooks/tutorials/model_validation/4-finalize_validation_reporting.ipynb){target="_blank"}<br>
+1 — [Set up the {{< var validmind.developer >}} for validation](/notebooks/tutorials/validation/1-set_up_validmind_for_validation.ipynb){target="_blank"}<br>
+2 — [Start the validation process](/notebooks/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}<br>
+3 — [Developing a potential challenger](/notebooks/tutorials/validation/3-developing_potential_challenger.ipynb){target="_blank"}<br>
+4 — [Finalize testing and reporting](/notebooks/tutorials/validation/4-finalize_validation_reporting.ipynb){target="_blank"}<br>
 <br>
 
 ::: {.f4 .pl3 .pr3 .embed}
-In this second module, we'll run through **2 — Start the model validation process** together.
+In this second module, we'll run through **2 — Start the validation process** together.
 :::
 
 :::
 
 ::::
 
-Let's continue our journey with **2 — Start the model validation process** on the next page. {{< fa hand-point-right >}}
+Let's continue our journey with **2 — Start the validation process** on the next page. {{< fa hand-point-right >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/2-start_validation_process.html" background-interactive="yes" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/2-start_validation_process.html" background-interactive="yes" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
-**2 — Start the model validation process**
+**2 — Start the validation process**
 
 During this course, we'll run through these notebooks together, and at the end of your learning journey you'll have a fully supported sample validation report ready for review.
 
@@ -144,56 +144,56 @@ For now, **scroll through this notebook** to explore. When you are done, click [
 
 {{< include /training/common-slides/_get-your-code-snippet.qmd >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/2-start_validation_process.html#initialize-the-validmind-library" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/2-start_validation_process.html#initialize-the-validmind-library" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Connect to your model**
 
 With your code snippet copied to your clipboard:
 
-1. Open **2 — Start the model validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}
+1. Open **2 — Start the validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}
 2. Run the cell under the **Setting up** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/2-start_validation_process.html#load-the-sample-dataset" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/2-start_validation_process.html#load-the-sample-dataset" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Load the sample dataset**
 
-After you've successfully initialized the {{< var validmind.developer >}}, let's import the sample dataset that was used to develop the dummy champion model:
+After you've successfully initialized the {{< var validmind.developer >}}, let's import the sample dataset that was used to develop the dummy champion:
 
-1. Continue with **2 — Start the model validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}
 2. Run the cell under the **Load the sample dataset** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/2-start_validation_process.html#identify-qualitative-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/2-start_validation_process.html#identify-qualitative-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Identify qualitative tests**
 
-Next, we'll use the [`list_tests()` function](/notebooks/EXECUTED/model_validation/1-set_up_validmind_for_validation.ipynb#explore-available-tests){target="_blank"} to pinpoint tests we want to run:
+Next, we'll use the [`list_tests()` function](/notebooks/EXECUTED/validation/1-set_up_validmind_for_validation.ipynb#explore-available-tests){target="_blank"} to pinpoint tests we want to run:
 
-1. Continue with **2 — Start the model validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}
 2. Run all the cells under the Verifying data quality adjustments section: **Identify qualitative tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/2-start_validation_process.html#initialize-the-validmind-datasets" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/2-start_validation_process.html#initialize-the-validmind-dataset" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Initialize {{< var vm.product >}} datasets**
 
 Then, we'll use the [`init_dataset()` function](/validmind/validmind.qmd#init_dataset){target="_blank"} to connect the sample data with a {{< var vm.product >}} `Dataset` object in preparation for running tests:
 
-1. Continue with **2 — Start the model validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}
-2. Run the following cell in the  Verifying data quality adjustments section: **Initialize the {{< var vm.product >}} datasets**
+1. Continue with **2 — Start the validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}
+2. Run the following cell in the Verifying data quality adjustments section: **Initialize the {{< var vm.product >}} dataset**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
@@ -204,28 +204,28 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 
 # Run ValidMind tests {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/2-start_validation_process.html#run-data-quality-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/2-start_validation_process.html#run-data-quality-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Run data quality tests**
 
 You run individual tests by calling the [`run_test()` function](/validmind/validmind/tests.qmd#run_test){target="_blank"} provided by the `validmind.tests` module:
 
-1. Continue with **2 — Start the model validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}
 2. Run all the cells under the Verifying data quality adjustments section: **Run data quality tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/2-start_validation_process.html#remove-highly-correlated-features" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/2-start_validation_process.html#remove-highly-correlated-features" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Remove highly correlated features**
 
 You can utilize the output from a ValidMind test for further use, for example, if you want to remove highly correlated features:
 
-1. Continue with **2 — Start the model validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}
 2. Run all the cells under the Verifying data quality adjustments section: **Remove highly correlated features**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -260,28 +260,28 @@ Every test result returned by the `run_test()` function has a `.log()` method th
 :::
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/2-start_validation_process.html#configure-and-run-comparison-tests" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/2-start_validation_process.html#configure-and-run-comparison-tests" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Configure and run comparison tests**
 
-You can leverage the {{< var validmind.developer >}} to easily run comparison tests, between both datasets and models. Here, we compare the original raw dataset and the final preprocessed dataset, then log the results to the {{< var validmind.platform >}}:
+You can leverage the {{< var validmind.developer >}} to easily run comparison tests, between both datasets and records (models). Here, we compare the original raw dataset and the final preprocessed dataset, then log the results to the {{< var validmind.platform >}}:
 
-1. Continue with **2 — Start the model validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}
 2. Run all the cells under the Documenting test results section: **Configure and run comparison tests**
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/2-start_validation_process.html#log-tests-with-unique-identifiers" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/2-start_validation_process.html#log-tests-with-unique-identifiers" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Log tests with unique identifiers**
 
 When running individual tests, you can use a custom `result_id` to tag the individual result with a unique identifier:
 
-1. Continue with **2 — Start the model validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}
+1. Continue with **2 — Start the validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}
 2. Run the cell under the following Documenting test results section:  **Log tests with unique identifiers**.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -295,7 +295,7 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 Add test results to reporting
 
 ::: {.tc}
-[Learn more ...](/notebooks/EXECUTED/model_validation/2-start_validation_process.ipynb#add-test-results-to-reporting){.button target="_blank"}
+[Learn more ...](/guide/validation/assess-compliance.qmd#map-evidence){.button target="_blank"}
 
 :::
 
@@ -305,7 +305,40 @@ Add test results to reporting
 ::: {.column width="70%" .bl .pl4 .f4}
 #### Link validator evidence
 
-{{< include /guide/validation/_link-validator-evidence.qmd >}}
+With some test results logged, let's head to the record we connected to at the beginning of this notebook and insert our test results into the validation report as evidence.
+
+While the example below focuses on a specific test result, you can follow the same general procedure for your other results:
+
+::: {.panel-tabset}
+
+### 1. Link data quality test results
+a. From the **{{< fa cubes >}} Inventory** in the {{< var validmind.platform >}}, go to the record you connected to earlier.
+
+b. In the left sidebar that appears for your record, click **Validation** under {{< fa file >}} Documents.
+
+c. Click **2.2.1. Data Quality** to expand that section.
+
+d. Under the Class Imbalance Assessment guideline, click **Evidence** to expand the evidence panel.
+
+e. Click **{{< fa link >}} Link Evidence**, then select **Validator Evidence**.
+
+f. Select the Class Imbalance test results we logged: **ValidMind Data Validation Class Imbalance**
+
+    ![The ClassImbalance tests selected](/notebooks/tutorials/validation/selecting-class-imbalance-results.png){fig-alt="Screenshot showing the ClassImbalance tests selected" .screenshot}
+
+g. Click **Update Linked Evidence** to add the test results to the validation report.
+
+h. Confirm that the Class Imbalance test results have been correctly inserted into the right section under **2.2.1. Data Quality** of the report.
+
+### 2. Review Class Imbalance test results
+
+- Once linked as evidence to section **2.2.1. Data Quality**, note that the ValidMind Data Validation Class Imbalance test results are flagged as **Requires Attention** — as they include comparative results from our initial raw dataset.
+- Click **See evidence details** to review the LLM-generated description that summarizes the test results and confirms that our final preprocessed dataset actually passes our test:
+
+  ![ClassImbalance test generated description in the text editor](/notebooks/tutorials/validation/class-imbalance-results-detail.png){fig-alt="Screenshot showing the ClassImbalance test generated description in the text editor" .screenshot}
+
+:::
+
 
 :::
 
@@ -320,10 +353,11 @@ Add test results to reporting
 
 1. Select the name of your model you registered for this course to open up the model details page.
 2. In the left sidebar that appears for your model, click **Validation** under {{< fa file >}} Documents.
-3. Locate the Data Preparation section and click on **2.2.1. Data Quality** to expand that section.
-4. Under the Class Imbalance Assessment section, locate Validator Evidence then click **Link Evidence to Report**.
-5. Select the Class Imbalance test results we logged: **ValidMind Data Validation Class Imbalance**
-6. Click **Update Linked Evidence** to add the test results to the validation report.
+3. Click **2.2.1. Data Quality** to expand that section.
+4. Under the Class Imbalance Assessment guideline, click **Evidence** to expand the evidence panel.
+5. Click **{{< fa link >}} Link Evidence**, then select **Validator Evidence**.
+6. Select the Class Imbalance test results we logged: **ValidMind Data Validation Class Imbalance**
+7. Click **Update Linked Evidence** to add the test results to the validation report.
 
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
@@ -331,15 +365,15 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 # Prepare datasets for model evaluation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/2-start_validation_process.html#split-the-preprocessed-dataset" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/2-start_validation_process.html#preparing-the-preprocessed-dataset" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
-**Split the preprocessed dataset**
+**Preparing the preprocessed dataset**
 
 So far, we've rebalanced our raw dataset and used the results of {{< var vm.product >}} tests to additionally remove highly correlated features from our dataset. Next, let's now spilt our dataset into train and test in preparation for model evaluation testing:
 
-1. Continue with **2 — Start the model validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}
-2. Run all the cells under the **Split the preprocessed dataset** section.
+1. Continue with **2 — Start the validation process**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}
+2. Run all the cells under the **Preparing the preprocessed dataset** section.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
 
@@ -361,15 +395,15 @@ In this second module, you learned how to:
 - [x] Initialize {{< var vm.product >}} `Dataset` objects
 - [x] Run out-of-the-box tests with the {{< var validmind.developer >}}
 - [x] Log test results to the {{< var validmind.platform >}}
-- [x] Attach logged test results onto your model's validation report
+- [x] Attach logged test results onto your validation report
 
 :::
 ::::
 
 ::: {.tc}
 <br>
-Continue your model development journey with:
+Continue your model validation journey with:
 <br><br>
 <!-- IMPORTANT: USE THE .HTML PATH AND NOT THE .QMD PATH FOR THE REVEALJS OUTPUT -->
-[Developing Challenger Models](developing-challenger-models.html){.button target="_blank"}
+[Developing Potential Challengers](developing-potential-challengers.html){.button target="_blank"}
 :::
\ No newline at end of file
diff --git a/site/training/validator-fundamentals/using-validmind-for-model-validation.qmd b/site/training/validator-fundamentals/using-validmind-for-validation.qmd
similarity index 66%
rename from site/training/validator-fundamentals/using-validmind-for-model-validation.qmd
rename to site/training/validator-fundamentals/using-validmind-for-validation.qmd
index 778d9310ea..5606c4bf65 100644
--- a/site/training/validator-fundamentals/using-validmind-for-model-validation.qmd
+++ b/site/training/validator-fundamentals/using-validmind-for-validation.qmd
@@ -2,7 +2,9 @@
 # Copyright © 2023-2026 ValidMind Inc. All rights reserved.
 # Refer to the LICENSE file in the root of this repository for details.
 # SPDX-License-Identifier: AGPL-3.0 AND ValidMind Commercial
-title: "Using {{< var vm.product >}} <br>for Model Validation"
+title: "Using {{< var vm.product >}} <br>for Validation"
+aliases:
+  - /training/validator-fundamentals/using-validmind-for-model-validation.html
 subtitle: "Validator Fundamentals — Module 1 of 4<br><br>_Click [{{< fa chevron-right >}}](#learning-objectives) to start_"
 lightbox: true
 format:
@@ -26,7 +28,7 @@ format:
       - slideover
   html:
   # Change this to the file name prepended by a _ to get around the global HTML output settings required by _metadata.yml
-    output-file: _using-validmind-for-model-validation.html
+    output-file: _using-validmind-for-validation.html
     search: false
 title-slide-attributes:
   data-background-color: "#083E44"
@@ -36,7 +38,7 @@ skip_preview: true
 
 # Learning objectives {.center}
 
-_"As a **validator** who is new to {{< var vm.product >}}, I want to learn how to connect to a champion model in the {{< var validmind.platform >}} using the {{< var validmind.developer >}} installed in my local environment, preview the model's validation report template, and review submitted documentation for the model."_
+_"As a **validator** who is new to {{< var vm.product >}}, I want to learn how to connect to a champion record (model) in the {{< var validmind.platform >}} using the {{< var validmind.developer >}} installed in my local environment, preview my validation report template, and review submitted documentation."_
 
 ::: {.tc}
 <br>
@@ -49,11 +51,11 @@ This first module is part of a four-part series:
 ## Module 1 — Contents {.center}
 
 ::: {.f2}
-1. [{{< var vm.product >}} for model validation](#validmind-for-model-validation)
+1. [{{< var vm.product >}} for validation](#validmind-for-validation)
 2. [The {{< var validmind.platform >}}](#the-validmind-platform)
-3. [Connect to your champion model](#connect-to-a-model)
-4. [Preview your model's validation report template](#preview-validation-report)
-5. [Review submitted model documentation](#review-model-documentation)
+3. [Connect to your champion](#connect-to-a-model)
+4. [Preview your validation report template](#preview-validation-report)
+5. [Review submitted documentation](#review-documentation)
 
 :::
 
@@ -83,7 +85,7 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 
 <!-- USING THE VARIABLE IN THE HEADING MESSES UP THE PAGE ANCHOR -->
 
-# ValidMind for model validation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# ValidMind for validation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 ## {.scrollable .center}
 
@@ -92,20 +94,20 @@ Already logged in and refreshed this module? Click [{{< fa chevron-right >}}]()
 Jupyter Notebook series
 
 ::: {.f3}
-These notebooks walk you through how to validate a model using {{< var vm.product >}}, complete with supporting test results attached as evidence to your validation report.
+These notebooks walk you through how to validate a record (model) using {{< var vm.product >}}, complete with supporting test results attached as evidence to your validation report.
 
 :::
 :::
 
 ::: {.column width="70%" .bl .pl4 .f3}
-#### {{< var vm.product >}} for model validation
+#### {{< var vm.product >}} for validation
 
-Our series of four introductory notebooks for model validators include sample code and how-to information to get you started with {{< var vm.product >}}:
+Our series of four introductory notebooks for validators includes sample code and how-to information to get you started with {{< var vm.product >}}:
 
-1 — [Set up the {{< var validmind.developer >}} for validation](/notebooks/tutorials/model_validation/1-set_up_validmind_for_validation.ipynb){target="_blank"}<br>
-2 — [Start the model validation process](/notebooks/tutorials/model_validation/2-start_validation_process.ipynb){target="_blank"}<br>
-3 — [Developing a potential challenger model](/notebooks/tutorials/model_validation/3-developing_challenger_model.ipynb){target="_blank"}<br>
-4 — [Finalize testing and reporting](/notebooks/tutorials/model_validation/4-finalize_validation_reporting.ipynb){target="_blank"}<br>
+1 — [Set up the {{< var validmind.developer >}} for validation](/notebooks/tutorials/validation/1-set_up_validmind_for_validation.ipynb){target="_blank"}<br>
+2 — [Start the validation process](/notebooks/tutorials/validation/2-start_validation_process.ipynb){target="_blank"}<br>
+3 — [Developing a potential challenger](/notebooks/tutorials/validation/3-developing_potential_challenger.ipynb){target="_blank"}<br>
+4 — [Finalize testing and reporting](/notebooks/tutorials/validation/4-finalize_validation_reporting.ipynb){target="_blank"}<br>
 <br>
 
 ::: {.f4 .pl3 .pr3 .embed}
@@ -119,7 +121,7 @@ In this first module, we'll run through **1 — Set up the {{< var validmind.dev
 
 Let's start our journey with **1 — Set up the {{< var validmind.developer >}} for validation** on the next page. {{< fa hand-point-right >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/1-set_up_validmind_for_validation.html" background-interactive="yes" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/1-set_up_validmind_for_validation.html" background-interactive="yes" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **1 — Set up the {{< var validmind.developer >}} for validation**
@@ -141,10 +143,10 @@ For now, **scroll through this notebook** to explore. When you are done, click [
 
 From here, you can:
 
-- Keep track of your models in the customizable inventory ...
-- Review model documentation submitted by model developers ...
-- Assess the compliance of models by logging artifacts (findings) and test results as evidence on validation reports ...
-- View analytics on your models and artifacts, and create custom reports ...
+- Keep track of your records (models) in the customizable inventory ...
+- Review documentation submitted by developers ...
+- Assess the compliance of records by logging artifacts (findings) and test results as evidence on validation reports ...
+- View analytics on your records and artifacts, and create custom reports ...
 - ... and much more!
 
 ::: {.embed}
@@ -162,15 +164,15 @@ When you're done exploring, click [{{< fa chevron-right >}}]() to continue.
 :::: {.slideover--r}
 **Welcome to the {{< fa cubes >}} Inventory**
 
-Use the model inventory to track comprehensive details for all your models throughout the model lifecycle. The model inventory is customizable and extensible, with a layout that can be configured to suit your needs.
+Use the inventory to track comprehensive details for all your records (models) throughout their lifecycles. The inventory is customizable and extensible, with a layout that can be configured to suit your needs.
 
 ::: {.embed}
-Typically, you will be asked to validate a champion model that has already been independently registered in the model inventory.
+Typically, you will be asked to validate a champion record that has already been independently registered in the inventory.
 
-For this training course, you'll register a dummy model via the **{{< fa plus >}} Register Model** modal and assign yourself as the validator to familiarize you with the {{< var validmind.platform >}} interface.
+For this training course, you'll register a dummy record and assign yourself as the validator to familiarize yourself with the {{< var validmind.platform >}} interface.
 :::
 
-**Let's register a model together** for use with validation on the next page. {{< fa hand-point-right >}}
+**Let's register a model-type record together** for use with validation on the next page. {{< fa hand-point-right >}}
 
 ::::
 
@@ -184,10 +186,10 @@ For this training course, you'll register a dummy model via the **{{< fa plus >}
 
 :::
 
-In order to log tests as a validator instead of as a developer, we'll need to adjust your **model stakeholder** permissions:
+In order to log tests as a validator instead of as a developer, we'll need to adjust your **inventory record stakeholder** permissions:
 
 1. Select the name of your model you registered for this course to open up the model details page.
-2. Remove yourself as a model owner by clicking on the **[owners]{.smallcaps}** tile, then clicking on the **x** next to your name. Click **Save** to apply your changes to that role.
+2. Remove yourself as an owner by clicking on the **[owners]{.smallcaps}** tile, then clicking on the **x** next to your name. Click **Save** to apply your changes to that role.
 3. Remove yourself as a developer by clicking on the **[developers]{.smallcaps}** tile, then clicking on the **x** next to your name. Click **Save** to apply your changes to that role.
 4. Add yourself as a validator by clicking on the **[validators]{.smallcaps}** tile, and selecting your name from the drop-down menu. Click **Save** to apply your changes to that role.
 
@@ -202,7 +204,7 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 **Apply a documentation template**
 :::
 
-Once you've registered your model, let's select a documentation template. A template predefines sections for your model documentation and provides a general outline to follow, making the documentation process much easier for developers.
+Once you've registered your model, let's select a documentation template. A template predefines sections for your documentation and provides a general outline to follow, making the documentation process much easier for developers.
 
 We'll need this documentation template later for reference as we draft our validation report:
 
@@ -211,6 +213,11 @@ We'll need this documentation template later for reference as we draft our valid
 3. Under [create document]{.smallcaps}, select `Binary classification` from the **[template]{.smallcaps}** drop-down menu.
 4. Click **Use Template** to apply the template.
 
+::: {.f2 .embed}
+If you cannot locate your Development document, make sure Development-type documents are enabled for model records, then create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents){target="_blank"})
+
+:::
+
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 ::::
@@ -229,6 +236,11 @@ Next, let's select a validation report template. A template predefines sections
 3. Under [create document]{.smallcaps}, select `Generic Validation Report` from the **[template]{.smallcaps}** drop-down menu.
 4. Click **Use Template** to apply the template.
 
+::: {.f2 .embed}
+If you cannot locate your Validation document, make sure Validation-type documents are enabled for model records, then create a new document. (**Learn more:** [Manage documents](https://docs.validmind.ai/guide/templates/manage-documents.html#add-record-documents){target="_blank"})
+
+:::
+
 When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 ::::
@@ -237,14 +249,14 @@ When you're done, click [{{< fa chevron-right >}}]() to continue.
 
 {{< include /training/common-slides/_get-your-code-snippet.qmd >}}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/1-set_up_validmind_for_validation.html#install-the-validmind-library" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/1-set_up_validmind_for_validation.html#install-the-validmind-library" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
 **Install & initialize the {{< var validmind.developer >}}**
 
 With your code snippet copied to your clipboard:
 
-1. Open **1 — Set up the {{< var validmind.developer >}} for validation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/1-set_up_validmind_for_validation.ipynb){target="_blank"}
+1. Open **1 — Set up the {{< var validmind.developer >}} for validation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/1-set_up_validmind_for_validation.ipynb){target="_blank"}
 2. Run all the cells under the Setting up sections:
     - **Install the {{< var validmind.developer >}}**
     - **Initialize the {{< var validmind.developer >}}**
@@ -255,14 +267,14 @@ When you're done, return to this page and click [{{< fa chevron-right >}}]() to
 
 # Preview validation report {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
-## {background-iframe="/notebooks/EXECUTED/model_validation/1-set_up_validmind_for_validation.html#preview-the-validation-report-template" data-preload="yes"}
+## {background-iframe="/notebooks/EXECUTED/validation/1-set_up_validmind_for_validation.html#preview-the-validation-report-template" data-preload="yes"}
 
 :::: {.slideover--r .three-quarters}
-**Preview the validation report template**
+**Get to know {{< var vm.product >}}**
 
-You can preview your model's validation report template right from the {{< var validmind.developer >}}:
+You can preview your validation report template right from the {{< var validmind.developer >}}, as well as explore available tests without leaving your validation environment:
 
-1. Continue with **1 — Set up the {{< var validmind.developer >}} for validation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/model_validation/1-set_up_validmind_for_validation.ipynb){target="_blank"}
+1. Continue with **1 — Set up the {{< var validmind.developer >}} for validation**: [{{< fa square-arrow-up-right >}} JupyterHub]({{< var url.jupyterhub >}}/hub/user-redirect/lab/tree/tutorials/validation/1-set_up_validmind_for_validation.ipynb){target="_blank"}
 2.  Run all the cells in the sections under **Getting to know ValidMind**.
 
 When you're done, return to this page and click [{{< fa chevron-right >}}]() to continue.
@@ -286,7 +298,7 @@ When you're done exploring, click [{{< fa chevron-right >}}]() to continue.
 
 ::::
 
-# Review model documentation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
+# Review documentation {background-color="#083E44" background-image="/training/assets/home-hero.svg"}
 
 {{< include /training/common-slides/_document-overview.qmd >}}
 
@@ -295,7 +307,7 @@ When you're done exploring, click [{{< fa chevron-right >}}]() to continue.
 :::: {.slideover--r .auto-collapse-10}
 **Explore sample documentation**
 
-Typically, a champion model is submitted to you for validation with completed documentation.
+Typically, a champion is submitted to you for validation with completed documentation.
 
 Here, review the empty sample documentation for the record you registered earlier to familiarize you with what the structure of documentation could look like when presented to you for review:
 
@@ -317,7 +329,7 @@ When you're done exploring, click [{{< fa chevron-right >}}]() to continue.
 
 :::: {.columns}
 ::: {.column width="30%" .pr4 .f2}
-Using {{< var vm.product >}} for model validation
+Using {{< var vm.product >}} for validation
 
 :::
 
@@ -325,16 +337,16 @@ Using {{< var vm.product >}} for model validation
 In this first module, you learned how to:
 
 - [x] Install the {{< var validmind.developer >}} in your environment
-- [x] Connect to a model in the {{< var validmind.platform >}} as a validator
-- [x] Preview and verify your model's validation report template
-- [x] View your champion model's documentation
+- [x] Connect to a record (model) in the {{< var validmind.platform >}} as a validator
+- [x] Preview and verify your validation report template
+- [x] View your champion's documentation
 
 :::
 ::::
 
 ::: {.tc}
 <br>
-Continue your model development journey with:
+Continue your validation journey with:
 <br><br>
 <!-- IMPORTANT: USE THE .HTML PATH AND NOT THE .QMD PATH FOR THE REVEALJS OUTPUT -->
 [Running Data Quality Tests](running-data-quality-tests.html){.button target="_blank"}
diff --git a/site/training/validator-fundamentals/validator-fundamentals-register.qmd b/site/training/validator-fundamentals/validator-fundamentals-register.qmd
index 4fad4463fc..81f500c9e4 100644
--- a/site/training/validator-fundamentals/validator-fundamentals-register.qmd
+++ b/site/training/validator-fundamentals/validator-fundamentals-register.qmd
@@ -17,34 +17,34 @@ listing:
     table-hover: true
     image-align: left
     contents:
-    - path: using-validmind-for-model-validation.html
-      title: "Using {{< var vm.product >}} for Model Validation"
+    - path: using-validmind-for-validation.html
+      title: "Using {{< var vm.product >}} for Validation"
       subtitle: "Module 1"
-      description: "{{< fa check >}} Install the {{< var validmind.developer >}} in your environment <br> {{< fa check >}} Connect to a champion model as a validator <br> {{< fa check >}} Preview the model's validation report template <br> {{< fa check >}} Review submitted model documentation"
+      description: "{{< fa check >}} Install the {{< var validmind.developer >}} in your environment <br> {{< fa check >}} Connect to a champion record (model) as a validator <br> {{< fa check >}} Preview the validation report template <br> {{< fa check >}} Review submitted documentation"
       reading-time: "30"
       author: "{{< var vm.product >}}"
     - path: running-data-quality-tests.html
       title: "Running Data Quality Tests"
       subtitle: "Module 2"
-      description: "{{< fa check >}} Identify relevant tests to run from {{< var vm.product >}}'s test vault <br> {{< fa check >}} Initialize datasets for use with the {{< var validmind.developer >}} <br> {{< fa check >}} Run and log out-of-the-box tests on your datasets <br> {{< fa check >}} Insert test results into your model’s validation report"
+      description: "{{< fa check >}} Identify relevant tests to run from {{< var vm.product >}}'s test vault <br> {{< fa check >}} Initialize datasets for use with the {{< var validmind.developer >}} <br> {{< fa check >}} Run and log out-of-the-box tests on your datasets <br> {{< fa check >}} Insert test results into your validation report"
       reading-time: "45"
       author: "{{< var vm.product >}}"
-    - path: developing-challenger-models.html
-      title: "Developing Challenger Models"
+    - path: developing-potential-challengers.html
+      title: "Developing Potential Challengers"
       subtitle: "Module 3"
-      description: "{{< fa check >}} Initialize models for use with the {{< var validmind.developer >}} <br> {{< fa check >}} Run and log out-of-the box and custom tests for your models <br> {{< fa check >}} Use the results of tests to log model artifacts (findings)"
+      description: "{{< fa check >}} Initialize records (models) for use with the {{< var validmind.developer >}} <br> {{< fa check >}} Run and log out-of-the-box and custom tests <br> {{< fa check >}} Use the results of tests to log artifacts (findings)"
       reading-time: "75"
       author: "{{< var vm.product >}}"
     - path: finalizing-validation-reports.html
       title: "Finalizing Validation Reports"
       subtitle: "Module 4"
-      description: "{{< fa check >}} Make qualitative edits to your validation report <br> {{< fa check >}} Submit your validation report for approval <br> {{< fa check >}} Track artifact resolution and other updates to your model"
+      description: "{{< fa check >}} Make qualitative edits to your validation report <br> {{< fa check >}} Submit your validation report for approval <br> {{< fa check >}} Track artifact resolution and other updates to your record (model)"
       reading-time: "30"
       author: "{{< var vm.product >}}"
     fields: [title, subtitle, description, reading-time]
 ---
 
-Learn how to use {{< var vm.product >}} as a **validator** to generate validation reports, automate testing, and collaborate with your model development team.
+Learn how to use {{< var vm.product >}} as a **validator** to generate validation reports, automate testing, and collaborate with your development team.
 
 ::: {.column-margin}
 {{< include /training/_compatibility.qmd >}}
diff --git a/site/training/what-is-validmind/what-is-validmind-register.qmd b/site/training/what-is-validmind/what-is-validmind-register.qmd
index 77dde88c75..1839864d57 100644
--- a/site/training/what-is-validmind/what-is-validmind-register.qmd
+++ b/site/training/what-is-validmind/what-is-validmind-register.qmd
@@ -103,7 +103,7 @@ Take a guided tour of {{< var vm.product >}} and discover how the platform helps
 #### <sup>Section 6</sup><br> Risk Insights & Regulatory Alignment
 
 - Use AI-powered document checker for compliance
-- Align with regulatory frameworks like SR 11-7, SS1/23, E-23, and EU AI Act
+- Align with regulatory frameworks like SR 26-2, SS1/23, E-23, and EU AI Act
 - Generate risk assessments with recommendations
 :::
 
diff --git a/site/training/what-is-validmind/what-is-validmind.qmd b/site/training/what-is-validmind/what-is-validmind.qmd
index e2d558ca25..845c847e62 100644
--- a/site/training/what-is-validmind/what-is-validmind.qmd
+++ b/site/training/what-is-validmind/what-is-validmind.qmd
@@ -672,7 +672,7 @@ As a validator, use the same tools used to develop models to ...
 :::: columns
 
 ::: {.column width="30%" .tc .nt4}
-[[{{< fa circle-info >}}&ensp;Validator Quickstart]{.button .button-light-green .shadow-5-ns}](/notebooks/quickstart/quickstart_model_validation.ipynb){target="_blank"}
+[[{{< fa circle-info >}}&ensp;Validator Quickstart]{.button .button-light-green .shadow-5-ns}](/notebooks/quickstart/quickstart_validation.ipynb){target="_blank"}
 :::
 
 ::: {.column width="40%" .tc .nt4}
@@ -680,7 +680,7 @@ As a validator, use the same tools used to develop models to ...
 :::
 
 ::: {.column width="30%" .tc .nt4}
-[[{{< fa code >}}&ensp;Validation Use Case]{.button .button-light-green .shadow-5-ns}](/notebooks/use_cases/model_validation/validate_application_scorecard.ipynb){target="_blank"}<br>
+[[{{< fa code >}}&ensp;Validation Use Case]{.button .button-light-green .shadow-5-ns}](/notebooks/use_cases/validation/validate_application_scorecard.ipynb){target="_blank"}<br>
 :::
 
 ::::
@@ -861,7 +861,7 @@ Use {{< var vm.product >}}'s {{< var vm.checker >}} to:
 - [Guide]{.b} you on how to improve clarity, completeness, and compliance.
 - [Align]{.b} with regulatory expectations for risk and model governance.
 
-  [SR 11-7]{.bubble .smallcaps} [SS1/23]{.bubble .smallcaps} [E-23]{.bubble .smallcaps} [EU AI ACT]{.bubble .smallcaps}
+  [SR 26-2]{.bubble .smallcaps} [SS1/23]{.bubble .smallcaps} [E-23]{.bubble .smallcaps} [EU AI ACT]{.bubble .smallcaps}
 
 :::
 
@@ -894,7 +894,7 @@ Use our implementation guides for:
 ::: {.f4 .pl3 .pt2}
 [[AI Governance<br>[[[EU AI ACT]{.green}]{.bubble}]{.f5}](/about/use-cases/ai-governance.qmd){target="_blank"}]{.button .shadow-5-ns .f4 .content-tile style="width: 100%;"}
 
-[[Model Risk Management<br>[[[SR 11-7]{.green}]{.bubble} [[SS1/23]{.green}]{.bubble} [[E-23]{.green}]{.bubble}]{.f5}](/about/use-cases/model-risk-management.qmd){target="_blank"}]{.button .shadow-5-ns .f4 .content-tile style="width: 100%;"}
+[[Model Risk Management<br>[[[SR 26-2]{.green}]{.bubble} [[SS1/23]{.green}]{.bubble} [[E-23]{.green}]{.bubble}]{.f5}](/about/use-cases/model-risk-management.qmd){target="_blank"}]{.button .shadow-5-ns .f4 .content-tile style="width: 100%;"}
 :::
 :::