From 2e2c87282f155ee40e44d5e1b8e7a50b98630ad5 Mon Sep 17 00:00:00 2001
From: Yiheng Tao <ruby092977@gmail.com>
Date: Thu, 24 Jul 2025 08:56:25 -0700
Subject: [PATCH] feat: Introduce PyEval functionality for secure Python
 expression evaluation

- Added a new endpoint for evaluating Python expressions via the PyEval API.
- Implemented a dedicated page in the web interface for users to input and evaluate expressions safely.
- Integrated the RestrictedPythonEvaluator to ensure secure execution of user-provided code.
- Updated the main application routes and templates to include navigation to the new PyEval feature.
- Enhanced the evaluator with additional safe built-in functions and improved error handling.

This update significantly expands the capabilities of the application, allowing users to safely evaluate Python expressions in a controlled environment.
---
 server/api/__init__.py       |   4 +-
 server/api/pyeval.py         | 141 ++++++++++++
 server/main.py               |   6 +
 server/templates/base.html   |   1 +
 server/templates/pyeval.html | 433 +++++++++++++++++++++++++++++++++++
 utils/pyeval/evaluator.py    |  40 +++-
 6 files changed, 623 insertions(+), 2 deletions(-)
 create mode 100644 server/api/pyeval.py
 create mode 100644 server/templates/pyeval.html

diff --git a/server/api/__init__.py b/server/api/__init__.py
index cc90ad5..b2df8f3 100644
--- a/server/api/__init__.py
+++ b/server/api/__init__.py
@@ -67,6 +67,8 @@
     api_export_dataframe,
 )
 
+from .pyeval import pyeval_routes
+
 # Aggregate all routes into a single list
 api_routes = [
     # Knowledge management endpoints
@@ -127,4 +129,4 @@
     Route("/api/dataframes/{df_id}/summary", endpoint=api_get_dataframe_summary, methods=["GET"]),
     Route("/api/dataframes/{df_id}/execute", endpoint=api_execute_dataframe_operation, methods=["POST"]),
     Route("/api/dataframes/{df_id}/export", endpoint=api_export_dataframe, methods=["POST"]),
-]
+] + pyeval_routes
diff --git a/server/api/pyeval.py b/server/api/pyeval.py
new file mode 100644
index 0000000..71053c6
--- /dev/null
+++ b/server/api/pyeval.py
@@ -0,0 +1,141 @@
+"""API endpoints for Python expression evaluation using the pyeval utility."""
+
+import logging
+from typing import Any, Dict, Optional
+
+from starlette.requests import Request
+from starlette.responses import JSONResponse
+from starlette.routing import Route
+
+from utils.pyeval.evaluator import RestrictedPythonEvaluator, EvaluationError
+
+logger = logging.getLogger(__name__)
+
+
+async def evaluate_expression(request: Request) -> JSONResponse:
+    """Evaluate a Python expression using the RestrictedPythonEvaluator.
+
+    POST /api/pyeval/evaluate
+
+    Request body:
+    {
+        "expression": "python_expression_to_evaluate",
+        "context": {
+            "variable_name": "variable_value",
+            ...
+        }
+    }
+
+    Response:
+    {
+        "success": true/false,
+        "result": "evaluation_result" | null,
+        "execution_time_ms": 123.45,
+        "error_message": "error_description" | null
+    }
+
+    Malformed JSON, a non-object body, a non-string or empty expression, and a
+    non-dict context are rejected with HTTP 400. Evaluation failures reported
+    by the evaluator are returned with HTTP 200 and "success": false.
+    """
+    def _reply(status_code: int = 200, **fields: Any) -> JSONResponse:
+        # Every response carries the same four keys; callers override the rest.
+        payload = {"success": False, "result": None, "execution_time_ms": 0.0, "error_message": None}
+        payload.update(fields)
+        return JSONResponse(payload, status_code=status_code)
+
+    try:
+        # request.json() raises json.JSONDecodeError (a ValueError) on bad input.
+        try:
+            body = await request.json()
+        except ValueError:
+            return _reply(400, error_message="Request body must be valid JSON")
+
+        if not isinstance(body, dict):
+            return _reply(400, error_message="Request body must be a JSON object")
+
+        expression = body.get("expression", "")
+        context = body.get("context", {})
+
+        # Validate input
+        if not isinstance(expression, str):
+            return _reply(400, error_message="Expression must be a string")
+        expression = expression.strip()
+        if not expression:
+            return _reply(400, error_message="Expression cannot be empty")
+
+        if not isinstance(context, dict):
+            return _reply(400, error_message="Context must be a dictionary")
+
+        logger.info(f"Evaluating expression: {expression[:100]}{'...' if len(expression) > 100 else ''}")
+        logger.debug(f"Context variables: {list(context.keys())}")
+
+        # Create evaluator and evaluate expression
+        evaluator = RestrictedPythonEvaluator()
+        result = evaluator.evaluate_expression(expression, context)
+
+        if not result.success:
+            logger.warning(f"Expression evaluation failed: {result.error_message}")
+            return _reply(
+                execution_time_ms=result.execution_time_ms,
+                error_message=result.error_message,
+            )
+
+        # Convert result to string representation for JSON serialization
+        result_str = _format_result_for_json(result.result)
+        logger.info(f"Expression evaluated successfully in {result.execution_time_ms:.2f}ms")
+        return _reply(
+            success=True,
+            result=result_str,
+            execution_time_ms=result.execution_time_ms,
+        )
+
+    except Exception as e:
+        logger.error(f"Error in evaluate_expression endpoint: {e}", exc_info=True)
+        return _reply(500, error_message=f"Server error: {str(e)}")
+
+
+def _format_result_for_json(result: Any) -> str:
+    """Format evaluation result for JSON serialization.
+
+    Objects exposing ``to_string`` (e.g. pandas DataFrames and Series) are
+    rendered with it; everything else is rendered with ``str``. Whatever the
+    source, the text is capped at 10000 characters so that one large result
+    cannot produce an unbounded response body.
+
+    Args:
+        result: The result from expression evaluation
+
+    Returns:
+        String representation of the result suitable for JSON response; if
+        formatting itself raises, a short "<Error formatting result: ...>"
+        placeholder is returned instead.
+    """
+    max_chars = 10000
+
+    try:
+        if hasattr(result, 'to_string'):
+            # This covers pandas DataFrames and Series
+            text = result.to_string()
+        else:
+            # numpy arrays, other iterables and basic types all share str()
+            text = str(result)
+
+        # to_string() is found by duck typing, so make sure the slicing below
+        # is always applied to a real string.
+        if not isinstance(text, str):
+            text = str(text)
+
+        if len(text) > max_chars:
+            return text[:max_chars] + "... (truncated)"
+        return text
+
+    except Exception as e:
+        logger.warning(f"Error formatting result for JSON: {e}")
+        return f"<Error formatting result: {str(e)}>"
+
+
+# API routes for pyeval functionality; server/api/__init__.py appends this list to api_routes
+pyeval_routes = [
+    Route("/api/pyeval/evaluate", endpoint=evaluate_expression, methods=["POST"]),
+]
diff --git a/server/main.py b/server/main.py
index 05b81da..1a90de9 100644
--- a/server/main.py
+++ b/server/main.py
@@ -391,6 +391,11 @@ async def dataframe_detail_page(request: Request):
         "dataframe_detail.html", {"request": request, "current_page": "dataframes", "df_id": df_id}
     )
 
+async def pyeval_page(request: Request):
+    """Serve the PyEval page, marking "pyeval" as the active navigation entry."""
+    page_context = {"request": request, "current_page": "pyeval"}
+    return templates.TemplateResponse("pyeval.html", page_context)
+
 
 # --- Add routes ---
 routes = [
@@ -402,6 +407,7 @@ async def dataframe_detail_page(request: Request):
     Route("/visualizations", endpoint=visualizations_page, methods=["GET"]),
     Route("/dataframes", endpoint=dataframes_page, methods=["GET"]),
     Route("/dataframes/{df_id}", endpoint=dataframe_detail_page, methods=["GET"]),
+    Route("/pyeval", endpoint=pyeval_page, methods=["GET"]),
     Route("/config", endpoint=config_page, methods=["GET"]),
     Route("/sse", endpoint=handle_sse),
     Mount("/messages/", app=sse.handle_post_message),
diff --git a/server/templates/base.html b/server/templates/base.html
index 4a626ee..40a2740 100644
--- a/server/templates/base.html
+++ b/server/templates/base.html
@@ -370,6 +370,7 @@ <h1>MCP Knowledge Server</h1>
             <a href="/knowledge" class="nav-link {{ 'active' if current_page == 'knowledge' else '' }}">Knowledge</a>
             <a href="/jobs" class="nav-link {{ 'active' if current_page == 'jobs' else '' }}">Background Jobs</a>
             <a href="/dataframes" class="nav-link {{ 'active' if current_page == 'dataframes' else '' }}">DataFrames</a>
+            <a href="/pyeval" class="nav-link {{ 'active' if current_page == 'pyeval' else '' }}">PyEval</a>
             <a href="/tools" class="nav-link {{ 'active' if current_page == 'tools' else '' }}">Tools</a>
             <a href="/tool-history" class="nav-link {{ 'active' if current_page == 'tool_history' else '' }}">Tool
                 History</a>
diff --git a/server/templates/pyeval.html b/server/templates/pyeval.html
new file mode 100644
index 0000000..bcc7b2d
--- /dev/null
+++ b/server/templates/pyeval.html
@@ -0,0 +1,433 @@
+{% extends "base.html" %}
+
+{% block title %}PyEval - MCP Knowledge Server{% endblock %}
+
+{% block extra_styles %}
+<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/codemirror/5.65.2/codemirror.min.css">
+<link rel="stylesheet" href="https://cdnjs.cloudflare.com/ajax/libs/codemirror/5.65.2/theme/default.min.css">
+<style>
+    .pyeval-container {
+        max-width: 1200px;
+        margin: 0 auto;
+    }
+
+    .evaluation-panel {
+        display: grid;
+        grid-template-columns: 1fr 1fr;
+        gap: 2em;
+        margin-bottom: 2em;
+    }
+
+    .code-input-section {
+        background: white;
+        padding: 1.5em;
+        border-radius: 8px;
+        box-shadow: 0 2px 4px rgba(0,0,0,0.1);
+    }
+
+    .result-section {
+        background: white;
+        padding: 1.5em;
+        border-radius: 8px;
+        box-shadow: 0 2px 4px rgba(0,0,0,0.1);
+    }
+
+    .CodeMirror {
+        height: 300px;
+        border: 1px solid #ddd;
+        border-radius: 4px;
+        font-family: 'Monaco', 'Menlo', 'Ubuntu Mono', monospace;
+    }
+
+    .context-section {
+        margin-bottom: 1em;
+    }
+
+    .context-input {
+        width: 100%;
+        height: 120px;
+        font-family: 'Monaco', 'Menlo', 'Ubuntu Mono', monospace;
+        font-size: 12px;
+        resize: vertical;
+    }
+
+    .evaluation-controls {
+        display: flex;
+        gap: 1em;
+        align-items: center;
+        margin-top: 1em;
+    }
+
+    .result-display {
+        background: #f8f9fa;
+        border: 1px solid #e9ecef;
+        border-radius: 4px;
+        padding: 1em;
+        min-height: 200px;
+        font-family: 'Monaco', 'Menlo', 'Ubuntu Mono', monospace;
+        font-size: 12px;
+        white-space: pre-wrap;
+        overflow-x: auto;
+    }
+
+    .result-success {
+        background: #d4edda;
+        border-color: #c3e6cb;
+        color: #155724;
+    }
+
+    .result-error {
+        background: #f8d7da;
+        border-color: #f5c6cb;
+        color: #721c24;
+    }
+
+    .execution-info {
+        display: flex;
+        justify-content: space-between;
+        align-items: center;
+        margin-bottom: 1em;
+        padding: 0.5em;
+        background: #f8f9fa;
+        border-radius: 4px;
+        font-size: 0.9em;
+    }
+
+    .execution-time {
+        color: #666;
+    }
+
+    .execution-status {
+        font-weight: bold;
+    }
+
+    .execution-status.success {
+        color: #28a745;
+    }
+
+    .execution-status.error {
+        color: #dc3545;
+    }
+
+    .examples-section {
+        background: white;
+        padding: 1.5em;
+        border-radius: 8px;
+        box-shadow: 0 2px 4px rgba(0,0,0,0.1);
+        margin-bottom: 2em;
+    }
+
+    .example-tabs {
+        display: flex;
+        gap: 0.5em;
+        margin-bottom: 1em;
+    }
+
+    .example-tab {
+        padding: 0.5em 1em;
+        background: #f8f9fa;
+        border: 1px solid #dee2e6;
+        border-radius: 4px 4px 0 0;
+        cursor: pointer;
+        transition: background 0.2s;
+    }
+
+    .example-tab:hover {
+        background: #e9ecef;
+    }
+
+    .example-tab.active {
+        background: #0077cc;
+        color: white;
+        border-color: #0077cc;
+    }
+
+    .example-content {
+        display: none;
+        padding: 1em;
+        border: 1px solid #dee2e6;
+        border-radius: 0 4px 4px 4px;
+        background: #f8f9fa;
+    }
+
+    .example-content.active {
+        display: block;
+    }
+
+    .example-code {
+        background: #2d3748;
+        color: #e2e8f0;
+        padding: 1em;
+        border-radius: 4px;
+        font-family: 'Monaco', 'Menlo', 'Ubuntu Mono', monospace;
+        font-size: 12px;
+        margin: 0.5em 0;
+        overflow-x: auto;
+    }
+
+    .load-example-btn {
+        background: #28a745;
+        margin-top: 0.5em;
+    }
+
+    .load-example-btn:hover {
+        background: #218838;
+    }
+
+    @media (max-width: 768px) {
+        .evaluation-panel {
+            grid-template-columns: 1fr;
+        }
+
+        .pyeval-container {
+            margin: 0 1em;
+        }
+    }
+</style>
+{% endblock %}
+
+{% block content %}
+<div class="pyeval-container">
+    <div class="card">
+        <h2>Python Expression Evaluator</h2>
+        <p>Safely evaluate Python expressions using RestrictedPython. Perfect for DataFrame operations and data analysis.</p>
+    </div>
+
+    <div class="examples-section">
+        <h3>Examples</h3>
+        <div class="example-tabs">
+            <div class="example-tab active" onclick="switchExample('basic')">Basic Operations</div>
+            <div class="example-tab" onclick="switchExample('dataframe')">DataFrame Operations</div>
+            <div class="example-tab" onclick="switchExample('math')">Mathematical</div>
+        </div>
+
+        <div id="basic-example" class="example-content active">
+            <h4>Basic Python Operations</h4>
+            <p>Simple arithmetic and list operations:</p>
+            <div class="example-code"># Basic arithmetic
+sum([1, 2, 3, 4, 5])
+
+# List comprehension
+[x**2 for x in range(5)]
+
+# String operations
+"hello world".title()</div>
+            <button class="load-example-btn" onclick="loadExample('basic')">Load Example</button>
+        </div>
+
+        <div id="dataframe-example" class="example-content">
+            <h4>DataFrame Operations</h4>
+            <p>Working with pandas DataFrames:</p>
+            <div class="example-code"># DataFrame operations (requires DataFrame in context)
+df.head(10)
+
+# Column statistics
+df['column_name'].describe()
+
+# Filtering
+df[df['age'] > 25]</div>
+            <p><strong>Context needed:</strong></p>
+            <div class="example-code">{"df": "your_dataframe_variable", "pd": "pandas"}</div>
+            <button class="load-example-btn" onclick="loadExample('dataframe')">Load Example</button>
+        </div>
+
+        <div id="math-example" class="example-content">
+            <h4>Mathematical Operations</h4>
+            <p>Advanced mathematical computations:</p>
+            <div class="example-code"># Statistical operations (statistics module is available)
+statistics.mean([1, 2, 3, 4, 5])
+
+# Math operations
+math.sqrt(16) + math.sin(math.pi / 2)
+
+# Complex calculations with generators
+sum(x**2 for x in range(10) if x % 2 == 0)</div>
+            <button class="load-example-btn" onclick="loadExample('math')">Load Example</button>
+        </div>
+    </div>
+
+    <div class="evaluation-panel">
+        <div class="code-input-section">
+            <h3>Python Expression</h3>
+            <textarea id="code-input" placeholder="Enter your Python expression here...">sum([1, 2, 3, 4, 5])</textarea>
+
+            <div class="context-section">
+                <h4>Context Variables (JSON)</h4>
+                <textarea id="context-input" class="context-input" placeholder='{"df": "your_dataframe", "pd": "pandas"}'>{}</textarea>
+            </div>
+
+            <div class="evaluation-controls">
+                <button id="evaluate-btn" onclick="evaluateExpression()">Evaluate Expression</button>
+                <button onclick="clearInputs()">Clear</button>
+                <div id="evaluation-status"></div>
+            </div>
+        </div>
+
+        <div class="result-section">
+            <h3>Result</h3>
+            <div id="execution-info" class="execution-info" style="display: none;">
+                <div class="execution-status" id="execution-status">Ready</div>
+                <div class="execution-time" id="execution-time"></div>
+            </div>
+            <div id="result-display" class="result-display">Ready to evaluate your Python expression...</div>
+        </div>
+    </div>
+</div>
+{% endblock %}
+
+{% block extra_scripts %}
+<script src="https://cdnjs.cloudflare.com/ajax/libs/codemirror/5.65.2/codemirror.min.js"></script>
+<script src="https://cdnjs.cloudflare.com/ajax/libs/codemirror/5.65.2/mode/python/python.min.js"></script>
+<script>
+    let codeEditor;
+
+    document.addEventListener('DOMContentLoaded', function() {
+        // Initialize CodeMirror
+        const codeInput = document.getElementById('code-input');
+        codeEditor = CodeMirror.fromTextArea(codeInput, {
+            mode: 'python',
+            theme: 'default',
+            lineNumbers: true,
+            matchBrackets: true,
+            indentUnit: 4,
+            indentWithTabs: false,
+            extraKeys: {
+                "Ctrl-Enter": evaluateExpression,
+                "Cmd-Enter": evaluateExpression
+            }
+        });
+    });
+
+    function switchExample(exampleType) {
+        // Highlight only the tab whose inline onclick targets this example
+        const tabSelector = `[onclick="switchExample('${exampleType}')"]`;
+        for (const tabEl of document.querySelectorAll('.example-tab')) {
+            tabEl.classList.remove('active');
+        }
+        document.querySelector(tabSelector).classList.add('active');
+        // Reveal the matching example panel and hide the others
+        for (const panelEl of document.querySelectorAll('.example-content')) {
+            panelEl.classList.remove('active');
+        }
+        document.getElementById(`${exampleType}-example`).classList.add('active');
+    }
+
+    // Fill the editor and the context box with the starter snippet of one example.
+    // Does nothing when the lookup finds no preset for exampleType.
+    function loadExample(exampleType) {
+        const presets = {
+            basic: {
+                code: 'sum([1, 2, 3, 4, 5])',
+                context: '{}'
+            },
+            dataframe: {
+                code: 'df.head(10)',
+                context: '{"df": "your_dataframe_variable", "pd": "pandas"}'
+            },
+            math: {
+                code: 'statistics.mean([1, 2, 3, 4, 5])',
+                context: '{}'
+            }
+        };
+        const chosen = presets[exampleType];
+        if (!chosen) return;
+        codeEditor.setValue(chosen.code);
+        document.getElementById('context-input').value = chosen.context;
+    }
+
+    // Send the editor's expression plus the JSON context to /api/pyeval/evaluate
+    // and render the outcome (result text, status and timing) in the result panel.
+    async function evaluateExpression() {
+        const expression = codeEditor.getValue().trim();
+        const contextInput = document.getElementById('context-input').value.trim();
+        const evaluateBtn = document.getElementById('evaluate-btn');
+        const resultDisplay = document.getElementById('result-display');
+        const executionInfo = document.getElementById('execution-info');
+        const executionStatus = document.getElementById('execution-status');
+        const executionTime = document.getElementById('execution-time');
+
+        // The button is disabled while a request is in flight, but the
+        // Ctrl/Cmd-Enter shortcut bypasses it; ignore re-entrant calls.
+        if (evaluateBtn.disabled) return;
+
+        if (!expression) {
+            showStatus('evaluation-status', 'Please enter a Python expression', true);
+            return;
+        }
+
+        // Parse context JSON
+        let context = {};
+        if (contextInput) {
+            try {
+                context = JSON.parse(contextInput);
+            } catch (e) {
+                showStatus('evaluation-status', 'Invalid JSON in context variables', true);
+                return;
+            }
+        }
+
+        // Update UI for evaluation
+        evaluateBtn.disabled = true;
+        evaluateBtn.textContent = 'Evaluating...';
+        clearStatus('evaluation-status');
+
+        resultDisplay.className = 'result-display';
+        resultDisplay.textContent = 'Evaluating expression...';
+        executionInfo.style.display = 'none';
+
+        try {
+            const response = await fetch('/api/pyeval/evaluate', {
+                method: 'POST',
+                headers: { 'Content-Type': 'application/json' },
+                body: JSON.stringify({ expression, context })
+            });
+
+            const data = await response.json();
+
+            // Show execution info
+            executionInfo.style.display = 'flex';
+            executionTime.textContent = `${data.execution_time_ms?.toFixed(2) || 0}ms`;
+
+            if (data.success) {
+                executionStatus.textContent = 'Success';
+                executionStatus.className = 'execution-status success';
+                resultDisplay.className = 'result-display result-success';
+                // ?? rather than ||: an empty string is a valid result, only null/undefined is "nothing"
+                resultDisplay.textContent = data.result ?? 'No result returned';
+            } else {
+                executionStatus.textContent = 'Error';
+                executionStatus.className = 'execution-status error';
+                resultDisplay.className = 'result-display result-error';
+                resultDisplay.textContent = data.error_message || 'Unknown error occurred';
+            }
+
+        } catch (error) {
+            console.error('Evaluation error:', error);
+            executionInfo.style.display = 'flex';
+            executionStatus.textContent = 'Network Error';
+            executionStatus.className = 'execution-status error';
+            executionTime.textContent = '';
+            resultDisplay.className = 'result-display result-error';
+            resultDisplay.textContent = `Network error: ${error.message}`;
+        } finally {
+            evaluateBtn.disabled = false;
+            evaluateBtn.textContent = 'Evaluate Expression';
+        }
+    }
+
+    function clearInputs() {
+        codeEditor.setValue('');  // empty the CodeMirror editor
+        document.getElementById('context-input').value = '{}';  // empty JSON object as context
+        document.getElementById('result-display').className = 'result-display';  // drop result-success / result-error styling
+        document.getElementById('result-display').textContent = 'Ready to evaluate your Python expression...';
+        document.getElementById('execution-info').style.display = 'none';  // hide the status/timing bar
+        clearStatus('evaluation-status');
+    }
+
+    // Add keyboard shortcut hint
+    document.addEventListener('DOMContentLoaded', function() {
+        const evaluateBtn = document.getElementById('evaluate-btn');
+        evaluateBtn.title = 'Keyboard shortcut: Ctrl+Enter (Cmd+Enter on Mac)';
+    });
+</script>
+{% endblock %}
diff --git a/utils/pyeval/evaluator.py b/utils/pyeval/evaluator.py
index deeb406..d67f8c9 100644
--- a/utils/pyeval/evaluator.py
+++ b/utils/pyeval/evaluator.py
@@ -12,7 +12,7 @@
 
 import pandas as pd
 from RestrictedPython import compile_restricted_exec, safe_globals, limited_builtins
-from RestrictedPython.Guards import safer_getattr, guarded_setattr
+from RestrictedPython.Guards import safer_getattr, guarded_setattr, guarded_iter_unpack_sequence
 
 logger = logging.getLogger(__name__)
 
@@ -52,6 +52,9 @@ def _create_safe_builtins(self) -> Dict[str, Any]:
         Returns:
             Dictionary containing safe built-in functions.
         """
+        import statistics
+        import math
+
         safe_builtins = limited_builtins.copy()
         safe_builtins.update({
             # Mathematical functions
@@ -61,12 +64,15 @@ def _create_safe_builtins(self) -> Dict[str, Any]:
             'sum': sum,
             'abs': abs,
             'round': round,
+            'pow': pow,
 
             # Collection functions
             'sorted': sorted,
             'enumerate': enumerate,
             'zip': zip,
             'range': range,
+            'filter': filter,
+            'map': map,
 
             # Type constructors
             'list': list,
@@ -77,9 +83,39 @@ def _create_safe_builtins(self) -> Dict[str, Any]:
             'int': int,
             'float': float,
             'bool': bool,
+
+            # Safe modules
+            'statistics': statistics,
+            'math': math,
         })
         return safe_builtins
 
+    def _create_safe_getiter(self) -> callable:
+        """Build the callable registered as ``_getiter_`` in the restricted globals.
+
+        Returns:
+            A one-argument function that returns ``iter(obj)``.
+        """
+        def safe_getiter(obj):
+            """Return an iterator over ``obj``.
+
+            A failing ``iter()`` call is logged as a warning, then re-raised.
+
+            Args:
+                obj: Object to iterate over
+
+            Raises:
+                TypeError: If object is not iterable
+            """
+            try:
+                iterator = iter(obj)
+            except TypeError as exc:
+                self._logger.warning(f"Safe getiter failed for object: {exc}")
+                raise
+            return iterator
+
+        return safe_getiter
+
     def _create_safe_getitem(self) -> callable:
         """Create a safe getitem function for accessing DataFrame columns and Series values.
 
@@ -124,6 +160,8 @@ def _create_restricted_globals(self, context: Dict[str, Any]) -> Dict[str, Any]:
             '_getattr_': safer_getattr,
             '_setattr_': guarded_setattr,
             '_getitem_': self._create_safe_getitem(),
+            '_getiter_': self._create_safe_getiter(),
+            '_iter_unpack_sequence_': guarded_iter_unpack_sequence,
         })
 
         # Add user-provided context