Pulastya B commited on
Commit
1ca2e0e
·
1 Parent(s): 2cf9e11

Fixed Bugs where the SSE Streaming was improper added support for Auto Gluon, Fixed instances where stale schemas was causing EDA plots generation to fail

Browse files
examples/titanic_example.py DELETED
@@ -1,166 +0,0 @@
1
- """
2
- Titanic Example - Demonstrating the complete Data Science Copilot workflow
3
- """
4
-
5
- import sys
6
- import os
7
- from pathlib import Path
8
-
9
- # Add src to path
10
- sys.path.insert(0, os.path.join(os.path.dirname(__file__), 'src'))
11
-
12
- from orchestrator import DataScienceCopilot
13
- from rich.console import Console
14
- from rich.panel import Panel
15
-
16
- console = Console()
17
-
18
-
19
- def main():
20
- """
21
- Complete example using the Titanic dataset.
22
-
23
- This demonstrates the full workflow:
24
- 1. Dataset profiling
25
- 2. Quality issue detection
26
- 3. Data cleaning
27
- 4. Feature engineering
28
- 5. Model training
29
- 6. Report generation
30
- """
31
-
32
- console.print(Panel.fit(
33
- "🚢 Titanic Survival Prediction - Complete Workflow Example",
34
- style="bold blue"
35
- ))
36
-
37
- # Setup
38
- titanic_path = "./data/titanic.csv"
39
-
40
- # Check if dataset exists
41
- if not Path(titanic_path).exists():
42
- console.print("\n[yellow]⚠ Titanic dataset not found at ./data/titanic.csv[/yellow]")
43
- console.print("[yellow]Please download it from: https://www.kaggle.com/c/titanic/data[/yellow]")
44
- console.print("[yellow]Or place your own CSV file in the data directory[/yellow]\n")
45
-
46
- # Use a sample path instead
47
- console.print("[blue]Using sample dataset path for demonstration...[/blue]\n")
48
- titanic_path = "your_dataset.csv" # User should replace this
49
-
50
- # Initialize copilot
51
- console.print("\n[bold]Step 1: Initialize Data Science Copilot[/bold]")
52
- try:
53
- copilot = DataScienceCopilot(reasoning_effort="medium")
54
- console.print("[green]✓ Copilot initialized successfully[/green]")
55
- except Exception as e:
56
- console.print(f"[red]✗ Error: {e}[/red]")
57
- console.print("[yellow]Make sure to set GROQ_API_KEY in .env file[/yellow]")
58
- return
59
-
60
- # Define the task
61
- task_description = """
62
- Analyze the Titanic dataset and build a model to predict passenger survival.
63
-
64
- Key objectives:
65
- 1. Understand the data structure and identify quality issues
66
- 2. Handle missing values appropriately
67
- 3. Engineer relevant features from available data (e.g., family size, titles from names)
68
- 4. Train and compare multiple baseline models
69
- 5. Identify the most important features for prediction
70
- 6. Provide recommendations for improvement
71
-
72
- Target: Achieve competitive performance (aim for 50-70th percentile on Kaggle leaderboard)
73
- """
74
-
75
- target_column = "Survived"
76
-
77
- console.print("\n[bold]Step 2: Run Complete Analysis Workflow[/bold]")
78
- console.print(f"Dataset: {titanic_path}")
79
- console.print(f"Target: {target_column}")
80
- console.print(f"Task: Predict passenger survival\n")
81
-
82
- # Run analysis
83
- try:
84
- result = copilot.analyze(
85
- file_path=titanic_path,
86
- task_description=task_description,
87
- target_col=target_column,
88
- use_cache=True,
89
- max_iterations=15 # Allow more iterations for complex workflow
90
- )
91
-
92
- # Display results
93
- if result["status"] == "success":
94
- console.print("\n[green]✓ Analysis Complete![/green]\n")
95
-
96
- # Display summary
97
- console.print(Panel(
98
- result["summary"],
99
- title="📋 Final Analysis Summary",
100
- border_style="green"
101
- ))
102
-
103
- # Display workflow steps
104
- console.print("\n[bold]🔧 Workflow Steps Executed:[/bold]")
105
- for i, step in enumerate(result["workflow_history"], 1):
106
- tool = step["tool"]
107
- success = step["result"].get("success", False)
108
- icon = "✓" if success else "✗"
109
- color = "green" if success else "red"
110
- console.print(f"{i}. [{color}]{icon}[/{color}] {tool}")
111
-
112
- # Display statistics
113
- console.print(f"\n[bold]📊 Execution Statistics:[/bold]")
114
- console.print(f" Total Iterations: {result['iterations']}")
115
- console.print(f" API Calls Made: {result['api_calls']}")
116
- console.print(f" Execution Time: {result['execution_time']}s")
117
-
118
- # Check for trained models
119
- console.print("\n[bold]🤖 Model Training Results:[/bold]")
120
- for step in result["workflow_history"]:
121
- if step["tool"] == "train_baseline_models":
122
- if step["result"].get("success"):
123
- models_result = step["result"]["result"]
124
- best_model = models_result.get("best_model", {})
125
- console.print(f" Best Model: {best_model.get('name')}")
126
- console.print(f" Score: {best_model.get('score'):.4f}")
127
- console.print(f" Model Path: {best_model.get('model_path')}")
128
-
129
- # Save results
130
- output_file = "./outputs/reports/titanic_analysis.json"
131
- Path(output_file).parent.mkdir(parents=True, exist_ok=True)
132
-
133
- import json
134
- with open(output_file, "w") as f:
135
- json.dump(result, f, indent=2)
136
-
137
- console.print(f"\n[cyan]💾 Full results saved to: {output_file}[/cyan]")
138
-
139
- # Next steps
140
- console.print("\n[bold]🎯 Next Steps:[/bold]")
141
- console.print(" 1. Review the generated models in ./outputs/models/")
142
- console.print(" 2. Check data quality reports in ./outputs/reports/")
143
- console.print(" 3. Examine cleaned datasets in ./outputs/data/")
144
- console.print(" 4. Use the best model for predictions on new data")
145
-
146
- elif result["status"] == "error":
147
- console.print(f"\n[red]✗ Analysis failed: {result['error']}[/red]")
148
- console.print(f"Error type: {result['error_type']}")
149
-
150
- else:
151
- console.print(f"\n[yellow]⚠ Analysis incomplete: {result.get('message')}[/yellow]")
152
-
153
- except Exception as e:
154
- console.print(f"\n[red]✗ Unexpected error: {e}[/red]")
155
- import traceback
156
- console.print(traceback.format_exc())
157
-
158
- # Cache statistics
159
- console.print("\n[bold]📦 Cache Statistics:[/bold]")
160
- cache_stats = copilot.get_cache_stats()
161
- console.print(f" Valid Entries: {cache_stats['valid_entries']}")
162
- console.print(f" Cache Size: {cache_stats['size_mb']} MB")
163
-
164
-
165
- if __name__ == "__main__":
166
- main()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
idx.html DELETED
@@ -1,1281 +0,0 @@
1
- <!DOCTYPE html>
2
- <html lang="en">
3
- <head>
4
- <meta charset="UTF-8">
5
- <meta name="viewport" content="width=device-width, initial-scale=1.0">
6
- <title>Cute Lamp Login - Ultimate Edition</title>
7
- <style>
8
- * {
9
- margin: 0;
10
- padding: 0;
11
- box-sizing: border-box;
12
- }
13
-
14
- body {
15
- font-family: 'Segoe UI', Tahoma, Geneva, Verdana, sans-serif;
16
- background: linear-gradient(135deg, #0a0a0a 0%, #1a1a2e 50%, #16213e 100%);
17
- min-height: 100vh;
18
- display: flex;
19
- flex-direction: column;
20
- align-items: center;
21
- justify-content: center;
22
- overflow-x: hidden;
23
- position: relative;
24
- padding: 20px;
25
- }
26
-
27
- /* Enhanced Animated background particles */
28
- .particles {
29
- position: fixed;
30
- width: 100%;
31
- height: 100%;
32
- overflow: hidden;
33
- z-index: 0;
34
- top: 0;
35
- left: 0;
36
- }
37
-
38
- .particle {
39
- position: absolute;
40
- width: 4px;
41
- height: 4px;
42
- background: radial-gradient(circle, #ffa500, transparent);
43
- border-radius: 50%;
44
- animation: float 15s infinite ease-in-out;
45
- box-shadow: 0 0 10px #ffa500;
46
- }
47
-
48
- @keyframes float {
49
- 0% { transform: translate(0, 100vh) scale(0); opacity: 0; }
50
- 10% { opacity: 1; }
51
- 90% { opacity: 1; }
52
- 100% { transform: translate(var(--tx), -100vh) scale(1); opacity: 0; }
53
- }
54
-
55
- /* Sparkles */
56
- .sparkle {
57
- position: absolute;
58
- width: 3px;
59
- height: 3px;
60
- background: #fff;
61
- border-radius: 50%;
62
- animation: sparkle 3s infinite;
63
- box-shadow: 0 0 8px #fff;
64
- }
65
-
66
- @keyframes sparkle {
67
- 0%, 100% { opacity: 0; transform: scale(0); }
68
- 50% { opacity: 1; transform: scale(1.5); }
69
- }
70
-
71
- .title {
72
- font-size: 52px;
73
- font-weight: 700;
74
- background: linear-gradient(90deg, #ffa500, #ff6b35, #ffa500);
75
- background-size: 200% auto;
76
- -webkit-background-clip: text;
77
- -webkit-text-fill-color: transparent;
78
- background-clip: text;
79
- margin-bottom: 50px;
80
- text-align: center;
81
- z-index: 2;
82
- text-shadow: 0 0 30px rgba(255, 165, 0, 0.5);
83
- animation: gradientMove 3s linear infinite, fadeInDown 1s ease;
84
- letter-spacing: 2px;
85
- }
86
-
87
- @keyframes gradientMove {
88
- 0% { background-position: 0% center; }
89
- 100% { background-position: 200% center; }
90
- }
91
-
92
- @keyframes fadeInDown {
93
- from {
94
- opacity: 0;
95
- transform: translateY(-50px);
96
- }
97
- to {
98
- opacity: 1;
99
- transform: translateY(0);
100
- }
101
- }
102
-
103
- .container {
104
- display: flex;
105
- align-items: center;
106
- justify-content: center;
107
- gap: 80px;
108
- background: rgba(30, 40, 60, 0.5);
109
- padding: 70px;
110
- border-radius: 30px;
111
- border: 2px solid rgba(255, 255, 255, 0.1);
112
- backdrop-filter: blur(20px);
113
- box-shadow: 0 30px 80px rgba(0, 0, 0, 0.6), inset 0 0 40px rgba(255, 165, 0, 0.05);
114
- z-index: 2;
115
- animation: fadeIn 1.2s ease 0.3s backwards;
116
- position: relative;
117
- max-width: 1200px;
118
- }
119
-
120
- @keyframes fadeIn {
121
- from {
122
- opacity: 0;
123
- transform: scale(0.8) rotateX(10deg);
124
- }
125
- to {
126
- opacity: 1;
127
- transform: scale(1) rotateX(0);
128
- }
129
- }
130
-
131
- /* Enhanced Lamp Section */
132
- .lamp-section {
133
- position: relative;
134
- display: flex;
135
- align-items: center;
136
- justify-content: center;
137
- width: 300px;
138
- height: 400px;
139
- }
140
-
141
- .lamp-container {
142
- position: relative;
143
- cursor: pointer;
144
- transition: transform 0.3s ease;
145
- }
146
-
147
- .lamp-container:hover {
148
- transform: scale(1.05);
149
- }
150
-
151
- .lamp {
152
- position: relative;
153
- width: 200px;
154
- height: 320px;
155
- display: flex;
156
- align-items: flex-end;
157
- justify-content: center;
158
- animation: lampFloat 4s ease-in-out infinite;
159
- filter: drop-shadow(0 10px 30px rgba(0, 0, 0, 0.5));
160
- }
161
-
162
- @keyframes lampFloat {
163
- 0%, 100% { transform: translateY(0) rotate(0deg); }
164
- 25% { transform: translateY(-12px) rotate(-2deg); }
165
- 75% { transform: translateY(-8px) rotate(2deg); }
166
- }
167
-
168
- /* Electric Cord */
169
- .cord {
170
- position: absolute;
171
- width: 4px;
172
- height: 80px;
173
- background: linear-gradient(180deg, #555, #333);
174
- top: -80px;
175
- left: 50%;
176
- transform: translateX(-50%);
177
- border-radius: 2px;
178
- animation: cordSwing 4s ease-in-out infinite;
179
- transform-origin: top center;
180
- }
181
-
182
- @keyframes cordSwing {
183
- 0%, 100% { transform: translateX(-50%) rotate(0deg); }
184
- 25% { transform: translateX(-50%) rotate(-3deg); }
185
- 75% { transform: translateX(-50%) rotate(3deg); }
186
- }
187
-
188
- .cord-plug {
189
- position: absolute;
190
- top: -10px;
191
- left: 50%;
192
- transform: translateX(-50%);
193
- width: 12px;
194
- height: 12px;
195
- background: #444;
196
- border-radius: 50%;
197
- box-shadow: 0 2px 5px rgba(0,0,0,0.5);
198
- }
199
-
200
- .lamp-stand {
201
- width: 10px;
202
- height: 160px;
203
- background: linear-gradient(180deg, #e8e8e8, #fff, #e8e8e8);
204
- border-radius: 5px;
205
- position: absolute;
206
- bottom: 0;
207
- box-shadow: 0 6px 15px rgba(0, 0, 0, 0.4), inset 0 0 10px rgba(255, 255, 255, 0.5);
208
- }
209
-
210
- .lamp-base {
211
- width: 80px;
212
- height: 25px;
213
- background: linear-gradient(180deg, #d0d0d0, #f8f8f8, #d0d0d0);
214
- border-radius: 15px;
215
- position: absolute;
216
- bottom: 0;
217
- box-shadow: 0 6px 20px rgba(0, 0, 0, 0.5), inset 0 -3px 10px rgba(0, 0, 0, 0.2);
218
- }
219
-
220
- .lamp-shade {
221
- width: 140px;
222
- height: 110px;
223
- background: linear-gradient(180deg, #95d4a8, #a8d5ba, #8bc9a8);
224
- clip-path: polygon(22% 0%, 78% 0%, 100% 100%, 0% 100%);
225
- position: absolute;
226
- top: 40px;
227
- border-radius: 10px 10px 0 0;
228
- box-shadow: 0 10px 30px rgba(0, 0, 0, 0.4), inset 0 -15px 40px rgba(255, 255, 255, 0.4);
229
- animation: shadeGlow 3s ease-in-out infinite;
230
- transition: all 0.3s ease;
231
- }
232
-
233
- .lamp-shade.happy {
234
- filter: brightness(1.2);
235
- }
236
-
237
- .lamp-shade.sad {
238
- filter: brightness(0.8);
239
- }
240
-
241
- @keyframes shadeGlow {
242
- 0%, 100% {
243
- box-shadow: 0 10px 30px rgba(0, 0, 0, 0.4), inset 0 -15px 40px rgba(255, 255, 255, 0.4);
244
- filter: brightness(1);
245
- }
246
- 50% {
247
- box-shadow: 0 10px 40px rgba(168, 213, 186, 0.7), inset 0 -15px 50px rgba(255, 255, 255, 0.6);
248
- filter: brightness(1.15);
249
- }
250
- }
251
-
252
- /* Enhanced Lamp Face with expressions */
253
- .lamp-face {
254
- position: absolute;
255
- top: 75px;
256
- width: 140px;
257
- height: 90px;
258
- z-index: 2;
259
- transition: all 0.3s ease;
260
- }
261
-
262
- .lamp-eye {
263
- width: 14px;
264
- height: 20px;
265
- background: #2d3436;
266
- border-radius: 50%;
267
- position: absolute;
268
- top: 20px;
269
- transition: all 0.3s ease;
270
- animation: blink 5s infinite;
271
- }
272
-
273
- .lamp-eye.left {
274
- left: 35px;
275
- }
276
-
277
- .lamp-eye.right {
278
- right: 35px;
279
- }
280
-
281
- .lamp-eye::before {
282
- content: '';
283
- position: absolute;
284
- width: 5px;
285
- height: 5px;
286
- background: #fff;
287
- border-radius: 50%;
288
- top: 4px;
289
- left: 3px;
290
- animation: eyeShine 3s infinite;
291
- }
292
-
293
- @keyframes eyeShine {
294
- 0%, 100% { opacity: 0.8; }
295
- 50% { opacity: 1; }
296
- }
297
-
298
- @keyframes blink {
299
- 0%, 46%, 50%, 100% { height: 20px; }
300
- 48% { height: 2px; }
301
- }
302
-
303
- /* Lamp Tongue (when light is on) */
304
- .lamp-tongue {
305
- position: absolute;
306
- width: 20px;
307
- height: 25px;
308
- background: #ff6b6b;
309
- border-radius: 0 0 10px 10px;
310
- bottom: 15px;
311
- left: 50%;
312
- transform: translateX(-50%) scaleY(0);
313
- transform-origin: top;
314
- opacity: 0;
315
- transition: all 0.3s ease;
316
- }
317
-
318
- .lamp-tongue.show {
319
- transform: translateX(-50%) scaleY(1);
320
- opacity: 1;
321
- animation: tongueWiggle 0.5s ease-in-out;
322
- }
323
-
324
- @keyframes tongueWiggle {
325
- 0%, 100% { transform: translateX(-50%) scaleY(1) rotate(0deg); }
326
- 25% { transform: translateX(-50%) scaleY(1) rotate(-5deg); }
327
- 75% { transform: translateX(-50%) scaleY(1) rotate(5deg); }
328
- }
329
-
330
- .lamp-mouth {
331
- width: 35px;
332
- height: 18px;
333
- border: 3px solid #e74c3c;
334
- border-top: none;
335
- border-radius: 0 0 35px 35px;
336
- position: absolute;
337
- top: 48px;
338
- left: 50%;
339
- transform: translateX(-50%);
340
- transition: all 0.3s ease;
341
- animation: smile 4s ease-in-out infinite;
342
- }
343
-
344
- .lamp-mouth.sad {
345
- border-radius: 35px 35px 0 0;
346
- border-top: 3px solid #e74c3c;
347
- border-bottom: none;
348
- top: 55px;
349
- }
350
-
351
- @keyframes smile {
352
- 0%, 100% { width: 35px; }
353
- 50% { width: 40px; }
354
- }
355
-
356
- .lamp-blush {
357
- width: 22px;
358
- height: 14px;
359
- background: rgba(231, 76, 60, 0.5);
360
- border-radius: 50%;
361
- position: absolute;
362
- top: 40px;
363
- animation: blushPulse 3s ease-in-out infinite;
364
- }
365
-
366
- @keyframes blushPulse {
367
- 0%, 100% { opacity: 0.5; }
368
- 50% { opacity: 0.8; }
369
- }
370
-
371
- .lamp-blush.left {
372
- left: 15px;
373
- }
374
-
375
- .lamp-blush.right {
376
- right: 15px;
377
- }
378
-
379
- /* Enhanced Light glow effect */
380
- .lamp-glow {
381
- position: absolute;
382
- bottom: -50px;
383
- left: 50%;
384
- transform: translateX(-50%);
385
- width: 280px;
386
- height: 280px;
387
- background: radial-gradient(circle, rgba(255, 243, 176, 0.6) 0%, rgba(255, 220, 100, 0.3) 40%, transparent 70%);
388
- border-radius: 50%;
389
- animation: glowPulse 3s ease-in-out infinite;
390
- pointer-events: none;
391
- filter: blur(20px);
392
- }
393
-
394
- @keyframes glowPulse {
395
- 0%, 100% {
396
- opacity: 0.7;
397
- transform: translateX(-50%) scale(1);
398
- }
399
- 50% {
400
- opacity: 1;
401
- transform: translateX(-50%) scale(1.15);
402
- }
403
- }
404
-
405
- /* Enhanced Login Form */
406
- .login-box {
407
- background: linear-gradient(135deg, rgba(40, 50, 70, 0.8), rgba(30, 40, 60, 0.9));
408
- padding: 50px 55px;
409
- border-radius: 25px;
410
- border: 2px solid rgba(76, 209, 55, 0.6);
411
- box-shadow: 0 0 50px rgba(76, 209, 55, 0.4), inset 0 0 30px rgba(0, 0, 0, 0.3);
412
- width: 420px;
413
- backdrop-filter: blur(15px);
414
- position: relative;
415
- overflow: hidden;
416
- }
417
-
418
- .login-box::before {
419
- content: '';
420
- position: absolute;
421
- top: -50%;
422
- left: -50%;
423
- width: 200%;
424
- height: 200%;
425
- background: linear-gradient(45deg, transparent, rgba(76, 209, 55, 0.1), transparent);
426
- animation: shimmer 3s infinite;
427
- }
428
-
429
- @keyframes shimmer {
430
- 0% { transform: translateX(-100%) translateY(-100%) rotate(45deg); }
431
- 100% { transform: translateX(100%) translateY(100%) rotate(45deg); }
432
- }
433
-
434
- .login-box > * {
435
- position: relative;
436
- z-index: 1;
437
- }
438
-
439
- .login-box h2 {
440
- text-align: center;
441
- color: #fff;
442
- font-size: 36px;
443
- margin-bottom: 35px;
444
- font-weight: 700;
445
- text-shadow: 0 4px 10px rgba(0, 0, 0, 0.5);
446
- animation: textGlow 2s ease-in-out infinite;
447
- }
448
-
449
- @keyframes textGlow {
450
- 0%, 100% { text-shadow: 0 4px 10px rgba(0, 0, 0, 0.5); }
451
- 50% { text-shadow: 0 4px 20px rgba(76, 209, 55, 0.5); }
452
- }
453
-
454
- .input-group {
455
- margin-bottom: 28px;
456
- position: relative;
457
- }
458
-
459
- .input-group label {
460
- display: block;
461
- color: #b8c5d8;
462
- font-size: 14px;
463
- margin-bottom: 10px;
464
- font-weight: 600;
465
- letter-spacing: 0.5px;
466
- }
467
-
468
- .input-wrapper {
469
- position: relative;
470
- }
471
-
472
- .input-group input {
473
- width: 100%;
474
- padding: 16px 50px 16px 20px;
475
- background: rgba(20, 30, 50, 0.7);
476
- border: 2px solid rgba(255, 255, 255, 0.1);
477
- border-radius: 12px;
478
- color: #fff;
479
- font-size: 15px;
480
- outline: none;
481
- transition: all 0.4s ease;
482
- font-family: inherit;
483
- }
484
-
485
- .input-group input::placeholder {
486
- color: #6c7a89;
487
- }
488
-
489
- .input-group input:focus {
490
- border-color: #4cd137;
491
- box-shadow: 0 0 20px rgba(76, 209, 55, 0.4), inset 0 0 10px rgba(76, 209, 55, 0.1);
492
- background: rgba(20, 30, 50, 0.9);
493
- transform: translateY(-2px);
494
- }
495
-
496
- .input-group input.error {
497
- border-color: #e74c3c;
498
- animation: shake 0.5s;
499
- }
500
-
501
- @keyframes shake {
502
- 0%, 100% { transform: translateX(0); }
503
- 25% { transform: translateX(-10px); }
504
- 75% { transform: translateX(10px); }
505
- }
506
-
507
- /* Password Toggle Eye */
508
- .toggle-password {
509
- position: absolute;
510
- right: 15px;
511
- top: 50%;
512
- transform: translateY(-50%);
513
- cursor: pointer;
514
- color: #6c7a89;
515
- font-size: 20px;
516
- transition: color 0.3s ease;
517
- user-select: none;
518
- }
519
-
520
- .toggle-password:hover {
521
- color: #4cd137;
522
- }
523
-
524
- /* Social Login Buttons */
525
- .social-login {
526
- display: flex;
527
- gap: 12px;
528
- margin-bottom: 25px;
529
- }
530
-
531
- .social-btn {
532
- flex: 1;
533
- padding: 12px;
534
- border: 2px solid rgba(255, 255, 255, 0.2);
535
- background: rgba(30, 40, 60, 0.6);
536
- border-radius: 10px;
537
- color: #fff;
538
- cursor: pointer;
539
- transition: all 0.3s ease;
540
- display: flex;
541
- align-items: center;
542
- justify-content: center;
543
- gap: 8px;
544
- font-size: 14px;
545
- font-weight: 600;
546
- }
547
-
548
- .social-btn:hover {
549
- transform: translateY(-3px);
550
- border-color: #4cd137;
551
- box-shadow: 0 5px 15px rgba(76, 209, 55, 0.3);
552
- }
553
-
554
- .divider {
555
- text-align: center;
556
- margin: 25px 0;
557
- color: #6c7a89;
558
- position: relative;
559
- }
560
-
561
- .divider::before,
562
- .divider::after {
563
- content: '';
564
- position: absolute;
565
- top: 50%;
566
- width: 40%;
567
- height: 1px;
568
- background: rgba(255, 255, 255, 0.1);
569
- }
570
-
571
- .divider::before {
572
- left: 0;
573
- }
574
-
575
- .divider::after {
576
- right: 0;
577
- }
578
-
579
- .login-btn {
580
- width: 100%;
581
- padding: 17px;
582
- background: linear-gradient(135deg, #4cd137, #44bd32, #3da82a);
583
- background-size: 200% auto;
584
- border: none;
585
- border-radius: 12px;
586
- color: #fff;
587
- font-size: 18px;
588
- font-weight: 700;
589
- cursor: pointer;
590
- transition: all 0.4s ease;
591
- box-shadow: 0 6px 25px rgba(76, 209, 55, 0.5);
592
- margin-top: 12px;
593
- position: relative;
594
- overflow: hidden;
595
- letter-spacing: 1px;
596
- }
597
-
598
- .login-btn::before {
599
- content: '';
600
- position: absolute;
601
- top: 0;
602
- left: -100%;
603
- width: 100%;
604
- height: 100%;
605
- background: linear-gradient(90deg, transparent, rgba(255, 255, 255, 0.3), transparent);
606
- transition: left 0.5s;
607
- }
608
-
609
- .login-btn:hover::before {
610
- left: 100%;
611
- }
612
-
613
- .login-btn:hover {
614
- transform: translateY(-4px);
615
- box-shadow: 0 10px 30px rgba(76, 209, 55, 0.7);
616
- background-position: right center;
617
- }
618
-
619
- .login-btn:active {
620
- transform: translateY(-2px);
621
- }
622
-
623
- .login-btn.loading {
624
- pointer-events: none;
625
- opacity: 0.8;
626
- }
627
-
628
- .login-btn.loading::after {
629
- content: '';
630
- position: absolute;
631
- width: 20px;
632
- height: 20px;
633
- border: 3px solid rgba(255, 255, 255, 0.3);
634
- border-top-color: #fff;
635
- border-radius: 50%;
636
- animation: spin 0.8s linear infinite;
637
- top: 50%;
638
- left: 50%;
639
- transform: translate(-50%, -50%);
640
- }
641
-
642
- @keyframes spin {
643
- to { transform: translate(-50%, -50%) rotate(360deg); }
644
- }
645
-
646
- .forgot-password {
647
- text-align: center;
648
- margin-top: 22px;
649
- }
650
-
651
- .forgot-password a {
652
- color: #7c8a9e;
653
- text-decoration: none;
654
- font-size: 14px;
655
- transition: all 0.3s ease;
656
- position: relative;
657
- }
658
-
659
- .forgot-password a::after {
660
- content: '';
661
- position: absolute;
662
- bottom: -2px;
663
- left: 0;
664
- width: 0;
665
- height: 2px;
666
- background: #4cd137;
667
- transition: width 0.3s ease;
668
- }
669
-
670
- .forgot-password a:hover {
671
- color: #4cd137;
672
- }
673
-
674
- .forgot-password a:hover::after {
675
- width: 100%;
676
- }
677
-
678
- /* Toast Notification */
679
- .toast {
680
- position: fixed;
681
- top: 30px;
682
- right: 30px;
683
- background: linear-gradient(135deg, rgba(76, 209, 55, 0.95), rgba(68, 189, 50, 0.95));
684
- color: #fff;
685
- padding: 18px 28px;
686
- border-radius: 12px;
687
- box-shadow: 0 10px 30px rgba(0, 0, 0, 0.5);
688
- z-index: 1000;
689
- transform: translateX(400px);
690
- opacity: 0;
691
- transition: all 0.4s cubic-bezier(0.68, -0.55, 0.265, 1.55);
692
- display: flex;
693
- align-items: center;
694
- gap: 12px;
695
- font-weight: 600;
696
- backdrop-filter: blur(10px);
697
- }
698
-
699
- .toast.show {
700
- transform: translateX(0);
701
- opacity: 1;
702
- }
703
-
704
- .toast.error {
705
- background: linear-gradient(135deg, rgba(231, 76, 60, 0.95), rgba(192, 57, 43, 0.95));
706
- }
707
-
708
- .toast-icon {
709
- font-size: 24px;
710
- }
711
-
712
- /* Code Display Section */
713
- .code-section {
714
- margin-top: 60px;
715
- width: 100%;
716
- max-width: 1200px;
717
- z-index: 2;
718
- animation: fadeIn 1.5s ease 1s backwards;
719
- }
720
-
721
- .code-header {
722
- text-align: center;
723
- margin-bottom: 30px;
724
- }
725
-
726
- .code-header h3 {
727
- font-size: 28px;
728
- color: #ffa500;
729
- margin-bottom: 10px;
730
- text-shadow: 0 0 20px rgba(255, 165, 0, 0.5);
731
- }
732
-
733
- .code-header p {
734
- color: #b0b8c8;
735
- font-size: 16px;
736
- }
737
-
738
- .code-display {
739
- display: grid;
740
- grid-template-columns: repeat(auto-fit, minmax(450px, 1fr));
741
- gap: 25px;
742
- padding: 0 20px;
743
- }
744
-
745
- .code-block {
746
- background: rgba(20, 25, 35, 0.9);
747
- border: 1px solid rgba(76, 209, 55, 0.3);
748
- border-radius: 15px;
749
- padding: 25px;
750
- position: relative;
751
- overflow: hidden;
752
- backdrop-filter: blur(10px);
753
- box-shadow: 0 8px 25px rgba(0, 0, 0, 0.4);
754
- transition: all 0.3s ease;
755
- }
756
-
757
- .code-block:hover {
758
- transform: translateY(-5px);
759
- box-shadow: 0 12px 35px rgba(76, 209, 55, 0.3);
760
- border-color: #4cd137;
761
- }
762
-
763
- .code-block::before {
764
- content: 'style.css';
765
- position: absolute;
766
- top: 0;
767
- left: 0;
768
- background: rgba(76, 209, 55, 0.2);
769
- padding: 6px 15px;
770
- font-size: 12px;
771
- color: #4cd137;
772
- border-radius: 0 0 10px 0;
773
- font-family: 'Courier New', monospace;
774
- }
775
-
776
- .code-block pre {
777
- margin-top: 30px;
778
- color: #a8b2d1;
779
- font-family: 'Courier New', monospace;
780
- font-size: 13px;
781
- line-height: 1.6;
782
- overflow-x: auto;
783
- }
784
-
785
- .code-block pre code {
786
- display: block;
787
- }
788
-
789
- .keyword { color: #c792ea; }
790
- .property { color: #82aaff; }
791
- .value { color: #c3e88d; }
792
- .important { color: #ff6b6b; }
793
- .comment { color: #676e95; font-style: italic; }
794
-
795
- /* Responsive */
796
- @media (max-width: 1200px) {
797
- .container {
798
- gap: 50px;
799
- padding: 50px 40px;
800
- }
801
-
802
- .code-display {
803
- grid-template-columns: 1fr;
804
- }
805
- }
806
-
807
- @media (max-width: 1024px) {
808
- .container {
809
- flex-direction: column;
810
- gap: 40px;
811
- padding: 40px 30px;
812
- }
813
-
814
- .title {
815
- font-size: 42px;
816
- }
817
-
818
- .lamp-section {
819
- width: 250px;
820
- height: 350px;
821
- }
822
- }
823
-
824
- @media (max-width: 600px) {
825
- .title {
826
- font-size: 32px;
827
- margin-bottom: 30px;
828
- }
829
-
830
- .container {
831
- padding: 30px 20px;
832
- margin: 20px;
833
- }
834
-
835
- .login-box {
836
- width: 100%;
837
- padding: 35px 25px;
838
- }
839
-
840
- .lamp {
841
- transform: scale(0.75);
842
- }
843
-
844
- .social-login {
845
- flex-direction: column;
846
- }
847
-
848
- .code-display {
849
- padding: 0;
850
- }
851
-
852
- .code-block {
853
- padding: 20px 15px;
854
- }
855
-
856
- .code-block pre {
857
- font-size: 11px;
858
- }
859
- }
860
- </style>
861
- </head>
862
- <body>
863
- <!-- Animated particles -->
864
- <div class="particles" id="particles"></div>
865
-
866
- <!-- Title -->
867
- <h1 class="title">✨ Cute Lamp Login ✨</h1>
868
-
869
- <!-- Main Container -->
870
- <div class="container">
871
- <!-- Enhanced Lamp Section -->
872
- <div class="lamp-section">
873
- <div class="lamp-glow"></div>
874
- <div class="lamp-container" id="lampContainer">
875
- <div class="lamp" id="lamp">
876
- <div class="cord">
877
- <div class="cord-plug"></div>
878
- </div>
879
- <div class="lamp-shade" id="lampShade"></div>
880
- <div class="lamp-face" id="lampFace">
881
- <div class="lamp-eye left" id="leftEye"></div>
882
- <div class="lamp-eye right" id="rightEye"></div>
883
- <div class="lamp-mouth" id="lampMouth"></div>
884
- <div class="lamp-tongue" id="lampTongue"></div>
885
- <div class="lamp-blush left"></div>
886
- <div class="lamp-blush right"></div>
887
- </div>
888
- <div class="lamp-stand"></div>
889
- <div class="lamp-base"></div>
890
- </div>
891
- </div>
892
- </div>
893
-
894
- <!-- Enhanced Login Form -->
895
- <div class="login-box">
896
- <h2>Welcome Back</h2>
897
-
898
- <!-- Social Login -->
899
- <div class="social-login">
900
- <button class="social-btn" onclick="socialLogin('Google')">
901
- <span>🔍</span>
902
- <span>Google</span>
903
- </button>
904
- <button class="social-btn" onclick="socialLogin('GitHub')">
905
- <span>💻</span>
906
- <span>GitHub</span>
907
- </button>
908
- </div>
909
-
910
- <div class="divider">OR</div>
911
-
912
- <form id="loginForm" onsubmit="handleLogin(event)">
913
- <div class="input-group">
914
- <label for="username">Username</label>
915
- <div class="input-wrapper">
916
- <input type="text" id="username" placeholder="Enter your username" required>
917
- </div>
918
- </div>
919
- <div class="input-group">
920
- <label for="password">Password</label>
921
- <div class="input-wrapper">
922
- <input type="password" id="password" placeholder="Enter your password" required>
923
- <span class="toggle-password" id="togglePassword" onclick="togglePassword()">👁️</span>
924
- </div>
925
- </div>
926
- <button type="submit" class="login-btn" id="loginBtn">Login</button>
927
- </form>
928
- <div class="forgot-password">
929
- <a href="#" onclick="forgotPassword(); return false;">Forgot Password?</a>
930
- </div>
931
- </div>
932
- </div>
933
-
934
- <!-- Code Display Section -->
935
- <div class="code-section">
936
- <div class="code-header">
937
- <h3>💻 Comment "cute" for code</h3>
938
- <p>Here's a peek at the magic behind this adorable login page</p>
939
- </div>
940
- <div class="code-display">
941
- <div class="code-block">
942
- <pre><code><span class="keyword">.lamp</span> {
943
- <span class="property">display</span>: <span class="value">flex</span>;
944
- <span class="property">height</span>: <span class="value">320px</span>;
945
- <span class="property">overflow</span>: <span class="value">visible</span> <span class="important">!important</span>;
946
- }
947
-
948
- <span class="keyword">.cord</span> {
949
- <span class="property">stroke</span>: <span class="value">var(--cord)</span>;
950
- }
951
-
952
- <span class="keyword">.cord--nip</span> {
953
- <span class="property">display</span>: <span class="value">none</span>;
954
- }
955
-
956
- <span class="keyword">.lamp__tongue</span> {
957
- <span class="property">fill</span>: <span class="value">var(--tongue)</span>;
958
- }</code></pre>
959
- </div>
960
-
961
- <div class="code-block">
962
- <pre><code><span class="keyword">.login-btn:active</span> {
963
- <span class="property">transform</span>: <span class="value">translateY(0px)</span>;
964
- }
965
-
966
- <span class="keyword">.form-footer</span> {
967
- <span class="property">margin-top</span>: <span class="value">1.5rem</span>;
968
- <span class="property">text-align</span>: <span class="value">center</span>;
969
- }
970
-
971
- <span class="keyword">.forgot-link</span> {
972
- <span class="property">color</span>: <span class="value">#888</span>;
973
- <span class="property">font-size</span>: <span class="value">0.9rem</span>;
974
- <span class="property">text-decoration</span>: <span class="value">none</span>;
975
- <span class="property">transition</span>: <span class="value">all 0.3s ease</span>;
976
- }</code></pre>
977
- </div>
978
- </div>
979
- </div>
980
-
981
- <!-- Toast Notification -->
982
- <div class="toast" id="toast">
983
- <span class="toast-icon" id="toastIcon">✨</span>
984
- <span id="toastMessage">Welcome!</span>
985
- </div>
986
-
987
- <script>
988
- // Enhanced Particle System
989
- const particlesContainer = document.getElementById('particles');
990
-
991
- function createParticles() {
992
- for (let i = 0; i < 40; i++) {
993
- const particle = document.createElement('div');
994
- particle.className = 'particle';
995
- particle.style.left = Math.random() * 100 + '%';
996
- particle.style.setProperty('--tx', (Math.random() - 0.5) * 200 + 'px');
997
- particle.style.animationDelay = Math.random() * 15 + 's';
998
- particle.style.animationDuration = (10 + Math.random() * 10) + 's';
999
- particlesContainer.appendChild(particle);
1000
- }
1001
-
1002
- // Add sparkles
1003
- for (let i = 0; i < 20; i++) {
1004
- const sparkle = document.createElement('div');
1005
- sparkle.className = 'sparkle';
1006
- sparkle.style.left = Math.random() * 100 + '%';
1007
- sparkle.style.top = Math.random() * 100 + '%';
1008
- sparkle.style.animationDelay = Math.random() * 3 + 's';
1009
- particlesContainer.appendChild(sparkle);
1010
- }
1011
- }
1012
-
1013
- createParticles();
1014
-
1015
- // Lamp Elements
1016
- const lamp = document.getElementById('lamp');
1017
- const lampShade = document.getElementById('lampShade');
1018
- const lampFace = document.getElementById('lampFace');
1019
- const lampMouth = document.getElementById('lampMouth');
1020
- const lampTongue = document.getElementById('lampTongue');
1021
- const leftEye = document.getElementById('leftEye');
1022
- const rightEye = document.getElementById('rightEye');
1023
- const lampContainer = document.getElementById('lampContainer');
1024
-
1025
- // Form Elements
1026
- const loginForm = document.getElementById('loginForm');
1027
- const usernameInput = document.getElementById('username');
1028
- const passwordInput = document.getElementById('password');
1029
- const loginBtn = document.getElementById('loginBtn');
1030
- const toast = document.getElementById('toast');
1031
- const toastIcon = document.getElementById('toastIcon');
1032
- const toastMessage = document.getElementById('toastMessage');
1033
-
1034
- // Lamp Expressions
1035
- function setLampExpression(expression) {
1036
- lampShade.classList.remove('happy', 'sad');
1037
- lampMouth.classList.remove('sad');
1038
- lampTongue.classList.remove('show');
1039
-
1040
- switch(expression) {
1041
- case 'happy':
1042
- lampShade.classList.add('happy');
1043
- lampTongue.classList.add('show');
1044
- leftEye.style.background = '#4cd137';
1045
- rightEye.style.background = '#4cd137';
1046
- break;
1047
- case 'sad':
1048
- lampShade.classList.add('sad');
1049
- lampMouth.classList.add('sad');
1050
- leftEye.style.background = '#3498db';
1051
- rightEye.style.background = '#3498db';
1052
- break;
1053
- case 'neutral':
1054
- leftEye.style.background = '#2d3436';
1055
- rightEye.style.background = '#2d3436';
1056
- break;
1057
- }
1058
- }
1059
-
1060
- // Eye following cursor
1061
- let isFollowingCursor = true;
1062
-
1063
- document.addEventListener('mousemove', (e) => {
1064
- if (!isFollowingCursor) return;
1065
-
1066
- const lampRect = lamp.getBoundingClientRect();
1067
- const lampCenterX = lampRect.left + lampRect.width / 2;
1068
- const lampCenterY = lampRect.top + lampRect.height / 2;
1069
-
1070
- const angle = Math.atan2(e.clientY - lampCenterY, e.clientX - lampCenterX);
1071
- const distance = Math.min(3, Math.hypot(e.clientX - lampCenterX, e.clientY - lampCenterY) / 100);
1072
-
1073
- const moveX = Math.cos(angle) * distance;
1074
- const moveY = Math.sin(angle) * distance;
1075
-
1076
- leftEye.style.transform = `translate(${moveX}px, ${moveY}px)`;
1077
- rightEye.style.transform = `translate(${moveX}px, ${moveY}px)`;
1078
- });
1079
-
1080
- // Input Focus Effects
1081
- const inputs = [usernameInput, passwordInput];
1082
-
1083
- inputs.forEach(input => {
1084
- input.addEventListener('focus', () => {
1085
- setLampExpression('happy');
1086
- isFollowingCursor = false;
1087
- });
1088
-
1089
- input.addEventListener('blur', () => {
1090
- if (!usernameInput.value && !passwordInput.value) {
1091
- setLampExpression('neutral');
1092
- isFollowingCursor = true;
1093
- }
1094
- });
1095
-
1096
- input.addEventListener('input', () => {
1097
- if (input.classList.contains('error')) {
1098
- input.classList.remove('error');
1099
- setLampExpression('happy');
1100
- }
1101
- });
1102
- });
1103
-
1104
- // Toast Notification Function
1105
- function showToast(message, type = 'success') {
1106
- toast.className = 'toast';
1107
- if (type === 'error') {
1108
- toast.classList.add('error');
1109
- toastIcon.textContent = '❌';
1110
- } else {
1111
- toastIcon.textContent = '✨';
1112
- }
1113
-
1114
- toastMessage.textContent = message;
1115
-
1116
- setTimeout(() => {
1117
- toast.classList.add('show');
1118
- }, 100);
1119
-
1120
- setTimeout(() => {
1121
- toast.classList.remove('show');
1122
- }, 3000);
1123
- }
1124
-
1125
- // Password Toggle
1126
- function togglePassword() {
1127
- const type = passwordInput.type === 'password' ? 'text' : 'password';
1128
- passwordInput.type = type;
1129
- document.getElementById('togglePassword').textContent = type === 'password' ? '👁️' : '🙈';
1130
- }
1131
-
1132
- // Form Validation
1133
- function validateForm() {
1134
- let isValid = true;
1135
-
1136
- if (usernameInput.value.trim().length < 3) {
1137
- usernameInput.classList.add('error');
1138
- isValid = false;
1139
- }
1140
-
1141
- if (passwordInput.value.trim().length < 6) {
1142
- passwordInput.classList.add('error');
1143
- isValid = false;
1144
- }
1145
-
1146
- if (!isValid) {
1147
- setLampExpression('sad');
1148
- showToast('Please check your credentials! 😢', 'error');
1149
- }
1150
-
1151
- return isValid;
1152
- }
1153
-
1154
- // Handle Login
1155
- function handleLogin(e) {
1156
- e.preventDefault();
1157
-
1158
- if (!validateForm()) {
1159
- return;
1160
- }
1161
-
1162
- // Show loading state
1163
- loginBtn.classList.add('loading');
1164
- loginBtn.textContent = '';
1165
- setLampExpression('happy');
1166
-
1167
- // Simulate API call
1168
- setTimeout(() => {
1169
- loginBtn.classList.remove('loading');
1170
- loginBtn.textContent = 'Login';
1171
-
1172
- const username = usernameInput.value;
1173
- showToast(`Welcome back, ${username}! 🎉`, 'success');
1174
-
1175
- // Reset form after success
1176
- setTimeout(() => {
1177
- loginForm.reset();
1178
- setLampExpression('neutral');
1179
- isFollowingCursor = true;
1180
- }, 2000);
1181
- }, 2000);
1182
- }
1183
-
1184
- // Social Login
1185
- function socialLogin(platform) {
1186
- setLampExpression('happy');
1187
- showToast(`Logging in with ${platform}... 🚀`, 'success');
1188
-
1189
- setTimeout(() => {
1190
- showToast(`${platform} login successful! 🎊`, 'success');
1191
- }, 1500);
1192
- }
1193
-
1194
- // Forgot Password
1195
- function forgotPassword() {
1196
- setLampExpression('sad');
1197
- showToast('Password reset link sent to your email! 📧', 'success');
1198
-
1199
- setTimeout(() => {
1200
- setLampExpression('neutral');
1201
- }, 2000);
1202
- }
1203
-
1204
- // Lamp Click Interaction
1205
- lampContainer.addEventListener('click', () => {
1206
- setLampExpression('happy');
1207
- lampContainer.style.transform = 'scale(1.1)';
1208
-
1209
- setTimeout(() => {
1210
- lampContainer.style.transform = 'scale(1)';
1211
- }, 300);
1212
-
1213
- setTimeout(() => {
1214
- if (!usernameInput.value && !passwordInput.value) {
1215
- setLampExpression('neutral');
1216
- }
1217
- }, 2000);
1218
- });
1219
-
1220
- // Welcome Animation
1221
- window.addEventListener('load', () => {
1222
- setTimeout(() => {
1223
- showToast('Hello! Ready to login? 👋', 'success');
1224
- }, 1000);
1225
- });
1226
-
1227
- // Easter Egg: Konami Code
1228
- let konamiCode = [];
1229
- const konamiSequence = ['ArrowUp', 'ArrowUp', 'ArrowDown', 'ArrowDown', 'ArrowLeft', 'ArrowRight', 'ArrowLeft', 'ArrowRight', 'b', 'a'];
1230
-
1231
- document.addEventListener('keydown', (e) => {
1232
- konamiCode.push(e.key);
1233
- konamiCode = konamiCode.slice(-10);
1234
-
1235
- if (konamiCode.join(',') === konamiSequence.join(',')) {
1236
- lampShade.style.background = 'linear-gradient(180deg, #ff6b9d, #c44569)';
1237
- showToast('🎉 Rainbow Lamp Mode Activated! 🌈', 'success');
1238
-
1239
- let hue = 0;
1240
- const rainbowInterval = setInterval(() => {
1241
- lampShade.style.background = `hsl(${hue}, 70%, 60%)`;
1242
- hue = (hue + 5) % 360;
1243
- }, 100);
1244
-
1245
- setTimeout(() => {
1246
- clearInterval(rainbowInterval);
1247
- lampShade.style.background = '';
1248
- showToast('Back to normal! ✨', 'success');
1249
- }, 5000);
1250
- }
1251
- });
1252
-
1253
- // Keyboard shortcuts
1254
- document.addEventListener('keydown', (e) => {
1255
- // Ctrl/Cmd + Enter to submit
1256
- if ((e.ctrlKey || e.metaKey) && e.key === 'Enter') {
1257
- if (usernameInput.value || passwordInput.value) {
1258
- loginForm.dispatchEvent(new Event('submit'));
1259
- }
1260
- }
1261
- });
1262
-
1263
- // Auto-focus username on load
1264
- window.addEventListener('load', () => {
1265
- setTimeout(() => {
1266
- usernameInput.focus();
1267
- }, 500);
1268
- });
1269
-
1270
- // Add accessibility: ESC to clear form
1271
- document.addEventListener('keydown', (e) => {
1272
- if (e.key === 'Escape') {
1273
- loginForm.reset();
1274
- setLampExpression('neutral');
1275
- isFollowingCursor = true;
1276
- showToast('Form cleared! 🧹', 'success');
1277
- }
1278
- });
1279
- </script>
1280
- </body>
1281
- </html>
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
render.yaml DELETED
@@ -1,37 +0,0 @@
1
- services:
2
- - type: web
3
- name: data-science-agent
4
- runtime: docker
5
- plan: free # Change to 'starter' or higher for production
6
- region: oregon # Change to your preferred region
7
- branch: main
8
- dockerfilePath: ./Dockerfile
9
- envVars:
10
- - key: LLM_PROVIDER
11
- value: gemini
12
- - key: GOOGLE_API_KEY
13
- sync: false # Mark as secret - add via Render dashboard
14
- - key: GEMINI_MODEL
15
- value: gemini-2.5-flash
16
- - key: REASONING_EFFORT
17
- value: medium
18
- - key: CACHE_DB_PATH
19
- value: /tmp/cache_db/cache.db
20
- - key: CACHE_TTL_SECONDS
21
- value: 86400
22
- - key: OUTPUT_DIR
23
- value: /tmp/outputs
24
- - key: DATA_DIR
25
- value: /tmp/data
26
- - key: MAX_PARALLEL_TOOLS
27
- value: 5
28
- - key: MAX_RETRIES
29
- value: 3
30
- - key: TIMEOUT_SECONDS
31
- value: 300
32
- - key: PORT
33
- value: 8080
34
- - key: ARTIFACT_BACKEND
35
- value: local
36
- healthCheckPath: /api/health
37
- autoDeploy: true
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
requirements.txt CHANGED
@@ -16,6 +16,11 @@ lightgbm>=4.6.0
16
  catboost>=1.2.8
17
  optuna>=3.5.0
18
 
 
 
 
 
 
19
  # Explainability
20
  shap>=0.44.1
21
 
@@ -33,6 +38,7 @@ plotly>=5.18.0 # Interactive visualizations
33
 
34
  # EDA Report Generation
35
  ydata-profiling>=4.17.0 # Comprehensive automated EDA reports with Python 3.13 compatibility
 
36
 
37
  # User Interface
38
  # gradio>=5.49.1 # Replaced with React frontend
@@ -44,14 +50,18 @@ python-multipart>=0.0.6 # For file uploads
44
 
45
  # Text Processing
46
  textblob>=0.17.1
 
47
 
48
  # Time Series Forecasting
49
  prophet>=1.1.5
50
  holidays>=0.38
 
51
 
52
  # MLOps & Explainability
53
  lime==0.2.0.1
54
  fairlearn==0.10.0
 
 
55
 
56
  # NLP & Semantic Layer (REQUIRED for column understanding and agent routing)
57
  sentence-transformers>=2.2.2 # For semantic column embeddings and agent routing
@@ -74,6 +84,12 @@ Pillow==10.1.0 # For basic image processing
74
  # These are optional but add specialized capabilities
75
  # lifetimes==0.11.3 # For customer lifetime value modeling
76
  # econml==0.15.0 # For advanced causal inference
 
 
 
 
 
 
77
 
78
  # CLI & UI
79
  typer==0.9.0
 
16
  catboost>=1.2.8
17
  optuna>=3.5.0
18
 
19
+ # AutoGluon AutoML (modular install - only tabular + timeseries)
20
+ autogluon.tabular>=1.2
21
+ autogluon.timeseries>=1.2
22
+ holidays>=0.40 # Holiday calendar for time series covariates
23
+
24
  # Explainability
25
  shap>=0.44.1
26
 
 
38
 
39
  # EDA Report Generation
40
  ydata-profiling>=4.17.0 # Comprehensive automated EDA reports with Python 3.13 compatibility
41
+ sweetviz>=2.3.0 # Interactive EDA with comparison support
42
 
43
  # User Interface
44
  # gradio>=5.49.1 # Replaced with React frontend
 
50
 
51
  # Text Processing
52
  textblob>=0.17.1
53
+ vaderSentiment>=3.3.2 # Rule-based sentiment analysis (fast, no GPU needed)
54
 
55
  # Time Series Forecasting
56
  prophet>=1.1.5
57
  holidays>=0.38
58
+ pmdarima>=2.0 # Auto ARIMA (auto_arima) for optimal order selection
59
 
60
  # MLOps & Explainability
61
  lime==0.2.0.1
62
  fairlearn==0.10.0
63
+ evidently>=0.4.0 # Production-grade data drift detection & monitoring
64
+ dtreeviz>=2.2 # Decision tree visualization
65
 
66
  # NLP & Semantic Layer (REQUIRED for column understanding and agent routing)
67
  sentence-transformers>=2.2.2 # For semantic column embeddings and agent routing
 
84
  # These are optional but add specialized capabilities
85
  # lifetimes==0.11.3 # For customer lifetime value modeling
86
  # econml==0.15.0 # For advanced causal inference
87
+ dowhy>=0.11 # Formal causal inference with DAG-based reasoning
88
+
89
+ # Data Quality & Validation
90
+ cleanlab>=2.6 # Label error detection using confident learning
91
+ pandera>=0.18 # Schema-based DataFrame validation
92
+ boruta>=0.3 # All-relevant feature selection (BorutaPy)
93
 
94
  # CLI & UI
95
  typer==0.9.0
src/api/app.py CHANGED
@@ -383,10 +383,23 @@ async def stream_progress(session_id: str):
383
  print(f"[SSE] SENDING connection event to client")
384
  yield f"data: {safe_json_dumps(connection_event)}\n\n"
385
 
386
- # DON'T replay history - causes duplicate results when reconnecting
387
- # Each new query should only show events from that query, not previous ones
388
- # History is only useful for debugging, not for client display
389
- print(f"[SSE] Skipping history replay (follow-up query should show fresh events)")
 
 
 
 
 
 
 
 
 
 
 
 
 
390
 
391
  print(f"[SSE] Starting event stream loop for session {session_id}")
392
 
 
383
  print(f"[SSE] SENDING connection event to client")
384
  yield f"data: {safe_json_dumps(connection_event)}\n\n"
385
 
386
+ # 🔥 FIX: Replay any events that were emitted BEFORE this subscriber connected
387
+ # This handles the race condition where background analysis starts emitting events
388
+ # before the frontend's SSE reconnection completes
389
+ history = progress_manager.get_history(session_id)
390
+ if history:
391
+ print(f"[SSE] Replaying {len(history)} missed events for late-joining subscriber")
392
+ for past_event in history:
393
+ # Don't replay if it's already a terminal event
394
+ if past_event.get('type') != 'analysis_complete':
395
+ yield f"data: {safe_json_dumps(past_event)}\n\n"
396
+ else:
397
+ # If analysis already completed before we connected, send it and close
398
+ yield f"data: {safe_json_dumps(past_event)}\n\n"
399
+ print(f"[SSE] Analysis already completed before subscriber connected - closing")
400
+ return
401
+ else:
402
+ print(f"[SSE] No history to replay (fresh session)")
403
 
404
  print(f"[SSE] Starting event stream loop for session {session_id}")
405
 
src/orchestrator.py CHANGED
@@ -39,6 +39,7 @@ from .tools import (
39
  profile_dataset,
40
  detect_data_quality_issues,
41
  analyze_correlations,
 
42
  get_smart_summary, # NEW
43
  clean_missing_values,
44
  handle_outliers,
@@ -49,6 +50,16 @@ from .tools import (
49
  encode_categorical,
50
  train_baseline_models,
51
  generate_model_report,
 
 
 
 
 
 
 
 
 
 
52
  # Data Wrangling Tools (3) - NEW
53
  merge_datasets,
54
  concat_datasets,
@@ -86,12 +97,14 @@ from .tools import (
86
  perform_named_entity_recognition,
87
  analyze_sentiment_advanced,
88
  perform_text_similarity,
89
- # Production/MLOps (5)
90
  monitor_model_drift,
91
  explain_predictions,
92
  generate_model_card,
93
  perform_ab_test_analysis,
94
  detect_feature_leakage,
 
 
95
  # Time Series (3)
96
  forecast_time_series,
97
  detect_seasonality_trends,
@@ -119,8 +132,9 @@ from .tools import (
119
  generate_interactive_box_plots,
120
  generate_interactive_time_series,
121
  generate_plotly_dashboard,
122
- # EDA Report Generation (1) - NEW PHASE 2
123
  generate_ydata_profiling_report,
 
124
  # Code Interpreter (2) - NEW PHASE 2 - TRUE AI AGENT CAPABILITY
125
  execute_python_code,
126
  execute_code_from_file,
@@ -373,6 +387,7 @@ class DataScienceCopilot:
373
  "profile_dataset": profile_dataset,
374
  "detect_data_quality_issues": detect_data_quality_issues,
375
  "analyze_correlations": analyze_correlations,
 
376
  "get_smart_summary": get_smart_summary, # NEW
377
  "clean_missing_values": clean_missing_values,
378
  "handle_outliers": handle_outliers,
@@ -383,6 +398,16 @@ class DataScienceCopilot:
383
  "encode_categorical": encode_categorical,
384
  "train_baseline_models": train_baseline_models,
385
  "generate_model_report": generate_model_report,
 
 
 
 
 
 
 
 
 
 
386
  # Data Wrangling Tools (3) - NEW
387
  "merge_datasets": merge_datasets,
388
  "concat_datasets": concat_datasets,
@@ -420,12 +445,14 @@ class DataScienceCopilot:
420
  "perform_named_entity_recognition": perform_named_entity_recognition,
421
  "analyze_sentiment_advanced": analyze_sentiment_advanced,
422
  "perform_text_similarity": perform_text_similarity,
423
- # Production/MLOps (5)
424
  "monitor_model_drift": monitor_model_drift,
425
  "explain_predictions": explain_predictions,
426
  "generate_model_card": generate_model_card,
427
  "perform_ab_test_analysis": perform_ab_test_analysis,
428
  "detect_feature_leakage": detect_feature_leakage,
 
 
429
  # Time Series (3)
430
  "forecast_time_series": forecast_time_series,
431
  "detect_seasonality_trends": detect_seasonality_trends,
@@ -453,8 +480,9 @@ class DataScienceCopilot:
453
  "generate_interactive_box_plots": generate_interactive_box_plots,
454
  "generate_interactive_time_series": generate_interactive_time_series,
455
  "generate_plotly_dashboard": generate_plotly_dashboard,
456
- # EDA Report Generation (1) - NEW PHASE 2
457
  "generate_ydata_profiling_report": generate_ydata_profiling_report,
 
458
  # Code Interpreter (2) - NEW PHASE 2 - TRUE AI AGENT CAPABILITY
459
  "execute_python_code": execute_python_code,
460
  "execute_code_from_file": execute_code_from_file,
@@ -677,7 +705,17 @@ structure, variable relationships, and expected insights - not hardcoded domain
677
  7. **IF DATETIME COLUMNS EXIST**: create_time_features(latest, date_col="<column_name>", output="./outputs/data/time_features.csv") - Extract year/month/day/hour/weekday/timestamp from each datetime column
678
  8. encode_categorical(latest, method="auto", output="./outputs/data/encoded.csv")
679
  9. generate_eda_plots(encoded, target_col, output_dir="./outputs/plots/eda") - Generate EDA visualizations
680
- 10. **ONLY IF USER EXPLICITLY REQUESTED ML**: train_baseline_models(encoded, target_col, task_type="auto")
 
 
 
 
 
 
 
 
 
 
681
  10b. **ALWAYS AFTER MODEL TRAINING**: generate_ydata_profiling_report(encoded, output_path="./outputs/reports/ydata_profile.html") - Comprehensive data analysis report
682
  11. **HYPERPARAMETER TUNING (⚠️ ONLY WHEN EXPLICITLY REQUESTED)**:
683
  - ⚠️ **CRITICAL WARNING**: This is EXTREMELY expensive (5-10 minutes) and resource-intensive!
@@ -842,7 +880,11 @@ Use specialized tools FIRST. Only use execute_python_code for:
842
  - ❌ Missing values → USE clean_missing_values() tool
843
  - ❌ Outliers → USE handle_outliers() tool
844
  - ❌ Standard EDA plots → USE generate_eda_plots() or generate_plotly_dashboard()
845
- - ❌ Model training → USE train_baseline_models() or hyperparameter_tuning()
 
 
 
 
846
  - ❌ Tasks with dedicated tools → USE THE TOOL, NOT custom code!
847
 
848
  **Rule of Thumb:**
@@ -854,7 +896,15 @@ Use specialized tools FIRST. Only use execute_python_code for:
854
  - force_numeric_conversion: Converts string columns to numeric (auto-detects, skips text)
855
  - clean_missing_values: "auto" mode supported
856
  - encode_categorical: one-hot/target/frequency encoding
857
- - train_baseline_models: Trains multiple models automatically
 
 
 
 
 
 
 
 
858
  - **⭐ execute_python_code**: Write and run custom Python code for ANY task not covered by tools (TRUE AI AGENT capability)
859
  - **execute_code_from_file**: Run existing Python scripts
860
  - Advanced: hyperparameter_tuning, perform_eda_analysis, handle_imbalanced_data, perform_feature_scaling, detect_anomalies, detect_and_handle_multicollinearity, auto_feature_engineering, forecast_time_series, explain_predictions, generate_business_insights, perform_topic_modeling, extract_image_features, monitor_model_drift
@@ -941,7 +991,7 @@ When you've finished all tool executions and are ready to return the final respo
941
  - Were there any interesting correlations or anomalies?
942
  3. **Model performance** (if trained) - **CRITICAL: YOU MUST INCLUDE THESE METRICS**:
943
  - **ALWAYS extract and display** the exact metrics from tool results:
944
- - R² Score, RMSE, MAE from the train_baseline_models results
945
  - List ALL models trained (not just the best one)
946
  - Example: "Trained 6 models: XGBoost (R²=0.713, RMSE=0.207), Random Forest (R²=0.685, RMSE=0.218), etc."
947
  - If hyperparameter tuning was done, show before/after comparison
@@ -1021,13 +1071,15 @@ You work collaboratively with other specialists and hand off cleaned data to pre
1021
  "modeling_agent": {
1022
  "name": "ML Modeling Specialist",
1023
  "emoji": "🤖",
1024
- "description": "Build and train predictive machine learning models to forecast outcomes, classify categories, or predict future values. Perform supervised learning tasks including regression and classification. Train baseline models, optimize hyperparameters, conduct cross-validation, and evaluate model performance metrics like accuracy, precision, recall, and R-squared.",
1025
- "system_prompt": """You are the ML Modeling Specialist Agent - an expert in machine learning.
1026
 
1027
  **Your Expertise:**
 
1028
  - Model selection and baseline training
1029
  - Hyperparameter tuning and optimization
1030
- - Ensemble methods and advanced algorithms
 
1031
  - Cross-validation strategies
1032
  - Model evaluation and performance metrics
1033
 
@@ -1039,29 +1091,49 @@ BEFORE calling any training tools, you MUST:
1039
  4. If target column was provided or inferred, proceed with modeling
1040
  5. Only if NO target is available: analyze correlations to find best candidate
1041
 
1042
- **Your Tools (6 modeling-focused):**
1043
- - train_baseline_models, hyperparameter_tuning
1044
- - perform_cross_validation
 
 
 
1045
  - generate_model_report, detect_model_issues
1046
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1047
  **Your Approach:**
1048
  1. FIRST: Profile the dataset to see actual columns (if not done)
1049
  2. VALIDATE: Confirm target column exists
1050
- 3. Start with baseline models to establish performance floor
1051
- 4. Use automated hyperparameter tuning for optimization
1052
- 5. Try ensemble methods for performance boost
1053
- 6. Validate with proper cross-validation
1054
- 7. Generate comprehensive model reports with metrics
1055
- 8. Detect and address model issues (overfitting, bias, etc.)
1056
 
1057
  **Common Errors to Avoid:**
1058
- ❌ Calling train_baseline_models with non-existent target column
1059
  ❌ Guessing column names like "Occupation", "Target", "Label"
1060
  ❌ Using execute_python_code when dedicated tools exist
 
1061
  ✅ Always verify column names from profile_dataset first
 
1062
 
1063
  You receive preprocessed data from data engineering agents and collaborate with visualization agents for model performance plots.""",
1064
- "tool_keywords": ["train", "model", "hyperparameter", "ensemble", "cross-validation", "predict", "classify", "regress"]
1065
  },
1066
 
1067
  "viz_agent": {
@@ -1236,11 +1308,31 @@ You receive quality reports from EDA agent and deliver clean data to modeling ag
1236
  return result["output_path"]
1237
  # For nested results
1238
  if "result" in result and isinstance(result["result"], dict):
1239
- if "output_path" in result["result"]:
1240
- return result["result"]["output_path"]
1241
-
1242
- # Default fallback
1243
- return "./outputs/data/encoded.csv"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1244
 
1245
  def _determine_next_step(self, stuck_tool: str, completed_tools: List[str]) -> str:
1246
  """Determine what the next workflow step should be based on what's stuck."""
@@ -1569,8 +1661,35 @@ You receive quality reports from EDA agent and deliver clean data to modeling ag
1569
  "url": f"/outputs/{report_path.replace('./outputs/', '')}"
1570
  })
1571
  print(f"[DEBUG] Added to artifacts[reports], total reports: {len(artifacts['reports'])}")
1572
- else:
1573
- print(f"[DEBUG] No output_path or report_path in nested_result for report tool")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1574
 
1575
  # === COLLECT VISUALIZATION FILES (interactive plots, charts, etc.) ===
1576
  elif "plot" in tool.lower() or "visualiz" in tool.lower() or "chart" in tool.lower() or "heatmap" in tool.lower() or "scatter" in tool.lower() or "histogram" in tool.lower():
@@ -2108,6 +2227,26 @@ You receive quality reports from EDA agent and deliver clean data to modeling ag
2108
  print(f" ✓ Stripped invalid parameter '{invalid_param}': {val}")
2109
  print(f" ℹ️ create_statistical_features creates row-wise stats (mean, std, min, max)")
2110
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2111
  # General parameter corrections for common LLM hallucinations
2112
  if "output" in arguments and "output_path" not in arguments:
2113
  # Many tools use 'output_path' but LLM uses 'output'
@@ -2803,13 +2942,16 @@ You receive quality reports from EDA agent and deliver clean data to modeling ag
2803
  print(f"[DEBUG] Orchestrator received resolved_params: {resolved_params}")
2804
  print(f"[DEBUG] Current file_path: '{file_path}', target_col: '{target_col}'")
2805
 
2806
- # Use resolved params if user didn't specify
 
2807
  if not file_path or file_path == "":
2808
  if resolved_params.get("file_path"):
2809
  file_path = resolved_params["file_path"]
2810
  print(f"📝 Using dataset from session: {file_path}")
2811
  else:
2812
  print(f"[DEBUG] No file_path in resolved_params")
 
 
2813
 
2814
  if not target_col:
2815
  if resolved_params.get("target_col"):
@@ -2817,8 +2959,13 @@ You receive quality reports from EDA agent and deliver clean data to modeling ag
2817
  print(f"📝 Using target column from session: {target_col}")
2818
 
2819
 
2820
- # Show session context if available
2821
  if self.session.last_dataset or self.session.last_model:
 
 
 
 
 
2822
  context_summary = self.session.get_context_summary()
2823
  print(f"\n{context_summary}\n")
2824
 
@@ -3150,6 +3297,12 @@ You receive quality reports from EDA agent and deliver clean data to modeling ag
3150
  cleaned_recent.append(msg)
3151
  i += 1
3152
 
 
 
 
 
 
 
3153
  messages = [system_msg, user_msg] + cleaned_recent
3154
  print(f"✂️ Pruned conversation (keeping last 12 exchanges for better context preservation)")
3155
 
@@ -3193,6 +3346,12 @@ You receive quality reports from EDA agent and deliver clean data to modeling ag
3193
  cleaned_recent.append(msg)
3194
  i += 1
3195
 
 
 
 
 
 
 
3196
  messages = [system_msg, user_msg] + cleaned_recent
3197
  print(f"⚠️ Emergency pruning (conversation > 15K tokens, keeping last 8 exchanges)")
3198
 
@@ -3240,6 +3399,27 @@ You receive quality reports from EDA agent and deliver clean data to modeling ag
3240
  )
3241
  print(f"💰 Token budget: {token_count}/{self.token_manager.max_tokens} ({(token_count/self.token_manager.max_tokens*100):.1f}%)")
3242
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3243
  # Call LLM with function calling (provider-specific)
3244
  if self.provider == "mistral":
3245
  try:
@@ -4185,10 +4365,22 @@ You receive quality reports from EDA agent and deliver clean data to modeling ag
4185
  loop_threshold = 1 # Stop after first retry with similar code
4186
  print(f"⚠️ Detected repeated similar code execution")
4187
 
4188
- # Check for loops (same tool called threshold+ times consecutively)
 
 
 
 
 
 
 
 
 
 
 
 
4189
  if should_check_loops and tool_call_counter[tool_name] >= loop_threshold:
4190
- # Check if the last call was also this tool (consecutive repetition)
4191
- if workflow_history and workflow_history[-1]["tool"] == tool_name:
4192
  print(f"\n⚠️ LOOP DETECTED: {tool_name} called {tool_call_counter[tool_name]} times consecutively!")
4193
  print(f" This indicates the workflow is stuck. Skipping and forcing progression.")
4194
  print(f" Last successful file: {self._get_last_successful_file(workflow_history)}")
 
39
  profile_dataset,
40
  detect_data_quality_issues,
41
  analyze_correlations,
42
+ detect_label_errors, # NEW: cleanlab label error detection
43
  get_smart_summary, # NEW
44
  clean_missing_values,
45
  handle_outliers,
 
50
  encode_categorical,
51
  train_baseline_models,
52
  generate_model_report,
53
+ # AutoGluon Tools (9) - NEW: AutoML at Scale
54
+ train_with_autogluon,
55
+ predict_with_autogluon,
56
+ forecast_with_autogluon,
57
+ optimize_autogluon_model,
58
+ analyze_autogluon_model,
59
+ extend_autogluon_training,
60
+ train_multilabel_autogluon,
61
+ backtest_timeseries,
62
+ analyze_timeseries_model,
63
  # Data Wrangling Tools (3) - NEW
64
  merge_datasets,
65
  concat_datasets,
 
97
  perform_named_entity_recognition,
98
  analyze_sentiment_advanced,
99
  perform_text_similarity,
100
+ # Production/MLOps (5 + 2 new)
101
  monitor_model_drift,
102
  explain_predictions,
103
  generate_model_card,
104
  perform_ab_test_analysis,
105
  detect_feature_leakage,
106
+ monitor_drift_evidently,
107
+ explain_with_dtreeviz,
108
  # Time Series (3)
109
  forecast_time_series,
110
  detect_seasonality_trends,
 
132
  generate_interactive_box_plots,
133
  generate_interactive_time_series,
134
  generate_plotly_dashboard,
135
+ # EDA Report Generation (2) - NEW PHASE 2
136
  generate_ydata_profiling_report,
137
+ generate_sweetviz_report,
138
  # Code Interpreter (2) - NEW PHASE 2 - TRUE AI AGENT CAPABILITY
139
  execute_python_code,
140
  execute_code_from_file,
 
387
  "profile_dataset": profile_dataset,
388
  "detect_data_quality_issues": detect_data_quality_issues,
389
  "analyze_correlations": analyze_correlations,
390
+ "detect_label_errors": detect_label_errors, # NEW: cleanlab
391
  "get_smart_summary": get_smart_summary, # NEW
392
  "clean_missing_values": clean_missing_values,
393
  "handle_outliers": handle_outliers,
 
398
  "encode_categorical": encode_categorical,
399
  "train_baseline_models": train_baseline_models,
400
  "generate_model_report": generate_model_report,
401
+ # AutoGluon Tools (9) - NEW: AutoML at Scale
402
+ "train_with_autogluon": train_with_autogluon,
403
+ "predict_with_autogluon": predict_with_autogluon,
404
+ "forecast_with_autogluon": forecast_with_autogluon,
405
+ "optimize_autogluon_model": optimize_autogluon_model,
406
+ "analyze_autogluon_model": analyze_autogluon_model,
407
+ "extend_autogluon_training": extend_autogluon_training,
408
+ "train_multilabel_autogluon": train_multilabel_autogluon,
409
+ "backtest_timeseries": backtest_timeseries,
410
+ "analyze_timeseries_model": analyze_timeseries_model,
411
  # Data Wrangling Tools (3) - NEW
412
  "merge_datasets": merge_datasets,
413
  "concat_datasets": concat_datasets,
 
445
  "perform_named_entity_recognition": perform_named_entity_recognition,
446
  "analyze_sentiment_advanced": analyze_sentiment_advanced,
447
  "perform_text_similarity": perform_text_similarity,
448
+ # Production/MLOps (5 + 2 new)
449
  "monitor_model_drift": monitor_model_drift,
450
  "explain_predictions": explain_predictions,
451
  "generate_model_card": generate_model_card,
452
  "perform_ab_test_analysis": perform_ab_test_analysis,
453
  "detect_feature_leakage": detect_feature_leakage,
454
+ "monitor_drift_evidently": monitor_drift_evidently,
455
+ "explain_with_dtreeviz": explain_with_dtreeviz,
456
  # Time Series (3)
457
  "forecast_time_series": forecast_time_series,
458
  "detect_seasonality_trends": detect_seasonality_trends,
 
480
  "generate_interactive_box_plots": generate_interactive_box_plots,
481
  "generate_interactive_time_series": generate_interactive_time_series,
482
  "generate_plotly_dashboard": generate_plotly_dashboard,
483
+ # EDA Report Generation (2) - NEW PHASE 2
484
  "generate_ydata_profiling_report": generate_ydata_profiling_report,
485
+ "generate_sweetviz_report": generate_sweetviz_report,
486
  # Code Interpreter (2) - NEW PHASE 2 - TRUE AI AGENT CAPABILITY
487
  "execute_python_code": execute_python_code,
488
  "execute_code_from_file": execute_code_from_file,
 
705
  7. **IF DATETIME COLUMNS EXIST**: create_time_features(latest, date_col="<column_name>", output="./outputs/data/time_features.csv") - Extract year/month/day/hour/weekday/timestamp from each datetime column
706
  8. encode_categorical(latest, method="auto", output="./outputs/data/encoded.csv")
707
  9. generate_eda_plots(encoded, target_col, output_dir="./outputs/plots/eda") - Generate EDA visualizations
708
+ 10. **ONLY IF USER EXPLICITLY REQUESTED ML**: train_with_autogluon(file_path=encoded, target_col=target_col, task_type="auto", time_limit=120, presets="medium_quality")
709
+ - AutoGluon is the DEFAULT training tool. It trains 10+ models with auto ensembling.
710
+ - It handles raw data directly (categoricals, missing values) but we clean first for best results.
711
+ - Fallback: train_baseline_models(encoded, target_col, task_type="auto") if AutoGluon unavailable.
712
+ - For multi-label prediction: train_multilabel_autogluon(file_path, target_cols=["col1","col2"])
713
+ - Post-training: optimize_autogluon_model(model_path, operation="refit_full|distill|calibrate_threshold|deploy_optimize")
714
+ - Model inspection: analyze_autogluon_model(model_path, operation="summary|transform_features|info")
715
+ - Add more models: extend_autogluon_training(model_path, operation="fit_extra")
716
+ - For time series: forecast_with_autogluon (supports covariates, holidays, model selection)
717
+ - TS backtesting: backtest_timeseries(file_path, target_col, time_col, num_val_windows=3)
718
+ - TS analysis: analyze_timeseries_model(model_path, data_path, time_col, operation="plot|feature_importance")
719
  10b. **ALWAYS AFTER MODEL TRAINING**: generate_ydata_profiling_report(encoded, output_path="./outputs/reports/ydata_profile.html") - Comprehensive data analysis report
720
  11. **HYPERPARAMETER TUNING (⚠️ ONLY WHEN EXPLICITLY REQUESTED)**:
721
  - ⚠️ **CRITICAL WARNING**: This is EXTREMELY expensive (5-10 minutes) and resource-intensive!
 
880
  - ❌ Missing values → USE clean_missing_values() tool
881
  - ❌ Outliers → USE handle_outliers() tool
882
  - ❌ Standard EDA plots → USE generate_eda_plots() or generate_plotly_dashboard()
883
+ - ❌ Model training → USE train_with_autogluon() (preferred) or train_baseline_models()
884
+ - ❌ Model optimization → USE optimize_autogluon_model() (refit, distill, deploy)
885
+ - ❌ Time series forecasting → USE forecast_with_autogluon() (supports covariates, holidays)
886
+ - ❌ Time series backtesting → USE backtest_timeseries()
887
+ - ❌ Multi-label prediction → USE train_multilabel_autogluon()
888
  - ❌ Tasks with dedicated tools → USE THE TOOL, NOT custom code!
889
 
890
  **Rule of Thumb:**
 
896
  - force_numeric_conversion: Converts string columns to numeric (auto-detects, skips text)
897
  - clean_missing_values: "auto" mode supported
898
  - encode_categorical: one-hot/target/frequency encoding
899
+ - **⭐ train_with_autogluon**: AutoML - trains 10+ models with auto ensembling (PREFERRED)
900
+ - forecast_with_autogluon: Time series forecasting with AutoGluon (supports covariates, holidays, model selection)
901
+ - optimize_autogluon_model: Post-training optimization (refit_full, distill, calibrate_threshold, deploy_optimize, delete_models)
902
+ - analyze_autogluon_model: Model inspection (summary, transform_features, info)
903
+ - extend_autogluon_training: Add models incrementally (fit_extra, fit_weighted_ensemble)
904
+ - train_multilabel_autogluon: Multi-label prediction (multiple target columns)
905
+ - backtest_timeseries: Time series backtesting with multiple validation windows
906
+ - analyze_timeseries_model: TS model analysis (feature_importance, plot, make_future_dataframe)
907
+ - train_baseline_models: Fallback - trains 4 basic models
908
  - **⭐ execute_python_code**: Write and run custom Python code for ANY task not covered by tools (TRUE AI AGENT capability)
909
  - **execute_code_from_file**: Run existing Python scripts
910
  - Advanced: hyperparameter_tuning, perform_eda_analysis, handle_imbalanced_data, perform_feature_scaling, detect_anomalies, detect_and_handle_multicollinearity, auto_feature_engineering, forecast_time_series, explain_predictions, generate_business_insights, perform_topic_modeling, extract_image_features, monitor_model_drift
 
991
  - Were there any interesting correlations or anomalies?
992
  3. **Model performance** (if trained) - **CRITICAL: YOU MUST INCLUDE THESE METRICS**:
993
  - **ALWAYS extract and display** the exact metrics from tool results:
994
+ - R² Score, RMSE, MAE from the train_with_autogluon or train_baseline_models results
995
  - List ALL models trained (not just the best one)
996
  - Example: "Trained 6 models: XGBoost (R²=0.713, RMSE=0.207), Random Forest (R²=0.685, RMSE=0.218), etc."
997
  - If hyperparameter tuning was done, show before/after comparison
 
1071
  "modeling_agent": {
1072
  "name": "ML Modeling Specialist",
1073
  "emoji": "🤖",
1074
+ "description": "Build and train predictive machine learning models to forecast outcomes, classify categories, predict future values, or forecast time series. Perform supervised learning tasks including regression, classification, and time series forecasting. Train models using AutoGluon AutoML (preferred) or baseline models, optimize hyperparameters, conduct cross-validation, and evaluate model performance.",
1075
+ "system_prompt": """You are the ML Modeling Specialist Agent - an expert in machine learning powered by AutoGluon AutoML.
1076
 
1077
  **Your Expertise:**
1078
+ - AutoML with AutoGluon (preferred for best results)
1079
  - Model selection and baseline training
1080
  - Hyperparameter tuning and optimization
1081
+ - Ensemble methods and model stacking
1082
+ - Time series forecasting
1083
  - Cross-validation strategies
1084
  - Model evaluation and performance metrics
1085
 
 
1091
  4. If target column was provided or inferred, proceed with modeling
1092
  5. Only if NO target is available: analyze correlations to find best candidate
1093
 
1094
+ **Your Tools (8 modeling-focused):**
1095
+ - train_with_autogluon (PREFERRED - AutoML with 10+ models, auto ensembling, handles raw data)
1096
+ - predict_with_autogluon (predictions with trained AutoGluon model)
1097
+ - forecast_with_autogluon (time series forecasting with AutoGluon - better than Prophet/ARIMA)
1098
+ - train_baseline_models (fallback - trains 4 basic models)
1099
+ - hyperparameter_tuning, perform_cross_validation
1100
  - generate_model_report, detect_model_issues
1101
 
1102
+ **TOOL PRIORITY (use in this order):**
1103
+ | Task | Use This Tool | NOT This |
1104
+ |------|--------------|----------|
1105
+ | Classification/Regression | train_with_autogluon | train_baseline_models |
1106
+ | Time Series Forecasting | forecast_with_autogluon | forecast_time_series |
1107
+ | Predictions on new data | predict_with_autogluon | execute_python_code |
1108
+ | Quick baseline check | train_baseline_models | execute_python_code |
1109
+
1110
+ **AutoGluon Advantages (explain to user):**
1111
+ - Trains 10+ models automatically (vs 4 in baseline)
1112
+ - Auto ensembles with multi-layer stacking
1113
+ - Handles categorical features directly (no manual encoding needed)
1114
+ - Handles missing values automatically (no manual imputation needed)
1115
+ - Time-bounded training (won't run forever)
1116
+ - Better accuracy than manual model selection
1117
+
1118
  **Your Approach:**
1119
  1. FIRST: Profile the dataset to see actual columns (if not done)
1120
  2. VALIDATE: Confirm target column exists
1121
+ 3. PREFERRED: Use train_with_autogluon for best results
1122
+ 4. For time series data: Use forecast_with_autogluon
1123
+ 5. Validate with proper cross-validation if needed
1124
+ 6. Generate comprehensive model reports with metrics
1125
+ 7. Detect and address model issues (overfitting, bias, etc.)
 
1126
 
1127
  **Common Errors to Avoid:**
1128
+ ❌ Calling train tools with non-existent target column
1129
  ❌ Guessing column names like "Occupation", "Target", "Label"
1130
  ❌ Using execute_python_code when dedicated tools exist
1131
+ ❌ Using train_baseline_models when train_with_autogluon is available
1132
  ✅ Always verify column names from profile_dataset first
1133
+ ✅ Use train_with_autogluon as the DEFAULT training tool
1134
 
1135
  You receive preprocessed data from data engineering agents and collaborate with visualization agents for model performance plots.""",
1136
+ "tool_keywords": ["train", "model", "hyperparameter", "ensemble", "cross-validation", "predict", "classify", "regress", "autogluon", "automl", "forecast"]
1137
  },
1138
 
1139
  "viz_agent": {
 
1308
  return result["output_path"]
1309
  # For nested results
1310
  if "result" in result and isinstance(result["result"], dict):
1311
+ nested = result["result"]
1312
+ if "output_path" in nested:
1313
+ return nested["output_path"]
1314
+ # Check output_dir for dashboard-type tools
1315
+ if "output_dir" in nested:
1316
+ return nested["output_dir"]
1317
+ # Check generated_files from execute_python_code
1318
+ if "generated_files" in nested and nested["generated_files"]:
1319
+ return nested["generated_files"][0]
1320
+ # Check tool arguments for file_path as last resort
1321
+ args = step.get("arguments", step.get("result", {}).get("arguments", {}))
1322
+ if isinstance(args, dict) and "file_path" in args:
1323
+ import os
1324
+ if os.path.exists(args["file_path"]):
1325
+ return args["file_path"]
1326
+
1327
+ # 🔥 FIX: Return the original input file instead of a phantom path
1328
+ # Try to get from session or workflow state
1329
+ if hasattr(self, 'session') and self.session and self.session.last_dataset:
1330
+ return self.session.last_dataset
1331
+ if hasattr(self, 'workflow_state') and self.workflow_state.current_file:
1332
+ return self.workflow_state.current_file
1333
+
1334
+ # Last resort: return empty string instead of phantom file
1335
+ return "(no file found - use the original uploaded dataset)"
1336
 
1337
  def _determine_next_step(self, stuck_tool: str, completed_tools: List[str]) -> str:
1338
  """Determine what the next workflow step should be based on what's stuck."""
 
1661
  "url": f"/outputs/{report_path.replace('./outputs/', '')}"
1662
  })
1663
  print(f"[DEBUG] Added to artifacts[reports], total reports: {len(artifacts['reports'])}")
1664
+
1665
+ # 🔥 FIX: Extract individual plots from dashboard's 'plots' array
1666
+ # generate_plotly_dashboard returns {"plots": [{"output_path": ..., "status": "success"}, ...]}
1667
+ if "plots" in nested_result and isinstance(nested_result["plots"], list):
1668
+ dashboard_output_dir = nested_result.get("output_dir", "./outputs/plots/interactive")
1669
+ for sub_plot in nested_result["plots"]:
1670
+ if isinstance(sub_plot, dict) and sub_plot.get("status") == "success":
1671
+ sub_path = sub_plot.get("output_path", "")
1672
+ if sub_path:
1673
+ # Clean path for URL
1674
+ if sub_path.startswith('./outputs/'):
1675
+ url_path = sub_path.replace('./outputs/', '')
1676
+ elif sub_path.startswith('/tmp/data_science_agent/'):
1677
+ url_path = sub_path.replace('/tmp/data_science_agent/', '')
1678
+ else:
1679
+ url_path = sub_path.split('/')[-1]
1680
+
1681
+ plot_title = sub_path.split('/')[-1].replace('_', ' ').replace('.html', '').replace('.png', '').title()
1682
+ plots.append({
1683
+ "title": plot_title,
1684
+ "path": sub_path,
1685
+ "url": f"/outputs/{url_path}",
1686
+ "type": "html" if sub_path.endswith(".html") else "image"
1687
+ })
1688
+ print(f"[DEBUG] Added dashboard sub-plot: {plot_title} -> /outputs/{url_path}")
1689
+
1690
+ print(f"[DEBUG] Extracted {len(nested_result['plots'])} plots from dashboard")
1691
+ elif not report_path:
1692
+ print(f"[DEBUG] No output_path, report_path, or plots array in nested_result for report tool")
1693
 
1694
  # === COLLECT VISUALIZATION FILES (interactive plots, charts, etc.) ===
1695
  elif "plot" in tool.lower() or "visualiz" in tool.lower() or "chart" in tool.lower() or "heatmap" in tool.lower() or "scatter" in tool.lower() or "histogram" in tool.lower():
 
2227
  print(f" ✓ Stripped invalid parameter '{invalid_param}': {val}")
2228
  print(f" ℹ️ create_statistical_features creates row-wise stats (mean, std, min, max)")
2229
 
2230
+ # 🔥 FIX: Generic parameter sanitization - strip any unknown kwargs
2231
+ # This prevents "got an unexpected keyword argument" errors from LLM hallucinations
2232
+ import inspect
2233
+ try:
2234
+ sig = inspect.signature(tool_func)
2235
+ valid_params = set(sig.parameters.keys())
2236
+ invalid_args = [k for k in arguments.keys() if k not in valid_params]
2237
+ # Only strip if the function doesn't accept **kwargs
2238
+ has_var_keyword = any(
2239
+ p.kind == inspect.Parameter.VAR_KEYWORD
2240
+ for p in sig.parameters.values()
2241
+ )
2242
+ if invalid_args and not has_var_keyword:
2243
+ for invalid_param in invalid_args:
2244
+ val = arguments.pop(invalid_param)
2245
+ print(f" ✓ Stripped hallucinated parameter '{invalid_param}': {val}")
2246
+ print(f" ℹ️ Valid parameters for {tool_name}: {list(valid_params)}")
2247
+ except (ValueError, TypeError):
2248
+ pass # Can't inspect, skip validation
2249
+
2250
  # General parameter corrections for common LLM hallucinations
2251
  if "output" in arguments and "output_path" not in arguments:
2252
  # Many tools use 'output_path' but LLM uses 'output'
 
2942
  print(f"[DEBUG] Orchestrator received resolved_params: {resolved_params}")
2943
  print(f"[DEBUG] Current file_path: '{file_path}', target_col: '{target_col}'")
2944
 
2945
+ # 🔥 FIX: Only use resolved file_path if user did NOT provide a new file
2946
+ # If file_path is already set (user uploaded a new file), DON'T override it
2947
  if not file_path or file_path == "":
2948
  if resolved_params.get("file_path"):
2949
  file_path = resolved_params["file_path"]
2950
  print(f"📝 Using dataset from session: {file_path}")
2951
  else:
2952
  print(f"[DEBUG] No file_path in resolved_params")
2953
+ else:
2954
+ print(f"📝 User provided new file: {file_path} (ignoring session file: {resolved_params.get('file_path', 'none')})")
2955
 
2956
  if not target_col:
2957
  if resolved_params.get("target_col"):
 
2959
  print(f"📝 Using target column from session: {target_col}")
2960
 
2961
 
2962
+ # Show session context if available (but show CURRENT file, not old one)
2963
  if self.session.last_dataset or self.session.last_model:
2964
+ # 🔥 FIX: Update session's last_dataset to current file BEFORE showing context
2965
+ # This prevents stale session context from misleading the LLM
2966
+ if file_path and file_path != self.session.last_dataset:
2967
+ print(f"📝 Updating session dataset: {self.session.last_dataset} → {file_path}")
2968
+ self.session.last_dataset = file_path
2969
  context_summary = self.session.get_context_summary()
2970
  print(f"\n{context_summary}\n")
2971
 
 
3297
  cleaned_recent.append(msg)
3298
  i += 1
3299
 
3300
+ # 🔥 CRITICAL FIX: Remove orphaned tool messages at the start of cleaned_recent
3301
+ # Mistral NEVER allows 'tool' role immediately after 'user' role
3302
+ while cleaned_recent and get_role(cleaned_recent[0]) == 'tool':
3303
+ print(f"⚠️ Removed orphaned tool message at start of pruned history")
3304
+ cleaned_recent.pop(0)
3305
+
3306
  messages = [system_msg, user_msg] + cleaned_recent
3307
  print(f"✂️ Pruned conversation (keeping last 12 exchanges for better context preservation)")
3308
 
 
3346
  cleaned_recent.append(msg)
3347
  i += 1
3348
 
3349
+ # 🔥 CRITICAL FIX: Remove orphaned tool messages at the start of cleaned_recent
3350
+ # Mistral NEVER allows 'tool' role immediately after 'user' role
3351
+ while cleaned_recent and get_role(cleaned_recent[0]) == 'tool':
3352
+ print(f"⚠️ Removed orphaned tool message at start of emergency pruned history")
3353
+ cleaned_recent.pop(0)
3354
+
3355
  messages = [system_msg, user_msg] + cleaned_recent
3356
  print(f"⚠️ Emergency pruning (conversation > 15K tokens, keeping last 8 exchanges)")
3357
 
 
3399
  )
3400
  print(f"💰 Token budget: {token_count}/{self.token_manager.max_tokens} ({(token_count/self.token_manager.max_tokens*100):.1f}%)")
3401
 
3402
+ # 🔥 CRITICAL: Validate message order for Mistral API compliance
3403
+ # Mistral requires: system → user → assistant → tool (only after assistant with tool_calls) → assistant → user...
3404
+ # NEVER: user → tool (this causes "Unexpected role 'tool' after role 'user'" error)
3405
+ if self.provider in ["mistral", "groq"]:
3406
+ validated_messages = []
3407
+ for i, msg in enumerate(messages):
3408
+ role = get_role(msg)
3409
+
3410
+ # Check if this is a tool message after a user message
3411
+ if role == 'tool' and validated_messages:
3412
+ prev_role = get_role(validated_messages[-1])
3413
+ if prev_role == 'user':
3414
+ # Invalid! Skip this tool message
3415
+ print(f"⚠️ WARNING: Skipped orphaned tool message at position {i} (after user message)")
3416
+ continue
3417
+
3418
+ validated_messages.append(msg)
3419
+
3420
+ messages = validated_messages
3421
+ print(f"✅ Message order validation complete: {len(messages)} messages")
3422
+
3423
  # Call LLM with function calling (provider-specific)
3424
  if self.provider == "mistral":
3425
  try:
 
4365
  loop_threshold = 1 # Stop after first retry with similar code
4366
  print(f"⚠️ Detected repeated similar code execution")
4367
 
4368
+ # 🔥 FIX: Check if arguments are DIFFERENT from last call
4369
+ # If the same tool is called with different arguments, it's NOT a loop
4370
+ # (e.g., generating multiple different plots is legitimate)
4371
+ is_same_args = False
4372
+ if workflow_history and workflow_history[-1]["tool"] == tool_name:
4373
+ last_args = workflow_history[-1].get("arguments", {})
4374
+ # Compare key arguments (ignore output paths which may differ)
4375
+ ignore_keys = {"output_path", "output_dir"}
4376
+ last_key_args = {k: v for k, v in last_args.items() if k not in ignore_keys}
4377
+ current_key_args = {k: v for k, v in tool_args.items() if k not in ignore_keys}
4378
+ is_same_args = (last_key_args == current_key_args)
4379
+
4380
+ # Check for loops (same tool called threshold+ times consecutively WITH SAME ARGS)
4381
  if should_check_loops and tool_call_counter[tool_name] >= loop_threshold:
4382
+ # Only flag as loop if last call was same tool WITH same arguments
4383
+ if workflow_history and workflow_history[-1]["tool"] == tool_name and is_same_args:
4384
  print(f"\n⚠️ LOOP DETECTED: {tool_name} called {tool_call_counter[tool_name]} times consecutively!")
4385
  print(f" This indicates the workflow is stuck. Skipping and forcing progression.")
4386
  print(f" Last successful file: {self._get_last_successful_file(workflow_history)}")
src/tools/__init__.py CHANGED
@@ -5,7 +5,8 @@ from .data_profiling import (
5
  profile_dataset,
6
  detect_data_quality_issues,
7
  analyze_correlations,
8
- get_smart_summary # NEW: Enhanced data summary
 
9
  )
10
 
11
  from .data_cleaning import (
@@ -36,6 +37,19 @@ from .model_training import (
36
  generate_model_report
37
  )
38
 
 
 
 
 
 
 
 
 
 
 
 
 
 
39
  # Advanced Analysis Tools (5)
40
  from .advanced_analysis import (
41
  perform_eda_analysis,
@@ -90,13 +104,15 @@ from .nlp_text_analytics import (
90
  perform_text_similarity
91
  )
92
 
93
- # Production/MLOps Tools (5)
94
  from .production_mlops import (
95
  monitor_model_drift,
96
  explain_predictions,
97
  generate_model_card,
98
  perform_ab_test_analysis,
99
- detect_feature_leakage
 
 
100
  )
101
 
102
  # Time Series Tools (3)
@@ -141,9 +157,10 @@ from .plotly_visualizations import (
141
  generate_plotly_dashboard
142
  )
143
 
144
- # EDA Report Generation (1) - NEW PHASE 2
145
  from .eda_reports import (
146
- generate_ydata_profiling_report
 
147
  )
148
 
149
  # Code Interpreter (2) - NEW PHASE 2 - CRITICAL for True AI Agent
@@ -170,11 +187,12 @@ from .enhanced_feature_engineering import (
170
  )
171
 
172
  __all__ = [
173
- # Basic Data Profiling (4) - UPDATED
174
  "profile_dataset",
175
  "detect_data_quality_issues",
176
  "analyze_correlations",
177
  "get_smart_summary", # NEW
 
178
 
179
  # Basic Data Cleaning (3)
180
  "clean_missing_values",
@@ -198,6 +216,17 @@ __all__ = [
198
  "train_baseline_models",
199
  "generate_model_report",
200
 
 
 
 
 
 
 
 
 
 
 
 
201
  # Advanced Analysis (5)
202
  "perform_eda_analysis",
203
  "detect_model_issues",
@@ -238,12 +267,14 @@ __all__ = [
238
  "analyze_sentiment_advanced",
239
  "perform_text_similarity",
240
 
241
- # Production/MLOps (5)
242
  "monitor_model_drift",
243
  "explain_predictions",
244
  "generate_model_card",
245
  "perform_ab_test_analysis",
246
  "detect_feature_leakage",
 
 
247
 
248
  # Time Series (3)
249
  "forecast_time_series",
@@ -277,8 +308,9 @@ __all__ = [
277
  "generate_interactive_time_series",
278
  "generate_plotly_dashboard",
279
 
280
- # EDA Report Generation (1) - NEW PHASE 2
281
  "generate_ydata_profiling_report",
 
282
 
283
  # Code Interpreter (2) - NEW PHASE 2 - CRITICAL for True AI Agent
284
  "execute_python_code",
 
5
  profile_dataset,
6
  detect_data_quality_issues,
7
  analyze_correlations,
8
+ get_smart_summary, # NEW: Enhanced data summary
9
+ detect_label_errors # NEW: cleanlab label error detection
10
  )
11
 
12
  from .data_cleaning import (
 
37
  generate_model_report
38
  )
39
 
40
+ # AutoGluon-Powered Training (9) - Classification, Regression, Time Series, Optimization
41
+ from .autogluon_training import (
42
+ train_with_autogluon,
43
+ predict_with_autogluon,
44
+ forecast_with_autogluon,
45
+ optimize_autogluon_model,
46
+ analyze_autogluon_model,
47
+ extend_autogluon_training,
48
+ train_multilabel_autogluon,
49
+ backtest_timeseries,
50
+ analyze_timeseries_model
51
+ )
52
+
53
  # Advanced Analysis Tools (5)
54
  from .advanced_analysis import (
55
  perform_eda_analysis,
 
104
  perform_text_similarity
105
  )
106
 
107
+ # Production/MLOps Tools (5 + 2 new)
108
  from .production_mlops import (
109
  monitor_model_drift,
110
  explain_predictions,
111
  generate_model_card,
112
  perform_ab_test_analysis,
113
+ detect_feature_leakage,
114
+ monitor_drift_evidently, # NEW: Evidently drift reports
115
+ explain_with_dtreeviz # NEW: Decision tree visualization
116
  )
117
 
118
  # Time Series Tools (3)
 
157
  generate_plotly_dashboard
158
  )
159
 
160
+ # EDA Report Generation (2) - NEW PHASE 2
161
  from .eda_reports import (
162
+ generate_ydata_profiling_report,
163
+ generate_sweetviz_report # NEW: Sweetviz EDA with comparison
164
  )
165
 
166
  # Code Interpreter (2) - NEW PHASE 2 - CRITICAL for True AI Agent
 
187
  )
188
 
189
  __all__ = [
190
+ # Basic Data Profiling (4 + 1 new) - UPDATED
191
  "profile_dataset",
192
  "detect_data_quality_issues",
193
  "analyze_correlations",
194
  "get_smart_summary", # NEW
195
+ "detect_label_errors", # NEW: cleanlab
196
 
197
  # Basic Data Cleaning (3)
198
  "clean_missing_values",
 
216
  "train_baseline_models",
217
  "generate_model_report",
218
 
219
+ # AutoGluon Training (9) - NEW
220
+ "train_with_autogluon",
221
+ "predict_with_autogluon",
222
+ "forecast_with_autogluon",
223
+ "optimize_autogluon_model",
224
+ "analyze_autogluon_model",
225
+ "extend_autogluon_training",
226
+ "train_multilabel_autogluon",
227
+ "backtest_timeseries",
228
+ "analyze_timeseries_model",
229
+
230
  # Advanced Analysis (5)
231
  "perform_eda_analysis",
232
  "detect_model_issues",
 
267
  "analyze_sentiment_advanced",
268
  "perform_text_similarity",
269
 
270
+ # Production/MLOps (5 + 2 new)
271
  "monitor_model_drift",
272
  "explain_predictions",
273
  "generate_model_card",
274
  "perform_ab_test_analysis",
275
  "detect_feature_leakage",
276
+ "monitor_drift_evidently", # NEW: Evidently
277
+ "explain_with_dtreeviz", # NEW: dtreeviz
278
 
279
  # Time Series (3)
280
  "forecast_time_series",
 
308
  "generate_interactive_time_series",
309
  "generate_plotly_dashboard",
310
 
311
+ # EDA Report Generation (2) - NEW PHASE 2
312
  "generate_ydata_profiling_report",
313
+ "generate_sweetviz_report", # NEW: Sweetviz
314
 
315
  # Code Interpreter (2) - NEW PHASE 2 - CRITICAL for True AI Agent
316
  "execute_python_code",
src/tools/advanced_insights.py CHANGED
@@ -466,14 +466,16 @@ def analyze_distribution(file_path: str,
466
 
467
  def perform_segment_analysis(file_path: str,
468
  n_segments: int = 5,
469
- features: Optional[List[str]] = None) -> Dict[str, Any]:
 
470
  """
471
  Perform cluster-based segment analysis.
472
 
473
  Args:
474
  file_path: Path to dataset
475
- n_segments: Number of segments to create
476
  features: Features to use for clustering (all numeric if None)
 
477
 
478
  Returns:
479
  Dictionary with segment analysis results
@@ -498,18 +500,44 @@ def perform_segment_analysis(file_path: str,
498
  X_scaled = scaler.fit_transform(X)
499
 
500
  # Perform clustering
501
- kmeans = KMeans(n_clusters=n_segments, random_state=42, n_init=10)
502
- labels = kmeans.fit_predict(X_scaled)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
503
 
504
  # Add cluster labels to dataframe
505
  df['segment'] = labels
506
 
507
- # Analyze segments
 
508
  segment_profiles = []
509
- for i in range(n_segments):
510
- segment_data = df[df['segment'] == i]
511
  profile = {
512
- "segment_id": i,
 
513
  "size": len(segment_data),
514
  "percentage": float((len(segment_data) / len(df)) * 100),
515
  "characteristics": {}
@@ -525,20 +553,26 @@ def perform_segment_analysis(file_path: str,
525
  segment_profiles.append(profile)
526
 
527
  results = {
 
528
  "n_segments": n_segments,
529
  "features_used": features,
530
  "total_samples": len(df),
531
  "segments": segment_profiles,
532
  "insights": [
533
- f"🎯 Created {n_segments} segments from {len(df)} samples",
534
  f"📊 Used {len(features)} features for segmentation"
535
  ]
536
  }
537
 
 
 
 
 
538
  # Find most distinctive features for each segment
539
- for i, profile in enumerate(segment_profiles):
540
- results["insights"].append(
541
- f"Segment {i}: {profile['size']} samples ({profile['percentage']:.1f}%)"
542
- )
 
543
 
544
  return results
 
466
 
467
  def perform_segment_analysis(file_path: str,
468
  n_segments: int = 5,
469
+ features: Optional[List[str]] = None,
470
+ method: str = "kmeans") -> Dict[str, Any]:
471
  """
472
  Perform cluster-based segment analysis.
473
 
474
  Args:
475
  file_path: Path to dataset
476
+ n_segments: Number of segments to create (ignored for HDBSCAN)
477
  features: Features to use for clustering (all numeric if None)
478
+ method: Clustering method ('kmeans' or 'hdbscan')
479
 
480
  Returns:
481
  Dictionary with segment analysis results
 
500
  X_scaled = scaler.fit_transform(X)
501
 
502
  # Perform clustering
503
+ if method == "hdbscan":
504
+ try:
505
+ from sklearn.cluster import HDBSCAN as SklearnHDBSCAN
506
+
507
+ print("🔍 Using HDBSCAN for density-based segmentation...")
508
+ clusterer = SklearnHDBSCAN(
509
+ min_cluster_size=max(5, len(X) // 50),
510
+ min_samples=max(3, len(X) // 100),
511
+ cluster_selection_method='eom'
512
+ )
513
+ labels = clusterer.fit_predict(X_scaled)
514
+
515
+ # HDBSCAN assigns -1 to noise points
516
+ n_clusters = len(set(labels)) - (1 if -1 in labels else 0)
517
+ n_noise = int((labels == -1).sum())
518
+ n_segments = n_clusters
519
+
520
+ print(f" Found {n_clusters} clusters + {n_noise} noise points")
521
+
522
+ except ImportError:
523
+ print("⚠️ HDBSCAN not available (requires scikit-learn >= 1.3). Falling back to KMeans.")
524
+ method = "kmeans"
525
+
526
+ if method == "kmeans":
527
+ kmeans = KMeans(n_clusters=n_segments, random_state=42, n_init=10)
528
+ labels = kmeans.fit_predict(X_scaled)
529
 
530
  # Add cluster labels to dataframe
531
  df['segment'] = labels
532
 
533
+ # Analyze segments (include noise cluster -1 for HDBSCAN)
534
+ unique_labels = sorted(set(labels))
535
  segment_profiles = []
536
+ for label in unique_labels:
537
+ segment_data = df[df['segment'] == label]
538
  profile = {
539
+ "segment_id": int(label),
540
+ "label": "noise" if label == -1 else f"cluster_{label}",
541
  "size": len(segment_data),
542
  "percentage": float((len(segment_data) / len(df)) * 100),
543
  "characteristics": {}
 
553
  segment_profiles.append(profile)
554
 
555
  results = {
556
+ "method": method,
557
  "n_segments": n_segments,
558
  "features_used": features,
559
  "total_samples": len(df),
560
  "segments": segment_profiles,
561
  "insights": [
562
+ f"🎯 Created {n_segments} segments from {len(df)} samples using {method.upper()}",
563
  f"📊 Used {len(features)} features for segmentation"
564
  ]
565
  }
566
 
567
+ if method == "hdbscan" and n_noise > 0:
568
+ results["noise_points"] = n_noise
569
+ results["insights"].append(f"🔇 {n_noise} samples classified as noise (outliers)")
570
+
571
  # Find most distinctive features for each segment
572
+ for profile in segment_profiles:
573
+ if profile["segment_id"] != -1:
574
+ results["insights"].append(
575
+ f"Segment {profile['segment_id']}: {profile['size']} samples ({profile['percentage']:.1f}%)"
576
+ )
577
 
578
  return results
src/tools/advanced_preprocessing.py CHANGED
@@ -195,6 +195,8 @@ def perform_feature_scaling(
195
  - 'standard': StandardScaler (mean=0, std=1)
196
  - 'minmax': MinMaxScaler (range 0-1)
197
  - 'robust': RobustScaler (median, IQR - robust to outliers)
 
 
198
  columns: List of columns to scale (None = all numeric columns)
199
  output_path: Path to save scaled dataset
200
  scaler_save_path: Path to save fitted scaler for future use
@@ -231,8 +233,16 @@ def perform_feature_scaling(
231
  scaler = MinMaxScaler()
232
  elif scaler_type == "robust":
233
  scaler = RobustScaler()
 
 
 
 
 
 
 
 
234
  else:
235
- raise ValueError(f"Unsupported scaler_type: {scaler_type}")
236
 
237
  # Get original statistics
238
  original_stats = {}
 
195
  - 'standard': StandardScaler (mean=0, std=1)
196
  - 'minmax': MinMaxScaler (range 0-1)
197
  - 'robust': RobustScaler (median, IQR - robust to outliers)
198
+ - 'power': PowerTransformer (Yeo-Johnson, makes data more Gaussian)
199
+ - 'quantile': QuantileTransformer (uniform or normal output distribution)
200
  columns: List of columns to scale (None = all numeric columns)
201
  output_path: Path to save scaled dataset
202
  scaler_save_path: Path to save fitted scaler for future use
 
233
  scaler = MinMaxScaler()
234
  elif scaler_type == "robust":
235
  scaler = RobustScaler()
236
+ elif scaler_type == "power":
237
+ from sklearn.preprocessing import PowerTransformer
238
+ scaler = PowerTransformer(method='yeo-johnson', standardize=True)
239
+ print(" 📐 Using Yeo-Johnson PowerTransformer (makes data more Gaussian)")
240
+ elif scaler_type == "quantile":
241
+ from sklearn.preprocessing import QuantileTransformer
242
+ scaler = QuantileTransformer(output_distribution='normal', random_state=42, n_quantiles=min(1000, len(df)))
243
+ print(" 📐 Using QuantileTransformer (maps to normal distribution)")
244
  else:
245
+ raise ValueError(f"Unsupported scaler_type: {scaler_type}. Use 'standard', 'minmax', 'robust', 'power', or 'quantile'.")
246
 
247
  # Get original statistics
248
  original_stats = {}
src/tools/advanced_training.py CHANGED
@@ -73,7 +73,7 @@ def hyperparameter_tuning(
73
  Args:
74
  file_path: Path to prepared dataset
75
  target_col: Target column name
76
- model_type: Model to tune ('random_forest', 'xgboost', 'logistic', 'ridge')
77
  task_type: 'classification', 'regression', or 'auto' (detect from target)
78
  n_trials: Number of optimization trials (default 50, auto-reduced for large datasets)
79
  cv_folds: Number of cross-validation folds
@@ -243,8 +243,45 @@ def hyperparameter_tuning(
243
  'random_state': random_state
244
  }
245
  model = Ridge(**params)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
246
  else:
247
- raise ValueError(f"Unsupported model_type: {model_type}")
248
 
249
  # Cross-validation
250
  if task_type == "classification":
 
73
  Args:
74
  file_path: Path to prepared dataset
75
  target_col: Target column name
76
+ model_type: Model to tune ('random_forest', 'xgboost', 'lightgbm', 'catboost', 'logistic', 'ridge')
77
  task_type: 'classification', 'regression', or 'auto' (detect from target)
78
  n_trials: Number of optimization trials (default 50, auto-reduced for large datasets)
79
  cv_folds: Number of cross-validation folds
 
243
  'random_state': random_state
244
  }
245
  model = Ridge(**params)
246
+
247
+ elif model_type == "lightgbm":
248
+ from lightgbm import LGBMClassifier, LGBMRegressor
249
+ params = {
250
+ 'n_estimators': trial.suggest_int('n_estimators', 50, 500),
251
+ 'max_depth': trial.suggest_int('max_depth', 3, 12),
252
+ 'learning_rate': trial.suggest_float('learning_rate', 0.01, 0.3, log=True),
253
+ 'subsample': trial.suggest_float('subsample', 0.5, 1.0),
254
+ 'colsample_bytree': trial.suggest_float('colsample_bytree', 0.5, 1.0),
255
+ 'reg_alpha': trial.suggest_float('reg_alpha', 1e-8, 10.0, log=True),
256
+ 'reg_lambda': trial.suggest_float('reg_lambda', 1e-8, 10.0, log=True),
257
+ 'num_leaves': trial.suggest_int('num_leaves', 15, 127),
258
+ 'min_child_samples': trial.suggest_int('min_child_samples', 5, 100),
259
+ 'random_state': random_state,
260
+ 'verbosity': -1
261
+ }
262
+ if task_type == "classification":
263
+ model = LGBMClassifier(**params)
264
+ else:
265
+ model = LGBMRegressor(**params)
266
+
267
+ elif model_type == "catboost":
268
+ from catboost import CatBoostClassifier, CatBoostRegressor
269
+ params = {
270
+ 'iterations': trial.suggest_int('iterations', 50, 500),
271
+ 'depth': trial.suggest_int('depth', 3, 10),
272
+ 'learning_rate': trial.suggest_float('learning_rate', 0.01, 0.3, log=True),
273
+ 'l2_leaf_reg': trial.suggest_float('l2_leaf_reg', 1e-8, 10.0, log=True),
274
+ 'bagging_temperature': trial.suggest_float('bagging_temperature', 0, 10),
275
+ 'random_strength': trial.suggest_float('random_strength', 0, 10),
276
+ 'random_seed': random_state,
277
+ 'verbose': 0
278
+ }
279
+ if task_type == "classification":
280
+ model = CatBoostClassifier(**params)
281
+ else:
282
+ model = CatBoostRegressor(**params)
283
  else:
284
+ raise ValueError(f"Unsupported model_type: {model_type}. Use 'random_forest', 'xgboost', 'lightgbm', 'catboost', 'logistic', or 'ridge'.")
285
 
286
  # Cross-validation
287
  if task_type == "classification":
src/tools/agent_tool_mapping.py CHANGED
@@ -42,6 +42,12 @@ TOOL_CATEGORIES = {
42
  ],
43
  "modeling": [
44
  "train_baseline_models",
 
 
 
 
 
 
45
  "hyperparameter_tuning",
46
  "perform_cross_validation",
47
  "train_ensemble_models",
@@ -53,6 +59,9 @@ TOOL_CATEGORIES = {
53
  "decompose_time_series",
54
  "forecast_arima",
55
  "forecast_prophet",
 
 
 
56
  "detect_anomalies_time_series",
57
  ],
58
  "nlp": [
 
42
  ],
43
  "modeling": [
44
  "train_baseline_models",
45
+ "train_with_autogluon",
46
+ "predict_with_autogluon",
47
+ "optimize_autogluon_model",
48
+ "analyze_autogluon_model",
49
+ "extend_autogluon_training",
50
+ "train_multilabel_autogluon",
51
  "hyperparameter_tuning",
52
  "perform_cross_validation",
53
  "train_ensemble_models",
 
59
  "decompose_time_series",
60
  "forecast_arima",
61
  "forecast_prophet",
62
+ "forecast_with_autogluon",
63
+ "backtest_timeseries",
64
+ "analyze_timeseries_model",
65
  "detect_anomalies_time_series",
66
  ],
67
  "nlp": [
src/tools/auto_pipeline.py CHANGED
@@ -239,7 +239,7 @@ def auto_feature_selection(file_path: str,
239
  target_col: Target column
240
  task_type: 'classification', 'regression', or 'auto'
241
  max_features: Maximum number of features to keep
242
- method: 'mutual_info', 'f_test', or 'auto'
243
  output_path: Where to save selected features
244
 
245
  Returns:
@@ -276,6 +276,60 @@ def auto_feature_selection(file_path: str,
276
  # Perform selection
277
  n_features_to_select = min(max_features, len(numeric_features))
278
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
279
  if method == "mutual_info":
280
  if task_type == "classification":
281
  selector = SelectKBest(mutual_info_classif, k=n_features_to_select)
 
239
  target_col: Target column
240
  task_type: 'classification', 'regression', or 'auto'
241
  max_features: Maximum number of features to keep
242
+ method: 'mutual_info', 'f_test', 'boruta', or 'auto'
243
  output_path: Where to save selected features
244
 
245
  Returns:
 
276
  # Perform selection
277
  n_features_to_select = min(max_features, len(numeric_features))
278
 
279
+ if method == "boruta":
280
+ # BorutaPy - all-relevant feature selection
281
+ try:
282
+ from boruta import BorutaPy
283
+ from sklearn.ensemble import RandomForestClassifier, RandomForestRegressor
284
+
285
+ print("🔍 Running BorutaPy all-relevant feature selection...")
286
+
287
+ if task_type == "classification":
288
+ rf = RandomForestClassifier(n_jobs=-1, max_depth=5, random_state=42)
289
+ else:
290
+ rf = RandomForestRegressor(n_jobs=-1, max_depth=5, random_state=42)
291
+
292
+ boruta_selector = BorutaPy(
293
+ rf,
294
+ n_estimators='auto',
295
+ max_iter=100,
296
+ random_state=42,
297
+ verbose=0
298
+ )
299
+
300
+ X_filled = X_numeric.fillna(0).values
301
+ boruta_selector.fit(X_filled, y.values if hasattr(y, 'values') else y)
302
+
303
+ # Get selected features
304
+ selected_mask = boruta_selector.support_
305
+ selected_features = np.array(numeric_features)[selected_mask].tolist()
306
+
307
+ # Get ranking
308
+ feature_scores = dict(zip(numeric_features, boruta_selector.ranking_.tolist()))
309
+ sorted_features = sorted(feature_scores.items(), key=lambda x: x[1])
310
+
311
+ results = {
312
+ "n_features_original": len(numeric_features),
313
+ "n_features_selected": len(selected_features),
314
+ "selected_features": selected_features,
315
+ "feature_rankings": dict(sorted_features),
316
+ "tentative_features": np.array(numeric_features)[boruta_selector.support_weak_].tolist(),
317
+ "selection_method": "boruta",
318
+ "task_type": task_type
319
+ }
320
+
321
+ # Save selected features + target
322
+ if output_path:
323
+ df_selected = df[selected_features + [target_col]]
324
+ df_selected.to_csv(output_path, index=False)
325
+ results["output_path"] = output_path
326
+
327
+ return results
328
+
329
+ except ImportError:
330
+ print("⚠️ boruta not installed. Falling back to mutual_info. Install with: pip install boruta>=0.3")
331
+ method = "mutual_info" if task_type == "classification" else "f_test"
332
+
333
  if method == "mutual_info":
334
  if task_type == "classification":
335
  selector = SelectKBest(mutual_info_classif, k=n_features_to_select)
src/tools/autogluon_training.py ADDED
@@ -0,0 +1,1480 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ """
2
+ AutoGluon-Powered Training Tools
3
+ Replaces manual model training with AutoGluon's automated ML for better accuracy,
4
+ automatic ensembling, and built-in handling of raw data (no pre-encoding needed).
5
+
6
+ Supports:
7
+ - Classification (binary + multiclass)
8
+ - Regression
9
+ - Time Series Forecasting (NEW capability)
10
+
11
+ Scalability safeguards:
12
+ - time_limit prevents runaway training
13
+ - presets control compute budget
14
+ - num_cpus capped to avoid hogging shared resources
15
+ - Memory-aware: excludes heavy models on limited RAM
16
+ """
17
+
18
+ import os
19
+ import json
20
+ import time
21
+ import shutil
22
+ import warnings
23
+ from typing import Dict, Any, Optional, List
24
+ from pathlib import Path
25
+
26
+ import pandas as pd
27
+ import numpy as np
28
+
29
+ warnings.filterwarnings('ignore')
30
+
31
+ # Lazy import AutoGluon to avoid slow startup
32
+ AUTOGLUON_TABULAR_AVAILABLE = False
33
+ AUTOGLUON_TIMESERIES_AVAILABLE = False
34
+
35
+ def _ensure_autogluon_tabular():
36
+ global AUTOGLUON_TABULAR_AVAILABLE
37
+ try:
38
+ from autogluon.tabular import TabularPredictor, TabularDataset
39
+ AUTOGLUON_TABULAR_AVAILABLE = True
40
+ return TabularPredictor, TabularDataset
41
+ except ImportError:
42
+ raise ImportError(
43
+ "AutoGluon tabular not installed. Run: pip install autogluon.tabular"
44
+ )
45
+
46
+ def _ensure_autogluon_timeseries():
47
+ global AUTOGLUON_TIMESERIES_AVAILABLE
48
+ try:
49
+ from autogluon.timeseries import TimeSeriesPredictor, TimeSeriesDataFrame
50
+ AUTOGLUON_TIMESERIES_AVAILABLE = True
51
+ return TimeSeriesPredictor, TimeSeriesDataFrame
52
+ except ImportError:
53
+ raise ImportError(
54
+ "AutoGluon timeseries not installed. Run: pip install autogluon.timeseries"
55
+ )
56
+
57
+
58
+ # ============================================================
59
+ # RESOURCE CONFIGURATION
60
+ # Adapt to deployment environment (HF Spaces, local, cloud)
61
+ # ============================================================
62
+
63
+ def _get_resource_config() -> Dict[str, Any]:
64
+ """
65
+ Detect available resources and return safe training config.
66
+ Prevents AutoGluon from consuming too much memory/CPU on shared infra.
67
+ """
68
+ import psutil
69
+
70
+ total_ram_gb = psutil.virtual_memory().total / (1024 ** 3)
71
+ cpu_count = os.cpu_count() or 2
72
+
73
+ # Conservative defaults for shared environments (HF Spaces = 16GB, 2-8 vCPU)
74
+ config = {
75
+ "num_cpus": min(cpu_count, 4), # Cap at 4 to leave room for other users
76
+ "num_gpus": 0, # No GPU on free HF Spaces
77
+ }
78
+
79
+ if total_ram_gb < 8:
80
+ config["presets"] = "medium_quality"
81
+ config["excluded_model_types"] = ["NN_TORCH", "FASTAI", "KNN"]
82
+ config["time_limit"] = 60
83
+ elif total_ram_gb < 16:
84
+ config["presets"] = "medium_quality"
85
+ config["excluded_model_types"] = ["NN_TORCH", "FASTAI"]
86
+ config["time_limit"] = 120
87
+ else:
88
+ config["presets"] = "best_quality"
89
+ config["excluded_model_types"] = ["NN_TORCH"] # Still skip neural nets for speed
90
+ config["time_limit"] = 180
91
+
92
+ return config
93
+
94
+
95
+ # ============================================================
96
+ # TABULAR: Classification + Regression
97
+ # ============================================================
98
+
99
def train_with_autogluon(
    file_path: str,
    target_col: str,
    task_type: str = "auto",
    time_limit: int = 120,
    presets: str = "medium_quality",
    eval_metric: Optional[str] = None,
    output_dir: Optional[str] = None,
    infer_limit: Optional[float] = None
) -> Dict[str, Any]:
    """
    Train ML models using AutoGluon's automated approach.

    Handles raw data directly — no need to pre-encode categoricals or impute
    missing values. Automatically trains multiple models, performs stacking,
    and returns the best ensemble.

    Supports: classification (binary/multiclass), regression.

    Args:
        file_path: Path to CSV/Parquet dataset
        target_col: Column to predict
        task_type: 'classification', 'regression', or 'auto' (auto-detected)
        time_limit: Max training time in seconds (default 120 = 2 minutes)
        presets: Quality preset - 'medium_quality' (fast), 'best_quality'
            (slower, better), 'good_quality' (balanced)
        eval_metric: Metric to optimize (auto-selected if None).
            Classification: 'accuracy', 'f1', 'roc_auc', 'log_loss'
            Regression: 'rmse', 'mae', 'r2', 'mape'
        output_dir: Where to save trained model (default: ./outputs/autogluon_model)
        infer_limit: Optional max inference time per row (seconds), passed to fit()

    Returns:
        Dictionary with training results, leaderboard, best model info, and
        feature importance; {"status": "error", "message": ...} on failure.
    """
    TabularPredictor, TabularDataset = _ensure_autogluon_tabular()

    start_time = time.time()
    output_dir = output_dir or "./outputs/autogluon_model"

    # ── Validate input ──
    if not Path(file_path).exists():
        return {"status": "error", "message": f"File not found: {file_path}"}

    # ── Load data ──
    print(f"\n🚀 AutoGluon Training Starting...")
    print(f"   📁 Dataset: {file_path}")
    print(f"   🎯 Target: {target_col}")
    print(f"   ⏱️  Time limit: {time_limit}s")
    print(f"   📊 Presets: {presets}")

    try:
        train_data = TabularDataset(file_path)
    except Exception as e:
        return {"status": "error", "message": f"Failed to load data: {str(e)}"}

    if target_col not in train_data.columns:
        return {
            "status": "error",
            "message": f"Target column '{target_col}' not found. Available: {list(train_data.columns)}"
        }

    n_rows, n_cols = train_data.shape
    print(f"   📐 Shape: {n_rows:,} rows × {n_cols} columns")

    # ── Get resource-aware config ──
    resource_config = _get_resource_config()

    # User overrides take priority, but never exceed the resource budget
    effective_time_limit = min(time_limit, resource_config["time_limit"])
    effective_presets = presets

    # ── Resolve task type and its AutoGluon problem_type ──
    n_unique = train_data[target_col].nunique()
    if task_type == "auto":
        if n_unique <= 20 or train_data[target_col].dtype == 'object':
            task_type = "classification"
        else:
            task_type = "regression"

    # FIX: AutoGluon's problem_type only accepts 'binary'/'multiclass'/
    # 'regression' — never 'classification'. Resolve the detail here for both
    # auto-detected AND explicitly-passed classification tasks (previously an
    # explicit task_type='classification' was forwarded verbatim and rejected).
    if task_type == "classification":
        task_type_detail = "binary" if n_unique == 2 else "multiclass"
    elif task_type == "regression":
        task_type_detail = "regression"
    else:
        task_type_detail = task_type

    # ── Select eval metric ──
    if eval_metric is None:
        if task_type == "classification":
            eval_metric = "f1_weighted" if task_type_detail == "multiclass" else "f1"
        else:
            eval_metric = "root_mean_squared_error"

    print(f"   🔍 Task type: {task_type_detail}")
    print(f"   📏 Eval metric: {eval_metric}")
    print(f"   🔧 Excluded models: {resource_config.get('excluded_model_types', [])}")

    # ── Clean output directory (AutoGluon needs fresh dir) ──
    if Path(output_dir).exists():
        shutil.rmtree(output_dir, ignore_errors=True)

    # ── Train ──
    try:
        predictor = TabularPredictor(
            label=target_col,
            eval_metric=eval_metric,
            path=output_dir,
            # Pass the resolved detail; None lets AutoGluon infer on its own.
            problem_type=task_type_detail if task_type_detail in ("binary", "multiclass", "regression") else None
        )

        fit_kwargs = dict(
            train_data=train_data,
            time_limit=effective_time_limit,
            presets=effective_presets,
            excluded_model_types=resource_config.get("excluded_model_types", []),
            num_cpus=resource_config["num_cpus"],
            num_gpus=resource_config["num_gpus"],
            verbosity=1
        )
        if infer_limit is not None:
            fit_kwargs["infer_limit"] = infer_limit

        predictor.fit(**fit_kwargs)
    except Exception as e:
        return {"status": "error", "message": f"Training failed: {str(e)}"}

    elapsed = time.time() - start_time

    # ── Extract results ──
    # FIX: AutoGluon >= 1.0 removed the 'silent' kwarg from leaderboard();
    # fall back to the bare call so newer versions don't raise TypeError.
    try:
        leaderboard = predictor.leaderboard(silent=True)
    except TypeError:
        leaderboard = predictor.leaderboard()

    # Convert leaderboard to serializable format
    leaderboard_data = []
    for _, row in leaderboard.head(10).iterrows():
        entry = {
            "model": str(row.get("model", "")),
            "score_val": round(float(row.get("score_val", 0)), 4),
            "fit_time": round(float(row.get("fit_time", 0)), 1),
            "pred_time_val": round(float(row.get("pred_time_val", 0)), 3),
        }
        if "stack_level" in row:
            entry["stack_level"] = int(row["stack_level"])
        leaderboard_data.append(entry)

    # Best model info
    best_model = predictor.model_best
    best_score = float(leaderboard.iloc[0]["score_val"]) if len(leaderboard) > 0 else None

    # Feature importance (top 20)
    feature_importance_data = []
    try:
        try:
            fi = predictor.feature_importance(train_data, silent=True)
        except TypeError:
            # Same 'silent' kwarg removal as leaderboard() on AutoGluon >= 1.0
            fi = predictor.feature_importance(train_data)
        for feat, row in fi.head(20).iterrows():
            feature_importance_data.append({
                "feature": str(feat),
                "importance": round(float(row.get("importance", 0)), 4),
                "p_value": round(float(row.get("p_value", 1)), 4) if "p_value" in row else None
            })
    except Exception:
        # feature_importance can fail on some model types
        pass

    # Model count
    n_models = len(leaderboard)

    # Summary
    results = {
        "status": "success",
        "task_type": task_type_detail,
        "eval_metric": eval_metric,
        "best_model": best_model,
        "best_score": best_score,
        "n_models_trained": n_models,
        "n_rows": n_rows,
        "n_features": n_cols - 1,
        "training_time_seconds": round(elapsed, 1),
        "time_limit_used": effective_time_limit,
        "presets": effective_presets,
        "leaderboard": leaderboard_data,
        "feature_importance": feature_importance_data,
        "model_path": output_dir,
        "output_path": output_dir,
    }

    # ── Print summary ──
    print(f"\n{'='*60}")
    print(f"✅ AUTOGLUON TRAINING COMPLETE")
    print(f"{'='*60}")
    print(f"📊 Models trained: {n_models}")
    print(f"🏆 Best model: {best_model}")
    # FIX: was `print(...) if best_score else ""`, which silently skipped the
    # line for a legitimate score of exactly 0.0.
    if best_score is not None:
        print(f"📈 Best {eval_metric}: {best_score:.4f}")
    print(f"⏱️  Total time: {elapsed:.1f}s")
    print(f"💾 Model saved: {output_dir}")
    if leaderboard_data:
        print(f"\n📋 Top 5 Leaderboard:")
        for i, entry in enumerate(leaderboard_data[:5], 1):
            print(f"   {i}. {entry['model']}: {entry['score_val']:.4f} (fit: {entry['fit_time']:.1f}s)")
    if feature_importance_data:
        print(f"\n🔑 Top 5 Features:")
        for fi_entry in feature_importance_data[:5]:
            print(f"   • {fi_entry['feature']}: {fi_entry['importance']:.4f}")
    print(f"{'='*60}\n")

    return results
302
+
303
+
304
def predict_with_autogluon(
    model_path: str,
    data_path: str,
    output_path: Optional[str] = None
) -> Dict[str, Any]:
    """
    Make predictions using a trained AutoGluon model.

    Args:
        model_path: Path to saved AutoGluon model directory
        data_path: Path to new data for prediction
        output_path: Path to save predictions CSV (optional)

    Returns:
        Dictionary with predictions and metadata, or an error dict if the
        model/data paths are missing or prediction fails.
    """
    TabularPredictor, TabularDataset = _ensure_autogluon_tabular()

    # Guard clauses: both paths must exist before touching AutoGluon.
    for path, label in ((model_path, "Model"), (data_path, "Data")):
        if not Path(path).exists():
            return {"status": "error", "message": f"{label} not found: {path}"}

    try:
        predictor = TabularPredictor.load(model_path)
        test_data = TabularDataset(data_path)
        predictions = predictor.predict(test_data)

        # Persist input rows alongside their predictions.
        destination = output_path or "./outputs/autogluon_predictions.csv"
        Path(destination).parent.mkdir(parents=True, exist_ok=True)
        annotated = test_data.copy()
        annotated["prediction"] = predictions.values
        annotated.to_csv(destination, index=False)

        # Class probabilities are only available for classification models;
        # best-effort, silently omitted otherwise.
        probabilities = None
        try:
            proba = predictor.predict_proba(test_data)
            probabilities = {
                "columns": list(proba.columns),
                "sample": proba.head(5).to_dict()
            }
        except Exception:
            pass

        return {
            "status": "success",
            "n_predictions": len(predictions),
            "prediction_sample": predictions.head(10).tolist(),
            "output_path": destination,
            "model_used": predictor.model_best,
            "probabilities": probabilities
        }
    except Exception as e:
        return {"status": "error", "message": f"Prediction failed: {str(e)}"}
361
+
362
+
363
+ # ============================================================
364
+ # TIME SERIES FORECASTING
365
+ # ============================================================
366
+
367
+ def forecast_with_autogluon(
368
+ file_path: str,
369
+ target_col: str,
370
+ time_col: str,
371
+ forecast_horizon: int = 30,
372
+ id_col: Optional[str] = None,
373
+ freq: Optional[str] = None,
374
+ time_limit: int = 120,
375
+ presets: str = "medium_quality",
376
+ output_path: Optional[str] = None,
377
+ static_features_path: Optional[str] = None,
378
+ known_covariates_cols: Optional[List[str]] = None,
379
+ holiday_country: Optional[str] = None,
380
+ fill_missing: bool = True,
381
+ models: Optional[List[str]] = None,
382
+ quantile_levels: Optional[List[float]] = None
383
+ ) -> Dict[str, Any]:
384
+ """
385
+ Forecast time series using AutoGluon's TimeSeriesPredictor.
386
+
387
+ Supports multiple forecasting models automatically: DeepAR, ETS, ARIMA, Theta,
388
+ Chronos (foundation model), and statistical ensembles.
389
+ Enhanced with covariates, holiday features, model selection, and quantile forecasting.
390
+
391
+ Args:
392
+ file_path: Path to time series CSV/Parquet
393
+ target_col: Column with values to forecast
394
+ time_col: Column with timestamps/dates
395
+ forecast_horizon: Number of future periods to predict
396
+ id_col: Column identifying different series (for multi-series)
397
+ freq: Frequency string ('D'=daily, 'h'=hourly, 'MS'=monthly, 'W'=weekly)
398
+ time_limit: Max training time in seconds
399
+ presets: 'fast_training', 'medium_quality', 'best_quality', or 'chronos_tiny'
400
+ output_path: Path to save forecast CSV
401
+ static_features_path: CSV with per-series metadata (one row per series)
402
+ known_covariates_cols: Columns with future-known values (holidays, promotions)
403
+ holiday_country: Country code for auto holiday features (e.g. 'US', 'UK', 'IN')
404
+ fill_missing: Whether to auto-fill missing values in time series
405
+ models: Specific models to train (e.g. ['ETS', 'DeepAR', 'AutoARIMA'])
406
+ quantile_levels: Quantile levels for probabilistic forecasts (e.g. [0.1, 0.5, 0.9])
407
+
408
+ Returns:
409
+ Dictionary with forecasts, model performance, and leaderboard
410
+ """
411
+ TimeSeriesPredictor, TimeSeriesDataFrame = _ensure_autogluon_timeseries()
412
+
413
+ start_time = time.time()
414
+ output_dir = "./outputs/autogluon_ts_model"
415
+ output_path = output_path or "./outputs/autogluon_forecast.csv"
416
+
417
+ # ── Validate ──
418
+ if not Path(file_path).exists():
419
+ return {"status": "error", "message": f"File not found: {file_path}"}
420
+
421
+ print(f"\n🚀 AutoGluon Time Series Forecasting...")
422
+ print(f" 📁 Dataset: {file_path}")
423
+ print(f" 🎯 Target: {target_col}")
424
+ print(f" 📅 Time column: {time_col}")
425
+ print(f" 🔮 Forecast horizon: {forecast_horizon} periods")
426
+
427
+ # ── Load and prepare data ──
428
+ try:
429
+ df = pd.read_csv(file_path)
430
+ except Exception:
431
+ try:
432
+ df = pd.read_parquet(file_path)
433
+ except Exception as e:
434
+ return {"status": "error", "message": f"Failed to load data: {str(e)}"}
435
+
436
+ if target_col not in df.columns:
437
+ return {
438
+ "status": "error",
439
+ "message": f"Target column '{target_col}' not found. Available: {list(df.columns)}"
440
+ }
441
+ if time_col not in df.columns:
442
+ return {
443
+ "status": "error",
444
+ "message": f"Time column '{time_col}' not found. Available: {list(df.columns)}"
445
+ }
446
+
447
+ # Parse datetime
448
+ df[time_col] = pd.to_datetime(df[time_col])
449
+ df = df.sort_values(time_col)
450
+
451
+ # If no id_col, create a dummy one (single series)
452
+ if id_col is None or id_col not in df.columns:
453
+ id_col = "__series_id"
454
+ df[id_col] = "series_0"
455
+
456
+ # Auto-detect frequency if not provided
457
+ if freq is None:
458
+ time_diffs = df[time_col].diff().dropna()
459
+ median_diff = time_diffs.median()
460
+ if median_diff <= pd.Timedelta(hours=2):
461
+ freq = "h"
462
+ elif median_diff <= pd.Timedelta(days=1.5):
463
+ freq = "D"
464
+ elif median_diff <= pd.Timedelta(days=8):
465
+ freq = "W"
466
+ elif median_diff <= pd.Timedelta(days=35):
467
+ freq = "MS"
468
+ else:
469
+ freq = "D" # Default
470
+
471
+ print(f" 📊 Frequency: {freq}")
472
+ print(f" 📐 Shape: {df.shape[0]:,} rows")
473
+
474
+ # ── Add holiday features (#29) ──
475
+ if holiday_country:
476
+ try:
477
+ import holidays as holidays_lib
478
+ country_holidays = holidays_lib.country_holidays(holiday_country)
479
+ df['is_holiday'] = df[time_col].dt.date.apply(
480
+ lambda d: 1 if d in country_holidays else 0
481
+ ).astype(float)
482
+ if known_covariates_cols is None:
483
+ known_covariates_cols = []
484
+ if 'is_holiday' not in known_covariates_cols:
485
+ known_covariates_cols.append('is_holiday')
486
+ print(f" 🎄 Holiday features added for: {holiday_country}")
487
+ except ImportError:
488
+ print(f" ⚠️ 'holidays' package not installed. Skipping holiday features.")
489
+ except Exception as e:
490
+ print(f" ⚠️ Could not add holiday features: {e}")
491
+
492
+ # ── Convert to TimeSeriesDataFrame ──
493
+ try:
494
+ ts_df = TimeSeriesDataFrame.from_data_frame(
495
+ df,
496
+ id_column=id_col,
497
+ timestamp_column=time_col
498
+ )
499
+ except Exception as e:
500
+ return {"status": "error", "message": f"Failed to create time series: {str(e)}"}
501
+
502
+ # ── Attach static features (#26) ──
503
+ if static_features_path and Path(static_features_path).exists():
504
+ try:
505
+ static_df = pd.read_csv(static_features_path)
506
+ ts_df.static_features = static_df
507
+ print(f" 📌 Static features loaded: {list(static_df.columns)}")
508
+ except Exception as e:
509
+ print(f" ⚠️ Could not load static features: {e}")
510
+
511
+ # ── Fill missing values (#36) ──
512
+ if fill_missing:
513
+ try:
514
+ ts_df = ts_df.fill_missing_values()
515
+ print(f" 🔧 Missing values filled")
516
+ except Exception:
517
+ pass
518
+
519
+ # ── Clean output dir ──
520
+ if Path(output_dir).exists():
521
+ shutil.rmtree(output_dir, ignore_errors=True)
522
+
523
+ # ── Get resource config ──
524
+ resource_config = _get_resource_config()
525
+ effective_time_limit = min(time_limit, resource_config["time_limit"])
526
+
527
+ # ── Train forecasting models ──
528
+ try:
529
+ predictor_kwargs = dict(
530
+ target=target_col,
531
+ prediction_length=forecast_horizon,
532
+ path=output_dir,
533
+ freq=freq
534
+ )
535
+ if known_covariates_cols:
536
+ predictor_kwargs["known_covariates_names"] = known_covariates_cols
537
+ if quantile_levels:
538
+ predictor_kwargs["quantile_levels"] = quantile_levels
539
+
540
+ predictor = TimeSeriesPredictor(**predictor_kwargs)
541
+
542
+ ts_fit_kwargs = dict(
543
+ train_data=ts_df,
544
+ time_limit=effective_time_limit,
545
+ presets=presets,
546
+ )
547
+ if models:
548
+ ts_fit_kwargs["hyperparameters"] = {m: {} for m in models}
549
+
550
+ predictor.fit(**ts_fit_kwargs)
551
+ except Exception as e:
552
+ return {"status": "error", "message": f"Time series training failed: {str(e)}"}
553
+
554
+ elapsed = time.time() - start_time
555
+
556
+ # ── Generate forecasts ──
557
+ try:
558
+ predict_kwargs = {}
559
+ if known_covariates_cols:
560
+ try:
561
+ future_known = predictor.make_future_data_frame(ts_df)
562
+ if holiday_country:
563
+ import holidays as holidays_lib
564
+ country_holidays = holidays_lib.country_holidays(holiday_country)
565
+ dates = future_known.index.get_level_values('timestamp')
566
+ future_known['is_holiday'] = [
567
+ 1.0 if d.date() in country_holidays else 0.0 for d in dates
568
+ ]
569
+ predict_kwargs["known_covariates"] = future_known
570
+ except Exception:
571
+ pass
572
+ forecasts = predictor.predict(ts_df, **predict_kwargs)
573
+ except Exception as e:
574
+ return {"status": "error", "message": f"Forecasting failed: {str(e)}"}
575
+
576
+ # ── Leaderboard ──
577
+ leaderboard = predictor.leaderboard(silent=True)
578
+ leaderboard_data = []
579
+ for _, row in leaderboard.head(10).iterrows():
580
+ leaderboard_data.append({
581
+ "model": str(row.get("model", "")),
582
+ "score_val": round(float(row.get("score_val", 0)), 4),
583
+ "fit_time": round(float(row.get("fit_time", 0)), 1),
584
+ })
585
+
586
+ best_model = predictor.model_best if hasattr(predictor, 'model_best') else leaderboard_data[0]["model"] if leaderboard_data else "unknown"
587
+ best_score = leaderboard_data[0]["score_val"] if leaderboard_data else None
588
+
589
+ # ── Save forecasts ──
590
+ Path(output_path).parent.mkdir(parents=True, exist_ok=True)
591
+ try:
592
+ forecast_df = forecasts.reset_index()
593
+ forecast_df.to_csv(output_path, index=False)
594
+ except Exception:
595
+ output_path = output_path # Keep path but note it may not have saved
596
+
597
+ # ── Forecast summary ──
598
+ forecast_summary = {}
599
+ try:
600
+ mean_col = "mean" if "mean" in forecasts.columns else forecasts.columns[0]
601
+ forecast_values = forecasts[mean_col].values
602
+ forecast_summary = {
603
+ "mean_forecast": round(float(np.mean(forecast_values)), 2),
604
+ "min_forecast": round(float(np.min(forecast_values)), 2),
605
+ "max_forecast": round(float(np.max(forecast_values)), 2),
606
+ "forecast_std": round(float(np.std(forecast_values)), 2),
607
+ }
608
+ except Exception:
609
+ pass
610
+
611
+ results = {
612
+ "status": "success",
613
+ "task_type": "time_series_forecasting",
614
+ "target_col": target_col,
615
+ "time_col": time_col,
616
+ "forecast_horizon": forecast_horizon,
617
+ "frequency": freq,
618
+ "n_series": df[id_col].nunique() if id_col != "__series_id" else 1,
619
+ "n_data_points": len(df),
620
+ "best_model": best_model,
621
+ "best_score": best_score,
622
+ "n_models_trained": len(leaderboard),
623
+ "training_time_seconds": round(elapsed, 1),
624
+ "leaderboard": leaderboard_data,
625
+ "forecast_summary": forecast_summary,
626
+ "output_path": output_path,
627
+ "model_path": output_dir,
628
+ }
629
+
630
+ # ── Print summary ──
631
+ print(f"\n{'='*60}")
632
+ print(f"✅ TIME SERIES FORECASTING COMPLETE")
633
+ print(f"{'='*60}")
634
+ print(f"📊 Models trained: {len(leaderboard)}")
635
+ print(f"🏆 Best model: {best_model}")
636
+ print(f"📈 Best score: {best_score}")
637
+ print(f"🔮 Forecast: {forecast_horizon} periods ahead")
638
+ if forecast_summary:
639
+ print(f"📉 Forecast range: {forecast_summary.get('min_forecast')} to {forecast_summary.get('max_forecast')}")
640
+ print(f"⏱️ Total time: {elapsed:.1f}s")
641
+ print(f"💾 Forecasts saved: {output_path}")
642
+ if leaderboard_data:
643
+ print(f"\n📋 Leaderboard:")
644
+ for i, entry in enumerate(leaderboard_data[:5], 1):
645
+ print(f" {i}. {entry['model']}: {entry['score_val']:.4f}")
646
+ print(f"{'='*60}\n")
647
+
648
+ return results
649
+
650
+
651
+ # ============================================================
652
+ # POST-TRAINING OPTIMIZATION (#1, #2, #6, #8, #9, #24)
653
+ # ============================================================
654
+
655
def optimize_autogluon_model(
    model_path: str,
    operation: str,
    data_path: Optional[str] = None,
    metric: Optional[str] = None,
    models_to_delete: Optional[List[str]] = None,
    output_dir: Optional[str] = None
) -> Dict[str, Any]:
    """
    Post-training optimization on a trained AutoGluon tabular model.

    Operations:
    - refit_full: Re-train best models on 100% data (no held-out fold) for deployment
    - distill: Compress ensemble into a single lighter model via knowledge distillation
    - calibrate_threshold: Optimize binary classification threshold for best F1/precision/recall
    - deploy_optimize: Strip training artifacts for minimal deployment footprint
    - delete_models: Remove specific models to free resources

    Args:
        model_path: Path to saved AutoGluon model directory
        operation: One of 'refit_full', 'distill', 'calibrate_threshold',
            'deploy_optimize', 'delete_models'
        data_path: Path to dataset (required for distill, calibrate_threshold)
        metric: Metric to optimize for calibrate_threshold: 'f1',
            'balanced_accuracy', 'precision', 'recall'
        models_to_delete: List of model names to delete (for delete_models operation)
        output_dir: Directory for optimized model output (for deploy_optimize)

    Returns:
        Dictionary with optimization results. Never raises: every failure is
        reported as {"status": "error", "message": ...} so tool callers get a
        structured response.
    """
    TabularPredictor, TabularDataset = _ensure_autogluon_tabular()

    if not Path(model_path).exists():
        return {"status": "error", "message": f"Model not found: {model_path}"}

    try:
        predictor = TabularPredictor.load(model_path)
    except Exception as e:
        return {"status": "error", "message": f"Failed to load model: {str(e)}"}

    print(f"\n🔧 AutoGluon Model Optimization: {operation}")
    print(f" 📁 Model: {model_path}")

    try:
        if operation == "refit_full":
            # refit_full() returns {original_model_name: refit_model_name};
            # the refit variants are trained on train+val with no held-out fold.
            refit_map = predictor.refit_full()
            refit_models = list(refit_map.values())
            new_leaderboard = predictor.leaderboard(silent=True)

            leaderboard_data = []
            for _, row in new_leaderboard.head(10).iterrows():
                leaderboard_data.append({
                    "model": str(row.get("model", "")),
                    "score_val": round(float(row.get("score_val", 0)), 4),
                })

            print(f" ✅ Models refit on 100% data: {refit_models}")
            return {
                "status": "success",
                "operation": "refit_full",
                "message": "Models re-trained on 100% data (no held-out folds) for deployment",
                "refit_models": refit_models,
                "original_best": predictor.model_best,
                "leaderboard": leaderboard_data,
                "model_path": model_path
            }

        elif operation == "distill":
            if not data_path or not Path(data_path).exists():
                return {"status": "error", "message": "data_path required for distillation"}

            train_data = TabularDataset(data_path)
            resource_config = _get_resource_config()

            # 'spunge' augmentation generates extra pseudo-data so the student
            # model can better mimic the teacher ensemble.
            distilled = predictor.distill(
                train_data=train_data,
                time_limit=resource_config["time_limit"],
                augment_method='spunge'
            )

            new_leaderboard = predictor.leaderboard(silent=True)
            leaderboard_data = []
            for _, row in new_leaderboard.head(10).iterrows():
                leaderboard_data.append({
                    "model": str(row.get("model", "")),
                    "score_val": round(float(row.get("score_val", 0)), 4),
                })

            print(f" ✅ Ensemble distilled into: {distilled}")
            return {
                "status": "success",
                "operation": "distill",
                "message": "Ensemble distilled into lighter model(s) via knowledge distillation",
                "distilled_models": distilled,
                "best_model": predictor.model_best,
                "leaderboard": leaderboard_data,
                "model_path": model_path
            }

        elif operation == "calibrate_threshold":
            if not data_path or not Path(data_path).exists():
                return {"status": "error", "message": "data_path required for threshold calibration"}

            if predictor.problem_type != 'binary':
                return {"status": "error", "message": "Threshold calibration only works for binary classification"}

            test_data = TabularDataset(data_path)
            metric = metric or "f1"

            # BUG FIX: TabularPredictor.calibrate_decision_threshold() returns
            # a single float (the optimal threshold), NOT a (threshold, score)
            # tuple — the previous tuple-unpack raised TypeError on every call
            # and was masked by the catch-all below. Accept a tuple too, in
            # case an older/forked API provides one.
            result = predictor.calibrate_decision_threshold(
                data=test_data,
                metric=metric
            )
            if isinstance(result, tuple):
                threshold, score = float(result[0]), float(result[1])
            else:
                threshold = float(result)
                # Score the calibrated threshold on the same data so the
                # reported number reflects the optimized metric.
                try:
                    scores = predictor.evaluate(test_data, decision_threshold=threshold)
                    score = float(scores.get(metric, 0.0))
                except Exception:
                    score = 0.0

            print(f" ✅ Optimal threshold: {threshold:.4f} ({metric}={score:.4f})")
            return {
                "status": "success",
                "operation": "calibrate_threshold",
                "optimal_threshold": round(float(threshold), 4),
                "score_at_threshold": round(float(score), 4),
                "metric": metric,
                "message": f"Optimal threshold: {threshold:.4f} (default was 0.5), {metric}={score:.4f}",
                "model_path": model_path
            }

        elif operation == "deploy_optimize":
            output_dir = output_dir or model_path + "_deploy"

            # Measure on-disk footprint before/after to report the reduction.
            size_before = sum(
                f.stat().st_size for f in Path(model_path).rglob('*') if f.is_file()
            ) / (1024 * 1024)

            deploy_path = predictor.clone_for_deployment(output_dir)

            # save_space() drops training artifacts (OOF predictions, unused
            # model files) from the cloned copy only.
            deploy_predictor = TabularPredictor.load(deploy_path)
            deploy_predictor.save_space()

            size_after = sum(
                f.stat().st_size for f in Path(deploy_path).rglob('*') if f.is_file()
            ) / (1024 * 1024)

            print(f" ✅ Optimized: {size_before:.1f}MB → {size_after:.1f}MB")
            return {
                "status": "success",
                "operation": "deploy_optimize",
                "message": f"Model optimized for deployment: {size_before:.1f}MB → {size_after:.1f}MB ({(1-size_after/max(size_before,0.01))*100:.0f}% reduction)",
                "size_before_mb": round(size_before, 1),
                "size_after_mb": round(size_after, 1),
                "deploy_path": str(deploy_path),
                "best_model": deploy_predictor.model_best
            }

        elif operation == "delete_models":
            if not models_to_delete:
                return {"status": "error", "message": "models_to_delete list required"}

            before_count = len(predictor.model_names())
            predictor.delete_models(models_to_delete=models_to_delete, dry_run=False)
            after_count = len(predictor.model_names())

            print(f" ✅ Deleted {before_count - after_count} models")
            return {
                "status": "success",
                "operation": "delete_models",
                "message": f"Deleted {before_count - after_count} models ({before_count} → {after_count})",
                "remaining_models": predictor.model_names(),
                "best_model": predictor.model_best,
                "model_path": model_path
            }

        else:
            return {
                "status": "error",
                "message": f"Unknown operation '{operation}'. Choose: refit_full, distill, calibrate_threshold, deploy_optimize, delete_models"
            }

    except Exception as e:
        return {"status": "error", "message": f"Optimization failed: {str(e)}"}
832
+
833
+
834
+ # ============================================================
835
+ # MODEL ANALYSIS & INSPECTION (#19 + extended leaderboard)
836
+ # ============================================================
837
+
838
def analyze_autogluon_model(
    model_path: str,
    data_path: Optional[str] = None,
    operation: str = "summary"
) -> Dict[str, Any]:
    """
    Inspect and analyze a trained AutoGluon model.

    Operations:
    - summary: Extended leaderboard with detailed model info (stack levels, memory, etc.)
    - transform_features: Returns the internally transformed feature matrix
    - info: Comprehensive model metadata and training summary

    Args:
        model_path: Path to saved AutoGluon model directory
        data_path: Path to dataset (required for transform_features)
        operation: One of 'summary', 'transform_features', 'info'

    Returns:
        Dictionary with analysis results; all failures are returned as
        {"status": "error", "message": ...} rather than raised.
    """
    # Lazy import so the module loads even when autogluon is absent.
    TabularPredictor, TabularDataset = _ensure_autogluon_tabular()

    if not Path(model_path).exists():
        return {"status": "error", "message": f"Model not found: {model_path}"}

    try:
        predictor = TabularPredictor.load(model_path)
    except Exception as e:
        return {"status": "error", "message": f"Failed to load model: {str(e)}"}

    try:
        if operation == "summary":
            # extra_info=True adds columns like stack level, memory size,
            # inference time per model.
            leaderboard = predictor.leaderboard(extra_info=True, silent=True)

            # Serialize every leaderboard cell defensively: numeric values are
            # rounded, anything non-numeric (lists, dicts, NaNs that fail
            # float()) falls back to str() so the result stays JSON-safe.
            leaderboard_data = []
            for _, row in leaderboard.iterrows():
                entry = {"model": str(row.get("model", ""))}
                for col in leaderboard.columns:
                    if col != "model":
                        val = row[col]
                        try:
                            entry[str(col)] = round(float(val), 4) if isinstance(val, (int, float, np.floating)) else str(val)
                        except (ValueError, TypeError):
                            entry[str(col)] = str(val)
                leaderboard_data.append(entry)

            return {
                "status": "success",
                "operation": "summary",
                "best_model": predictor.model_best,
                "problem_type": predictor.problem_type,
                "eval_metric": str(predictor.eval_metric),
                "n_models": len(leaderboard),
                "model_names": predictor.model_names(),
                "leaderboard": leaderboard_data
            }

        elif operation == "transform_features":
            if not data_path or not Path(data_path).exists():
                return {"status": "error", "message": "data_path required for transform_features"}

            data = TabularDataset(data_path)
            # Applies the predictor's internal feature-engineering pipeline
            # (the exact features the models were trained on).
            transformed = predictor.transform_features(data)

            output_path = "./outputs/autogluon_transformed_features.csv"
            Path(output_path).parent.mkdir(parents=True, exist_ok=True)
            transformed.to_csv(output_path, index=False)

            # Column lists are truncated (20/30) to keep the response small.
            return {
                "status": "success",
                "operation": "transform_features",
                "original_shape": list(data.shape),
                "transformed_shape": list(transformed.shape),
                "original_columns": list(data.columns[:20]),
                "transformed_columns": list(transformed.columns[:30]),
                "output_path": output_path,
                "message": f"Features transformed: {data.shape[1]} original → {transformed.shape[1]} engineered"
            }

        elif operation == "info":
            info = predictor.info()

            # predictor.info() may contain non-JSON-serializable objects;
            # probe each value with json.dumps and stringify the rest.
            safe_info = {}
            for key, val in info.items():
                try:
                    json.dumps(val)
                    safe_info[key] = val
                except (TypeError, ValueError):
                    safe_info[key] = str(val)

            return {
                "status": "success",
                "operation": "info",
                "model_info": safe_info
            }

        else:
            return {
                "status": "error",
                "message": f"Unknown operation '{operation}'. Choose: summary, transform_features, info"
            }

    except Exception as e:
        return {"status": "error", "message": f"Analysis failed: {str(e)}"}
943
+
944
+
945
+ # ============================================================
946
+ # INCREMENTAL TRAINING (#3, #5)
947
+ # ============================================================
948
+
949
def extend_autogluon_training(
    model_path: str,
    operation: str = "fit_extra",
    data_path: Optional[str] = None,
    time_limit: int = 60,
    hyperparameters: Optional[Dict] = None
) -> Dict[str, Any]:
    """
    Add models or re-fit the ensemble on an existing AutoGluon predictor.

    Operations:
    - fit_extra: Train additional models/hyperparameters without retraining from scratch
    - fit_weighted_ensemble: Re-fit the weighted ensemble layer on existing base models

    Args:
        model_path: Path to saved AutoGluon model directory
        operation: 'fit_extra' or 'fit_weighted_ensemble'
        data_path: Path to training data (required for fit_extra)
        time_limit: Additional training time in seconds
        hyperparameters: Model hyperparameters dict for fit_extra,
            e.g. {"GBM": {"num_boost_round": 500}, "RF": {}}

    Returns:
        Dictionary describing the updated model, or a
        {"status": "error", "message": ...} dict on failure.
    """
    TabularPredictor, TabularDataset = _ensure_autogluon_tabular()

    # Guard clauses: validate the model directory and load the predictor.
    if not Path(model_path).exists():
        return {"status": "error", "message": f"Model not found: {model_path}"}

    try:
        predictor = TabularPredictor.load(model_path)
    except Exception as e:
        return {"status": "error", "message": f"Failed to load model: {str(e)}"}

    # Snapshot the model roster so newly added models can be diffed later.
    models_prior = predictor.model_names()
    print(f"\n🔧 Extending AutoGluon Model: {operation}")
    print(f" 📁 Model: {model_path}")
    print(f" 📊 Current models: {len(models_prior)}")

    try:
        if operation == "fit_extra":
            if not data_path or not Path(data_path).exists():
                return {"status": "error", "message": "data_path required for fit_extra"}

            resource_config = _get_resource_config()

            # Default portfolio: two LightGBM variants plus two Random Forest
            # criteria, used only when the caller supplies no hyperparameters.
            default_portfolio = {
                "GBM": [
                    {"extra_trees": True, "ag_args": {"name_suffix": "XT"}},
                    {"num_boost_round": 500},
                ],
                "RF": [
                    {"criterion": "gini", "ag_args": {"name_suffix": "Gini"}},
                    {"criterion": "entropy", "ag_args": {"name_suffix": "Entr"}},
                ],
            }
            chosen_hp = hyperparameters if hyperparameters else default_portfolio

            predictor.fit_extra(
                hyperparameters=chosen_hp,
                time_limit=min(time_limit, resource_config["time_limit"]),
                num_cpus=resource_config["num_cpus"],
                num_gpus=0
            )

        elif operation == "fit_weighted_ensemble":
            # Re-fits only the ensemble layer over the existing base models.
            predictor.fit_weighted_ensemble()

        else:
            return {
                "status": "error",
                "message": f"Unknown operation '{operation}'. Choose: fit_extra, fit_weighted_ensemble"
            }

        models_now = predictor.model_names()
        leaderboard = predictor.leaderboard(silent=True)

        # Summarize the top 10 models as JSON-friendly rows.
        leaderboard_data = [
            {
                "model": str(row.get("model", "")),
                "score_val": round(float(row.get("score_val", 0)), 4),
                "fit_time": round(float(row.get("fit_time", 0)), 1),
            }
            for _, row in leaderboard.head(10).iterrows()
        ]

        added_models = [name for name in models_now if name not in models_prior]

        print(f" ✅ New models added: {len(added_models)}")
        print(f" 🏆 Best model: {predictor.model_best}")

        return {
            "status": "success",
            "operation": operation,
            "models_before": len(models_prior),
            "models_after": len(models_now),
            "new_models": added_models,
            "best_model": predictor.model_best,
            "leaderboard": leaderboard_data,
            "model_path": model_path
        }

    except Exception as e:
        return {"status": "error", "message": f"Extension failed: {str(e)}"}
1052
+
1053
+
1054
+ # ============================================================
1055
+ # MULTI-LABEL PREDICTION (#14)
1056
+ # ============================================================
1057
+
1058
def train_multilabel_autogluon(
    file_path: str,
    target_cols: List[str],
    time_limit: int = 120,
    presets: str = "medium_quality",
    output_dir: Optional[str] = None
) -> Dict[str, Any]:
    """
    Train multi-label prediction using AutoGluon's MultilabelPredictor.

    Predicts several target columns at once by fitting one TabularPredictor
    per label with shared feature engineering.

    Args:
        file_path: Path to CSV/Parquet dataset
        target_cols: List of columns to predict (e.g. ['label1', 'label2', 'label3'])
        time_limit: Max training time per label in seconds
        presets: Quality preset
        output_dir: Where to save trained model

    Returns:
        Dictionary with per-label results and overall performance, or a
        {"status": "error", "message": ...} dict on failure.
    """
    # MultilabelPredictor is an optional component; fail gracefully if the
    # installed autogluon build does not ship it.
    try:
        from autogluon.tabular import TabularDataset, MultilabelPredictor
    except ImportError:
        return {
            "status": "error",
            "message": "MultilabelPredictor not available. Ensure autogluon.tabular>=1.2 is installed."
        }

    started = time.time()
    output_dir = output_dir or "./outputs/autogluon_multilabel"

    if not Path(file_path).exists():
        return {"status": "error", "message": f"File not found: {file_path}"}

    try:
        dataset = TabularDataset(file_path)
    except Exception as e:
        return {"status": "error", "message": f"Failed to load data: {str(e)}"}

    # Verify every requested label exists before spending any training time.
    absent = [col for col in target_cols if col not in dataset.columns]
    if absent:
        return {
            "status": "error",
            "message": f"Target columns not found: {absent}. Available: {list(dataset.columns)}"
        }

    print(f"\n🚀 AutoGluon Multi-Label Training...")
    print(f" 📁 Dataset: {file_path}")
    print(f" 🎯 Targets: {target_cols}")
    print(f" 📐 Shape: {dataset.shape[0]:,} rows × {dataset.shape[1]} columns")

    # Cap the requested budget by what the machine can actually afford.
    resource_config = _get_resource_config()
    budget = min(time_limit, resource_config["time_limit"])

    # Start from a clean model directory to avoid stale artifacts.
    if Path(output_dir).exists():
        shutil.rmtree(output_dir, ignore_errors=True)

    try:
        multilabel = MultilabelPredictor(
            labels=target_cols,
            path=output_dir
        )
        multilabel.fit(
            train_data=dataset,
            time_limit=budget,
            presets=presets
        )
    except Exception as e:
        return {"status": "error", "message": f"Multi-label training failed: {str(e)}"}

    elapsed = time.time() - started

    # Collect the per-label sub-predictor leaderboards; any label whose
    # results cannot be read is reported individually rather than failing all.
    per_label_results = {}
    for label in target_cols:
        try:
            sub = multilabel.get_predictor(label)
            board = sub.leaderboard(silent=True)
            per_label_results[label] = {
                "best_model": sub.model_best,
                "best_score": round(float(board.iloc[0]["score_val"]), 4) if len(board) > 0 else None,
                "n_models": len(board),
                "problem_type": sub.problem_type
            }
        except Exception:
            per_label_results[label] = {"error": "Could not retrieve results"}

    print(f"\n{'='*60}")
    print(f"✅ MULTI-LABEL TRAINING COMPLETE")
    print(f"{'='*60}")
    for label, summary in per_label_results.items():
        print(f" 🎯 {label}: {summary.get('best_model', 'N/A')} (score: {summary.get('best_score', 'N/A')})")
    print(f" ⏱️ Total time: {elapsed:.1f}s")
    print(f"{'='*60}\n")

    return {
        "status": "success",
        "task_type": "multilabel",
        "n_labels": len(target_cols),
        "labels": target_cols,
        "per_label_results": per_label_results,
        "training_time_seconds": round(elapsed, 1),
        "model_path": output_dir,
        "output_path": output_dir
    }
1167
+
1168
+
1169
+ # ============================================================
1170
+ # TIME SERIES BACKTESTING (#33)
1171
+ # ============================================================
1172
+
1173
def backtest_timeseries(
    file_path: str,
    target_col: str,
    time_col: str,
    forecast_horizon: int = 30,
    id_col: Optional[str] = None,
    freq: Optional[str] = None,
    num_val_windows: int = 3,
    time_limit: int = 120,
    presets: str = "medium_quality",
    output_path: Optional[str] = None
) -> Dict[str, Any]:
    """
    Backtest time series models using multiple validation windows.

    Trains models with multi-window cross-validation for robust performance
    estimates. More reliable than a single train/test split.

    Args:
        file_path: Path to time series CSV/Parquet
        target_col: Column with values to forecast
        time_col: Column with timestamps/dates
        forecast_horizon: Periods to predict per window
        id_col: Column identifying different series
        freq: Frequency string ('D', 'h', 'W', 'MS'); auto-detected when None
        num_val_windows: Number of backtesting windows (default: 3)
        time_limit: Max training time in seconds
        presets: Quality preset
        output_path: Path to save backtest predictions CSV

    Returns:
        Dictionary with per-window evaluation and aggregate metrics; failures
        are returned as {"status": "error", "message": ...}.
    """
    # Lazy import so the module loads even when autogluon is absent.
    TimeSeriesPredictor, TimeSeriesDataFrame = _ensure_autogluon_timeseries()

    start_time = time.time()
    output_dir = "./outputs/autogluon_ts_backtest"
    output_path = output_path or "./outputs/autogluon_backtest.csv"

    if not Path(file_path).exists():
        return {"status": "error", "message": f"File not found: {file_path}"}

    print(f"\n📊 Time Series Backtesting ({num_val_windows} windows)...")
    print(f" 📁 Dataset: {file_path}")
    print(f" 🎯 Target: {target_col}")
    print(f" 🔮 Horizon: {forecast_horizon} periods × {num_val_windows} windows")

    # Load data: try CSV first, fall back to Parquet.
    try:
        df = pd.read_csv(file_path)
    except Exception:
        try:
            df = pd.read_parquet(file_path)
        except Exception as e:
            return {"status": "error", "message": f"Failed to load data: {str(e)}"}

    if target_col not in df.columns or time_col not in df.columns:
        return {"status": "error", "message": f"Columns not found. Available: {list(df.columns)}"}

    # AutoGluon requires parsed, chronologically sorted timestamps.
    df[time_col] = pd.to_datetime(df[time_col])
    df = df.sort_values(time_col)

    # Single-series datasets get a synthetic constant series id.
    if id_col is None or id_col not in df.columns:
        id_col_name = "__series_id"
        df[id_col_name] = "series_0"
    else:
        id_col_name = id_col

    # Auto-detect frequency from the median timestamp gap. Thresholds are
    # deliberately loose (e.g. <= 35 days -> monthly) to tolerate irregular
    # spacing; anything coarser falls back to daily.
    if freq is None:
        time_diffs = df[time_col].diff().dropna()
        median_diff = time_diffs.median()
        if median_diff <= pd.Timedelta(hours=2):
            freq = "h"
        elif median_diff <= pd.Timedelta(days=1.5):
            freq = "D"
        elif median_diff <= pd.Timedelta(days=8):
            freq = "W"
        elif median_diff <= pd.Timedelta(days=35):
            freq = "MS"
        else:
            freq = "D"

    try:
        ts_df = TimeSeriesDataFrame.from_data_frame(
            df, id_column=id_col_name, timestamp_column=time_col
        )
    except Exception as e:
        return {"status": "error", "message": f"Failed to create time series: {str(e)}"}

    # Start from a clean model directory to avoid stale artifacts.
    if Path(output_dir).exists():
        shutil.rmtree(output_dir, ignore_errors=True)

    resource_config = _get_resource_config()

    try:
        predictor = TimeSeriesPredictor(
            target=target_col,
            prediction_length=forecast_horizon,
            path=output_dir,
            freq=freq
        )

        # num_val_windows > 1 is what makes this a backtest: each window is a
        # separate rolling-origin validation split.
        predictor.fit(
            train_data=ts_df,
            time_limit=min(time_limit, resource_config["time_limit"]),
            presets=presets,
            num_val_windows=num_val_windows
        )
    except Exception as e:
        return {"status": "error", "message": f"Backtest training failed: {str(e)}"}

    elapsed = time.time() - start_time

    # Best-effort: backtest_predictions() is not available in every AutoGluon
    # version, so any failure here (including AttributeError) is swallowed and
    # the run continues without the saved per-window predictions CSV.
    try:
        bt_preds = predictor.backtest_predictions()
        Path(output_path).parent.mkdir(parents=True, exist_ok=True)
        bt_df = bt_preds.reset_index()
        bt_df.to_csv(output_path, index=False)
    except Exception:
        bt_preds = None

    # Summarize the top 10 models as JSON-friendly rows.
    leaderboard = predictor.leaderboard(silent=True)
    leaderboard_data = []
    for _, row in leaderboard.head(10).iterrows():
        leaderboard_data.append({
            "model": str(row.get("model", "")),
            "score_val": round(float(row.get("score_val", 0)), 4),
            "fit_time": round(float(row.get("fit_time", 0)), 1),
        })

    best_model = predictor.model_best if hasattr(predictor, 'model_best') else "unknown"
    best_score = leaderboard_data[0]["score_val"] if leaderboard_data else None

    print(f"\n{'='*60}")
    print(f"✅ BACKTESTING COMPLETE ({num_val_windows} windows)")
    print(f"{'='*60}")
    print(f"🏆 Best: {best_model} (score: {best_score})")
    print(f"⏱️ Time: {elapsed:.1f}s")
    print(f"{'='*60}\n")

    # NOTE(review): output_path is reported even when saving the backtest
    # predictions failed above — callers should not assume the file exists.
    return {
        "status": "success",
        "task_type": "backtesting",
        "num_val_windows": num_val_windows,
        "forecast_horizon": forecast_horizon,
        "best_model": best_model,
        "best_score": best_score,
        "n_models_trained": len(leaderboard),
        "training_time_seconds": round(elapsed, 1),
        "leaderboard": leaderboard_data,
        "output_path": output_path,
        "model_path": output_dir
    }
1329
+
1330
+
1331
+ # ============================================================
1332
+ # TIME SERIES ANALYSIS (#34, #35, #37)
1333
+ # ============================================================
1334
+
1335
+ def analyze_timeseries_model(
1336
+ model_path: str,
1337
+ data_path: str,
1338
+ time_col: str,
1339
+ id_col: Optional[str] = None,
1340
+ operation: str = "feature_importance",
1341
+ output_path: Optional[str] = None
1342
+ ) -> Dict[str, Any]:
1343
+ """
1344
+ Analyze a trained AutoGluon time series model.
1345
+
1346
+ Operations:
1347
+ - feature_importance: Permutation importance of covariates
1348
+ - plot: Generate forecast vs actuals visualization
1349
+ - make_future_dataframe: Generate future timestamp skeleton for prediction
1350
+
1351
+ Args:
1352
+ model_path: Path to saved AutoGluon TimeSeriesPredictor
1353
+ data_path: Path to time series data
1354
+ time_col: Column with timestamps/dates
1355
+ id_col: Column identifying different series
1356
+ operation: One of 'feature_importance', 'plot', 'make_future_dataframe'
1357
+ output_path: Path to save output
1358
+
1359
+ Returns:
1360
+ Dictionary with analysis results
1361
+ """
1362
+ TimeSeriesPredictor, TimeSeriesDataFrame = _ensure_autogluon_timeseries()
1363
+
1364
+ if not Path(model_path).exists():
1365
+ return {"status": "error", "message": f"Model not found: {model_path}"}
1366
+ if not Path(data_path).exists():
1367
+ return {"status": "error", "message": f"Data not found: {data_path}"}
1368
+
1369
+ try:
1370
+ predictor = TimeSeriesPredictor.load(model_path)
1371
+ except Exception as e:
1372
+ return {"status": "error", "message": f"Failed to load model: {str(e)}"}
1373
+
1374
+ # Reconstruct TimeSeriesDataFrame
1375
+ try:
1376
+ df = pd.read_csv(data_path)
1377
+ df[time_col] = pd.to_datetime(df[time_col])
1378
+ df = df.sort_values(time_col)
1379
+
1380
+ if id_col is None or id_col not in df.columns:
1381
+ id_col_name = "__series_id"
1382
+ df[id_col_name] = "series_0"
1383
+ else:
1384
+ id_col_name = id_col
1385
+
1386
+ ts_df = TimeSeriesDataFrame.from_data_frame(
1387
+ df, id_column=id_col_name, timestamp_column=time_col
1388
+ )
1389
+ except Exception as e:
1390
+ return {"status": "error", "message": f"Failed to create time series data: {str(e)}"}
1391
+
1392
+ try:
1393
+ if operation == "feature_importance":
1394
+ fi = predictor.feature_importance(ts_df)
1395
+
1396
+ fi_data = []
1397
+ if isinstance(fi, pd.DataFrame):
1398
+ for feat in fi.index:
1399
+ row_data = {"feature": str(feat)}
1400
+ for col in fi.columns:
1401
+ try:
1402
+ row_data[str(col)] = round(float(fi.loc[feat, col]), 4)
1403
+ except (TypeError, ValueError):
1404
+ row_data[str(col)] = str(fi.loc[feat, col])
1405
+ fi_data.append(row_data)
1406
+
1407
+ return {
1408
+ "status": "success",
1409
+ "operation": "feature_importance",
1410
+ "features": fi_data,
1411
+ "model_path": model_path,
1412
+ "message": f"Feature importance computed for {len(fi_data)} features"
1413
+ }
1414
+
1415
+ elif operation == "plot":
1416
+ output_path = output_path or "./outputs/plots/ts_forecast_plot.png"
1417
+ Path(output_path).parent.mkdir(parents=True, exist_ok=True)
1418
+
1419
+ import matplotlib
1420
+ matplotlib.use('Agg')
1421
+ import matplotlib.pyplot as plt
1422
+
1423
+ predictions = predictor.predict(ts_df)
1424
+
1425
+ try:
1426
+ predictor.plot(ts_df, predictions, quantile_levels=[0.1, 0.9])
1427
+ plt.savefig(output_path, dpi=150, bbox_inches='tight')
1428
+ plt.close()
1429
+ except Exception:
1430
+ # Fallback: manual plot
1431
+ fig, ax = plt.subplots(figsize=(12, 6))
1432
+ target = predictor.target
1433
+
1434
+ for item_id in list(ts_df.item_ids)[:3]:
1435
+ actual = ts_df.loc[item_id][target].tail(100)
1436
+ ax.plot(actual.index, actual.values, label=f'Actual ({item_id})', linewidth=1.5)
1437
+
1438
+ if item_id in predictions.item_ids:
1439
+ pred = predictions.loc[item_id]
1440
+ mean_col = "mean" if "mean" in pred.columns else pred.columns[0]
1441
+ ax.plot(pred.index, pred[mean_col].values, '--', label=f'Forecast ({item_id})', linewidth=1.5)
1442
+
1443
+ ax.set_title(f'Time Series Forecast - {predictor.model_best}')
1444
+ ax.legend()
1445
+ ax.grid(True, alpha=0.3)
1446
+ plt.tight_layout()
1447
+ plt.savefig(output_path, dpi=150, bbox_inches='tight')
1448
+ plt.close()
1449
+
1450
+ return {
1451
+ "status": "success",
1452
+ "operation": "plot",
1453
+ "output_path": output_path,
1454
+ "message": f"Forecast plot saved to {output_path}"
1455
+ }
1456
+
1457
+ elif operation == "make_future_dataframe":
1458
+ output_path = output_path or "./outputs/future_dataframe.csv"
1459
+ Path(output_path).parent.mkdir(parents=True, exist_ok=True)
1460
+
1461
+ future_df = predictor.make_future_data_frame(ts_df)
1462
+ future_df.reset_index().to_csv(output_path, index=False)
1463
+
1464
+ return {
1465
+ "status": "success",
1466
+ "operation": "make_future_dataframe",
1467
+ "shape": list(future_df.shape),
1468
+ "columns": list(future_df.columns) if hasattr(future_df, 'columns') else [],
1469
+ "output_path": output_path,
1470
+ "message": f"Future dataframe generated: {len(future_df)} rows"
1471
+ }
1472
+
1473
+ else:
1474
+ return {
1475
+ "status": "error",
1476
+ "message": f"Unknown operation '{operation}'. Choose: feature_importance, plot, make_future_dataframe"
1477
+ }
1478
+
1479
+ except Exception as e:
1480
+ return {"status": "error", "message": f"Analysis failed: {str(e)}"}
src/tools/business_intelligence.py CHANGED
@@ -649,8 +649,69 @@ def detect_causal_relationships(
649
  result["statistical_significance"] = float(p_value)
650
  result["causal_effect"] = float(uplift)
651
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
652
  else:
653
- raise ValueError(f"Unknown method '{method}'. Use 'granger', 'propensity', or 'uplift'")
654
 
655
  print(f"✅ Causal analysis complete!")
656
  if result.get("causal_effect") is not None:
 
649
  result["statistical_significance"] = float(p_value)
650
  result["causal_effect"] = float(uplift)
651
 
652
+ elif method == "dowhy":
653
+ # DoWhy causal inference - formal causal graph approach
654
+ try:
655
+ import dowhy
656
+ from dowhy import CausalModel
657
+ except ImportError:
658
+ raise ValueError("dowhy not installed. Install with: pip install dowhy>=0.11")
659
+
660
+ print(" Building DoWhy causal model...")
661
+
662
+ df = data.to_pandas()
663
+
664
+ # Build causal model
665
+ # Construct a simple causal graph: covariates -> treatment -> outcome
666
+ if covariates:
667
+ graph_dot = f'digraph {{ {treatment_column} -> {outcome_column};'
668
+ for cov in covariates:
669
+ graph_dot += f' {cov} -> {treatment_column}; {cov} -> {outcome_column};'
670
+ graph_dot += ' }'
671
+ else:
672
+ graph_dot = f'digraph {{ {treatment_column} -> {outcome_column}; }}'
673
+
674
+ model = CausalModel(
675
+ data=df,
676
+ treatment=treatment_column,
677
+ outcome=outcome_column,
678
+ common_causes=covariates,
679
+ graph=graph_dot
680
+ )
681
+
682
+ # Identify causal effect
683
+ identified_estimand = model.identify_effect(proceed_when_unidentifiable=True)
684
+
685
+ # Estimate using linear regression (lightweight)
686
+ estimate = model.estimate_effect(
687
+ identified_estimand,
688
+ method_name="backdoor.linear_regression"
689
+ )
690
+
691
+ # Refutation test (placebo treatment)
692
+ try:
693
+ refutation = model.refute_estimate(
694
+ identified_estimand,
695
+ estimate,
696
+ method_name="placebo_treatment_refuter",
697
+ placebo_type="permute",
698
+ num_simulations=20
699
+ )
700
+ refutation_result = {
701
+ "new_effect": float(refutation.new_effect) if hasattr(refutation, 'new_effect') else None,
702
+ "p_value": float(refutation.refutation_result.get('p_value', 1.0)) if hasattr(refutation, 'refutation_result') and isinstance(refutation.refutation_result, dict) else None
703
+ }
704
+ except Exception:
705
+ refutation_result = {"note": "Refutation test could not be completed"}
706
+
707
+ result["causal_effect"] = float(estimate.value)
708
+ result["estimand"] = str(identified_estimand)
709
+ result["estimation_method"] = "backdoor.linear_regression"
710
+ result["refutation"] = refutation_result
711
+ result["statistical_significance"] = None # DoWhy uses refutation instead
712
+
713
  else:
714
+ raise ValueError(f"Unknown method '{method}'. Use 'granger', 'propensity', 'uplift', or 'dowhy'")
715
 
716
  print(f"✅ Causal analysis complete!")
717
  if result.get("causal_effect") is not None:
src/tools/code_interpreter.py CHANGED
@@ -177,8 +177,10 @@ except Exception as e:
177
 
178
  # Track existing files BEFORE execution to detect new files
179
  existing_files = set()
 
 
180
  if allow_file_operations:
181
- for output_dir in ['./outputs/code', './outputs/data', './outputs/plots']:
182
  if os.path.exists(output_dir):
183
  for file_path in Path(output_dir).resolve().glob('**/*'):
184
  if file_path.is_file():
@@ -229,9 +231,11 @@ except Exception as e:
229
 
230
  # Success! Find NEWLY generated files (not existing before execution)
231
  generated_files = []
 
 
232
  if allow_file_operations:
233
  cwd = Path.cwd()
234
- for output_dir in ['./outputs/code', './outputs/data', './outputs/plots']:
235
  if os.path.exists(output_dir):
236
  abs_output_dir = Path(output_dir).resolve()
237
  for file_path in abs_output_dir.glob('**/*'):
 
177
 
178
  # Track existing files BEFORE execution to detect new files
179
  existing_files = set()
180
+ # 🔥 FIX: Also scan /tmp/data_science_agent/ since LLM often saves files there
181
+ scan_dirs = ['./outputs/code', './outputs/data', './outputs/plots', '/tmp/data_science_agent']
182
  if allow_file_operations:
183
+ for output_dir in scan_dirs:
184
  if os.path.exists(output_dir):
185
  for file_path in Path(output_dir).resolve().glob('**/*'):
186
  if file_path.is_file():
 
231
 
232
  # Success! Find NEWLY generated files (not existing before execution)
233
  generated_files = []
234
+ # 🔥 FIX: Also scan /tmp/data_science_agent/ for files created by LLM code
235
+ scan_dirs = ['./outputs/code', './outputs/data', './outputs/plots', '/tmp/data_science_agent']
236
  if allow_file_operations:
237
  cwd = Path.cwd()
238
+ for output_dir in scan_dirs:
239
  if os.path.exists(output_dir):
240
  abs_output_dir = Path(output_dir).resolve()
241
  for file_path in abs_output_dir.glob('**/*'):
src/tools/data_cleaning.py CHANGED
@@ -124,10 +124,81 @@ def clean_missing_values(file_path: str, strategy,
124
  strategy = strategy_dict
125
  print(f"🔧 Applying '{list(strategy_dict.values())[0] if strategy_dict else strategy}' strategy to {len(strategy_dict)} columns with missing values")
126
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
127
  else:
128
  return {
129
  "success": False,
130
- "error": f"Invalid strategy '{strategy}'. Use 'auto', 'median', 'mean', 'mode', 'forward_fill', 'drop', or provide a dictionary.",
131
  "error_type": "ValueError"
132
  }
133
 
 
124
  strategy = strategy_dict
125
  print(f"🔧 Applying '{list(strategy_dict.values())[0] if strategy_dict else strategy}' strategy to {len(strategy_dict)} columns with missing values")
126
 
127
+ elif strategy in ["iterative", "mice"]:
128
+ # MICE / Iterative Imputation using sklearn IterativeImputer
129
+ # This handles ALL numeric columns at once (multivariate imputation)
130
+ print(f"🔧 Applying Iterative (MICE) imputation to numeric columns...")
131
+ try:
132
+ from sklearn.experimental import enable_iterative_imputer # noqa: F401
133
+ from sklearn.impute import IterativeImputer
134
+ from sklearn.linear_model import BayesianRidge
135
+ import pandas as pd
136
+
137
+ # Identify numeric columns with missing values
138
+ numeric_cols_with_nulls = [
139
+ col for col in numeric_cols if df[col].null_count() > 0
140
+ ]
141
+
142
+ if not numeric_cols_with_nulls:
143
+ print(" ℹ️ No numeric columns with missing values for MICE imputation")
144
+ else:
145
+ # Convert numeric columns to pandas for IterativeImputer
146
+ df_pd = df.select(numeric_cols).to_pandas()
147
+
148
+ # Fit and transform
149
+ imputer = IterativeImputer(
150
+ estimator=BayesianRidge(),
151
+ max_iter=10,
152
+ random_state=42,
153
+ missing_values=float('nan')
154
+ )
155
+ imputed_data = imputer.fit_transform(df_pd)
156
+
157
+ # Replace columns back in Polars DataFrame
158
+ for i, col_name in enumerate(numeric_cols):
159
+ df = df.with_columns(
160
+ pl.Series(col_name, imputed_data[:, i])
161
+ )
162
+
163
+ for col_name in numeric_cols_with_nulls:
164
+ report["columns_processed"][col_name] = {
165
+ "status": "success",
166
+ "strategy": "iterative_mice",
167
+ "nulls_before": int(df[col_name].null_count()), # Should be 0 now
168
+ "nulls_after": 0
169
+ }
170
+
171
+ print(f" ✅ MICE imputed {len(numeric_cols_with_nulls)} numeric columns using {len(numeric_cols)} features")
172
+
173
+ # Handle remaining non-numeric columns with mode
174
+ for col in df.columns:
175
+ if df[col].null_count() > 0 and col not in numeric_cols:
176
+ mode_val = df[col].drop_nulls().mode().first()
177
+ if mode_val is not None:
178
+ df = df.with_columns(
179
+ pl.col(col).fill_null(mode_val).alias(col)
180
+ )
181
+ report["columns_processed"][col] = {
182
+ "status": "success",
183
+ "strategy": "mode (non-numeric fallback)",
184
+ "nulls_before": int(df[col].null_count()),
185
+ "nulls_after": 0
186
+ }
187
+
188
+ except ImportError:
189
+ return {
190
+ "success": False,
191
+ "error": "IterativeImputer requires scikit-learn >= 1.4. Install with: pip install scikit-learn>=1.4",
192
+ "error_type": "MissingDependency"
193
+ }
194
+
195
+ # Skip per-column processing for MICE (already handled above)
196
+ strategy = {}
197
+
198
  else:
199
  return {
200
  "success": False,
201
+ "error": f"Invalid strategy '{strategy}'. Use 'auto', 'median', 'mean', 'mode', 'forward_fill', 'drop', 'iterative', 'mice', or provide a dictionary.",
202
  "error_type": "ValueError"
203
  }
204
 
src/tools/data_profiling.py CHANGED
@@ -486,3 +486,108 @@ def analyze_correlations(file_path: str, target: Optional[str] = None) -> Dict[s
486
  }
487
 
488
  return result
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
486
  }
487
 
488
  return result
489
+
490
+
491
+ def detect_label_errors(
492
+ file_path: str,
493
+ target_col: str,
494
+ features: Optional[List[str]] = None,
495
+ n_folds: int = 5,
496
+ output_path: Optional[str] = None
497
+ ) -> Dict[str, Any]:
498
+ """
499
+ Detect potential label errors in a classification dataset using cleanlab.
500
+
501
+ Uses confident learning to find mislabeled examples by:
502
+ 1. Training cross-validated classifiers
503
+ 2. Computing out-of-sample predicted probabilities
504
+ 3. Identifying labels that disagree with model predictions
505
+
506
+ Args:
507
+ file_path: Path to dataset
508
+ target_col: Target/label column name
509
+ features: Feature columns to use (None = all numeric)
510
+ n_folds: Number of cross-validation folds
511
+ output_path: Optional path to save flagged rows
512
+
513
+ Returns:
514
+ Dictionary with label error analysis results
515
+ """
516
+ try:
517
+ from cleanlab.classification import CleanLearning
518
+ except ImportError:
519
+ return {
520
+ 'status': 'error',
521
+ 'message': 'cleanlab not installed. Install with: pip install cleanlab>=2.6'
522
+ }
523
+
524
+ from sklearn.linear_model import LogisticRegression
525
+ from sklearn.preprocessing import LabelEncoder
526
+
527
+ validate_file_exists(file_path)
528
+ validate_file_format(file_path)
529
+
530
+ df = load_dataframe(file_path)
531
+ validate_dataframe(df)
532
+ validate_column_exists(df, target_col)
533
+
534
+ print(f"🔍 Detecting label errors in '{target_col}' using cleanlab...")
535
+
536
+ # Get features
537
+ if features is None:
538
+ features = get_numeric_columns(df)
539
+ features = [f for f in features if f != target_col]
540
+
541
+ if not features:
542
+ return {'status': 'error', 'message': 'No numeric features found for label error detection'}
543
+
544
+ # Convert to pandas/numpy
545
+ df_pd = df.to_pandas()
546
+ X = df_pd[features].fillna(0).values
547
+ y_raw = df_pd[target_col].values
548
+
549
+ # Encode labels
550
+ le = LabelEncoder()
551
+ y = le.fit_transform(y_raw)
552
+
553
+ # Use CleanLearning to find label issues
554
+ cl = CleanLearning(
555
+ clf=LogisticRegression(max_iter=500, solver='lbfgs', multi_class='auto'),
556
+ cv_n_folds=n_folds
557
+ )
558
+
559
+ label_issues = cl.find_label_issues(X, y)
560
+
561
+ # Extract results
562
+ n_issues = label_issues['is_label_issue'].sum()
563
+ issue_indices = label_issues[label_issues['is_label_issue']].index.tolist()
564
+
565
+ # Get details for flagged rows
566
+ flagged_rows = []
567
+ for idx in issue_indices[:50]: # Limit to top 50
568
+ flagged_rows.append({
569
+ 'row_index': int(idx),
570
+ 'current_label': str(y_raw[idx]),
571
+ 'suggested_label': str(le.inverse_transform([label_issues.loc[idx, 'predicted_label']])[0]) if 'predicted_label' in label_issues.columns else 'unknown',
572
+ 'confidence': float(1 - label_issues.loc[idx, 'label_quality']) if 'label_quality' in label_issues.columns else None
573
+ })
574
+
575
+ print(f" 🚨 Found {n_issues} potential label errors ({n_issues/len(y)*100:.1f}%)")
576
+
577
+ # Save flagged rows
578
+ if output_path and issue_indices:
579
+ flagged_df = df_pd.iloc[issue_indices]
580
+ flagged_df.to_csv(output_path, index=False)
581
+ print(f" 💾 Flagged rows saved to: {output_path}")
582
+
583
+ return {
584
+ 'status': 'success',
585
+ 'total_samples': len(y),
586
+ 'label_errors_found': int(n_issues),
587
+ 'error_percentage': round(n_issues / len(y) * 100, 2),
588
+ 'flagged_rows': flagged_rows,
589
+ 'n_classes': len(le.classes_),
590
+ 'classes': le.classes_.tolist(),
591
+ 'output_path': output_path,
592
+ 'recommendation': f'Review {n_issues} flagged samples for potential mislabeling' if n_issues > 0 else 'No label errors detected'
593
+ }
src/tools/eda_reports.py CHANGED
@@ -161,3 +161,100 @@ def generate_ydata_profiling_report(
161
  "error": f"Failed to generate ydata-profiling report: {str(e)}",
162
  "error_type": type(e).__name__
163
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
161
  "error": f"Failed to generate ydata-profiling report: {str(e)}",
162
  "error_type": type(e).__name__
163
  }
164
+
165
+
166
+ def generate_sweetviz_report(
167
+ file_path: str,
168
+ target_col: Optional[str] = None,
169
+ compare_file_path: Optional[str] = None,
170
+ output_path: str = "./outputs/reports/sweetviz_report.html",
171
+ title: str = "Sweetviz EDA Report"
172
+ ) -> Dict[str, Any]:
173
+ """
174
+ Generate an interactive EDA report using Sweetviz.
175
+
176
+ Sweetviz provides:
177
+ - Feature-by-feature analysis with distributions
178
+ - Target analysis (associations with target variable)
179
+ - Dataset comparison (train vs test)
180
+ - Correlations/associations for numeric and categorical features
181
+
182
+ Args:
183
+ file_path: Path to the dataset CSV file
184
+ target_col: Optional target column for supervised analysis
185
+ compare_file_path: Optional second dataset for comparison (e.g., test set)
186
+ output_path: Where to save the HTML report
187
+ title: Title for the report
188
+
189
+ Returns:
190
+ Dict with success status and report path
191
+ """
192
+ try:
193
+ import sweetviz as sv
194
+ import pandas as pd
195
+ except ImportError:
196
+ return {
197
+ "success": False,
198
+ "error": "sweetviz not installed. Install with: pip install sweetviz>=2.3",
199
+ "error_type": "MissingDependency"
200
+ }
201
+
202
+ try:
203
+ # Read dataset
204
+ if file_path.endswith('.csv'):
205
+ df = pd.read_csv(file_path)
206
+ elif file_path.endswith('.parquet'):
207
+ df = pd.read_parquet(file_path)
208
+ else:
209
+ raise ValueError(f"Unsupported file format: {file_path}")
210
+
211
+ # Create output directory
212
+ os.makedirs(os.path.dirname(output_path) or "./outputs/reports", exist_ok=True)
213
+
214
+ # Generate report
215
+ if compare_file_path:
216
+ # Comparison report (train vs test)
217
+ if compare_file_path.endswith('.csv'):
218
+ df_compare = pd.read_csv(compare_file_path)
219
+ else:
220
+ df_compare = pd.read_parquet(compare_file_path)
221
+
222
+ print(f"📊 Generating Sweetviz comparison report...")
223
+ if target_col and target_col in df.columns:
224
+ report = sv.compare([df, "Dataset 1"], [df_compare, "Dataset 2"], target_feat=target_col)
225
+ else:
226
+ report = sv.compare([df, "Dataset 1"], [df_compare, "Dataset 2"])
227
+ else:
228
+ # Single dataset analysis
229
+ print(f"📊 Generating Sweetviz EDA report...")
230
+ if target_col and target_col in df.columns:
231
+ report = sv.analyze(df, target_feat=target_col)
232
+ else:
233
+ report = sv.analyze(df)
234
+
235
+ # Save report (show_html=False prevents auto-opening browser)
236
+ report.show_html(output_path, open_browser=False)
237
+
238
+ num_features = len(df.columns)
239
+ num_rows = len(df)
240
+
241
+ print(f"✅ Sweetviz report saved to: {output_path}")
242
+
243
+ return {
244
+ "success": True,
245
+ "report_path": output_path,
246
+ "message": f"✅ Sweetviz report generated at: {output_path}",
247
+ "statistics": {
248
+ "rows": num_rows,
249
+ "columns": num_features,
250
+ "target_column": target_col,
251
+ "comparison_mode": compare_file_path is not None
252
+ }
253
+ }
254
+
255
+ except Exception as e:
256
+ return {
257
+ "success": False,
258
+ "error": f"Failed to generate Sweetviz report: {str(e)}",
259
+ "error_type": type(e).__name__
260
+ }
src/tools/feature_engineering.py CHANGED
@@ -242,7 +242,7 @@ def encode_categorical(file_path: str, method: str = "auto", columns: Optional[L
242
  # Create new column with frequencies
243
  new_col_name = f"{col}_freq"
244
  df = df.with_columns(
245
- pl.col(col).map_dict(freq_map, default=0.0).alias(new_col_name)
246
  )
247
 
248
  # Drop original column
@@ -274,7 +274,7 @@ def encode_categorical(file_path: str, method: str = "auto", columns: Optional[L
274
  # Create new column with target encoding
275
  new_col_name = f"{col}_target_enc"
276
  df = df.with_columns(
277
- pl.col(col).map_dict(target_map, default=global_mean).alias(new_col_name)
278
  )
279
 
280
  # Drop original column
 
242
  # Create new column with frequencies
243
  new_col_name = f"{col}_freq"
244
  df = df.with_columns(
245
+ pl.col(col).replace_strict(freq_map, default=0.0).alias(new_col_name)
246
  )
247
 
248
  # Drop original column
 
274
  # Create new column with target encoding
275
  new_col_name = f"{col}_target_enc"
276
  df = df.with_columns(
277
+ pl.col(col).replace_strict(target_map, default=global_mean).alias(new_col_name)
278
  )
279
 
280
  # Drop original column
src/tools/nlp_text_analytics.py CHANGED
@@ -483,20 +483,48 @@ def analyze_sentiment_advanced(
483
  result["emotions"] = None
484
 
485
  else:
486
- # Fallback to TextBlob
487
- print(" Using TextBlob for sentiment analysis...")
488
-
489
- sentiments = []
490
- for text in texts_clean:
491
- blob = TextBlob(text)
492
- sentiments.append({
493
- "polarity": blob.sentiment.polarity,
494
- "subjectivity": blob.sentiment.subjectivity,
495
- "label": "POSITIVE" if blob.sentiment.polarity > 0 else "NEGATIVE" if blob.sentiment.polarity < 0 else "NEUTRAL",
496
- "text": text[:100]
497
- })
498
-
499
- result["sentiments"] = sentiments
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
500
 
501
  # Aspect-based sentiment
502
  if aspects:
 
483
  result["emotions"] = None
484
 
485
  else:
486
+ # Check if method is 'vader' - use vaderSentiment
487
+ if method == "vader":
488
+ try:
489
+ from vaderSentiment.vaderSentiment import SentimentIntensityAnalyzer
490
+ print(" Using VADER for sentiment analysis...")
491
+
492
+ analyzer = SentimentIntensityAnalyzer()
493
+ sentiments = []
494
+ for text in texts_clean:
495
+ scores = analyzer.polarity_scores(text)
496
+ label = "POSITIVE" if scores['compound'] > 0.05 else "NEGATIVE" if scores['compound'] < -0.05 else "NEUTRAL"
497
+ sentiments.append({
498
+ "compound": scores['compound'],
499
+ "positive": scores['pos'],
500
+ "negative": scores['neg'],
501
+ "neutral": scores['neu'],
502
+ "label": label,
503
+ "text": text[:100]
504
+ })
505
+
506
+ result["sentiments"] = sentiments
507
+
508
+ except ImportError:
509
+ print("⚠️ vaderSentiment not installed. Falling back to TextBlob.")
510
+ print(" Install with: pip install vaderSentiment>=3.3")
511
+ method = "textblob"
512
+
513
+ if method in ["textblob", "transformer"]:
514
+ # Fallback to TextBlob
515
+ print(" Using TextBlob for sentiment analysis...")
516
+
517
+ sentiments = []
518
+ for text in texts_clean:
519
+ blob = TextBlob(text)
520
+ sentiments.append({
521
+ "polarity": blob.sentiment.polarity,
522
+ "subjectivity": blob.sentiment.subjectivity,
523
+ "label": "POSITIVE" if blob.sentiment.polarity > 0 else "NEGATIVE" if blob.sentiment.polarity < 0 else "NEUTRAL",
524
+ "text": text[:100]
525
+ })
526
+
527
+ result["sentiments"] = sentiments
528
 
529
  # Aspect-based sentiment
530
  if aspects:
src/tools/production_mlops.py CHANGED
@@ -659,3 +659,194 @@ def detect_feature_leakage(
659
  'total_issues': total_issues,
660
  'recommendation': 'Review and remove suspicious features before training' if total_issues > 0 else 'No obvious leakage detected'
661
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
659
  'total_issues': total_issues,
660
  'recommendation': 'Review and remove suspicious features before training' if total_issues > 0 else 'No obvious leakage detected'
661
  }
662
+
663
+
664
+ def monitor_drift_evidently(
665
+ reference_data_path: str,
666
+ current_data_path: str,
667
+ output_path: Optional[str] = None
668
+ ) -> Dict[str, Any]:
669
+ """
670
+ Generate a comprehensive data drift report using Evidently AI.
671
+
672
+ Evidently provides production-grade drift detection with:
673
+ - Statistical tests per feature (KS, Chi-squared, Jensen-Shannon)
674
+ - Data quality metrics
675
+ - Interactive HTML dashboard
676
+
677
+ Args:
678
+ reference_data_path: Path to training/reference dataset
679
+ current_data_path: Path to production/current dataset
680
+ output_path: Path to save HTML drift report
681
+
682
+ Returns:
683
+ Dictionary with drift metrics and report path
684
+ """
685
+ try:
686
+ from evidently.report import Report
687
+ from evidently.metric_preset import DataDriftPreset, DataQualityPreset
688
+ except ImportError:
689
+ return {
690
+ 'status': 'error',
691
+ 'message': 'evidently not installed. Install with: pip install evidently>=0.4'
692
+ }
693
+
694
+ import pandas as pd_ev
695
+
696
+ validate_file_exists(reference_data_path)
697
+ validate_file_exists(current_data_path)
698
+
699
+ # Load data as pandas (evidently requires pandas)
700
+ ref_df = load_dataframe(reference_data_path).to_pandas()
701
+ curr_df = load_dataframe(current_data_path).to_pandas()
702
+
703
+ print("🔍 Generating Evidently drift report...")
704
+
705
+ # Create drift report
706
+ report = Report(metrics=[
707
+ DataDriftPreset(),
708
+ DataQualityPreset()
709
+ ])
710
+
711
+ report.run(reference_data=ref_df, current_data=curr_df)
712
+
713
+ # Save HTML report
714
+ if output_path is None:
715
+ output_path = "./outputs/reports/evidently_drift_report.html"
716
+
717
+ os.makedirs(os.path.dirname(output_path), exist_ok=True)
718
+ report.save_html(output_path)
719
+
720
+ # Extract results as dict
721
+ report_dict = report.as_dict()
722
+
723
+ # Parse drift results
724
+ drift_metrics = report_dict.get('metrics', [])
725
+
726
+ drifted_features = []
727
+ total_features = 0
728
+ for metric in drift_metrics:
729
+ result_data = metric.get('result', {})
730
+ if 'drift_by_columns' in result_data:
731
+ for col_name, col_data in result_data['drift_by_columns'].items():
732
+ total_features += 1
733
+ if col_data.get('drift_detected', False):
734
+ drifted_features.append(col_name)
735
+
736
+ print(f"✅ Evidently report saved to: {output_path}")
737
+ print(f" 📊 {len(drifted_features)}/{total_features} features with drift detected")
738
+
739
+ return {
740
+ 'status': 'success',
741
+ 'report_path': output_path,
742
+ 'total_features_analyzed': total_features,
743
+ 'drifted_features': drifted_features,
744
+ 'n_drifted': len(drifted_features),
745
+ 'recommendation': 'Retrain model' if drifted_features else 'No significant drift detected'
746
+ }
747
+
748
+
749
+ def explain_with_dtreeviz(
750
+ model_path: str,
751
+ data_path: str,
752
+ target_col: str,
753
+ feature_names: Optional[List[str]] = None,
754
+ instance_index: int = 0,
755
+ output_path: Optional[str] = None
756
+ ) -> Dict[str, Any]:
757
+ """
758
+ Generate tree visualization using dtreeviz for tree-based models.
759
+
760
+ Creates publication-quality decision tree visualizations showing:
761
+ - Decision path for individual predictions
762
+ - Feature distributions at each node
763
+ - Split thresholds with data histograms
764
+
765
+ Args:
766
+ model_path: Path to trained tree-based model (.pkl)
767
+ data_path: Path to dataset
768
+ target_col: Target column name
769
+ feature_names: List of feature names (auto-detected if None)
770
+ instance_index: Index of instance to trace through tree
771
+ output_path: Path to save SVG visualization
772
+
773
+ Returns:
774
+ Dictionary with visualization path and tree info
775
+ """
776
+ try:
777
+ import dtreeviz
778
+ except ImportError:
779
+ return {
780
+ 'status': 'error',
781
+ 'message': 'dtreeviz not installed. Install with: pip install dtreeviz>=2.2'
782
+ }
783
+
784
+ validate_file_exists(model_path)
785
+ validate_file_exists(data_path)
786
+
787
+ model = joblib.load(model_path)
788
+ df = load_dataframe(data_path)
789
+ validate_dataframe(df)
790
+
791
+ # Prepare data
792
+ if target_col in df.columns:
793
+ X = df.drop(target_col).to_pandas()
794
+ y = df[target_col].to_pandas()
795
+ else:
796
+ X = df.to_pandas()
797
+ y = None
798
+
799
+ if feature_names is None:
800
+ feature_names = X.columns.tolist()
801
+
802
+ print(f"🌳 Generating dtreeviz visualization...")
803
+
804
+ if output_path is None:
805
+ output_path = "./outputs/reports/dtreeviz_tree.svg"
806
+
807
+ os.makedirs(os.path.dirname(output_path), exist_ok=True)
808
+
809
+ try:
810
+ # Check if model is a tree-based model
811
+ from sklearn.tree import DecisionTreeClassifier, DecisionTreeRegressor
812
+ from sklearn.ensemble import RandomForestClassifier, RandomForestRegressor
813
+
814
+ # For ensemble models, use the first estimator
815
+ tree_model = model
816
+ if hasattr(model, 'estimators_'):
817
+ tree_model = model.estimators_[0]
818
+ print(" 📌 Using first estimator from ensemble for visualization")
819
+
820
+ # Determine task type
821
+ is_classifier = hasattr(model, 'predict_proba')
822
+
823
+ # Create visualization
824
+ viz_model = dtreeviz.model(
825
+ tree_model,
826
+ X_train=X,
827
+ y_train=y,
828
+ feature_names=feature_names,
829
+ target_name=target_col,
830
+ class_names=list(map(str, sorted(y.unique()))) if is_classifier and y is not None else None
831
+ )
832
+
833
+ # Generate tree visualization
834
+ v = viz_model.view(x=X.iloc[instance_index])
835
+ v.save(output_path)
836
+
837
+ print(f"✅ Tree visualization saved to: {output_path}")
838
+
839
+ return {
840
+ 'status': 'success',
841
+ 'visualization_path': output_path,
842
+ 'model_type': type(model).__name__,
843
+ 'n_features': len(feature_names),
844
+ 'instance_explained': instance_index,
845
+ 'tree_depth': tree_model.get_depth() if hasattr(tree_model, 'get_depth') else 'unknown'
846
+ }
847
+
848
+ except Exception as e:
849
+ return {
850
+ 'status': 'error',
851
+ 'message': f'dtreeviz visualization failed: {str(e)}. Ensure model is tree-based (DecisionTree, RandomForest, XGBoost).'
852
+ }
src/tools/time_series.py CHANGED
@@ -46,7 +46,7 @@ def forecast_time_series(
46
  time_col: Time/date column name
47
  target_col: Target variable to forecast
48
  forecast_horizon: Number of periods to forecast ahead
49
- method: Forecasting method ('arima', 'sarima', 'prophet', 'exponential_smoothing')
50
  seasonal_period: Seasonal period (e.g., 7 for weekly, 12 for monthly)
51
  output_path: Path to save forecast results
52
 
@@ -108,6 +108,57 @@ def forecast_time_series(
108
  }
109
  }
110
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
111
  elif method == "arima":
112
  # ARIMA model
113
  ts_data = df_pd.set_index(time_col)[target_col]
 
46
  time_col: Time/date column name
47
  target_col: Target variable to forecast
48
  forecast_horizon: Number of periods to forecast ahead
49
+ method: Forecasting method ('arima', 'auto_arima', 'sarima', 'prophet', 'exponential_smoothing')
50
  seasonal_period: Seasonal period (e.g., 7 for weekly, 12 for monthly)
51
  output_path: Path to save forecast results
52
 
 
108
  }
109
  }
110
 
111
+ elif method == "auto_arima":
112
+ # Auto ARIMA using pmdarima - automatically finds best (p,d,q) order
113
+ try:
114
+ import pmdarima as pm
115
+ except ImportError:
116
+ return {
117
+ 'status': 'error',
118
+ 'message': 'pmdarima not installed. Install with: pip install pmdarima>=2.0'
119
+ }
120
+
121
+ ts_data = df_pd.set_index(time_col)[target_col]
122
+
123
+ print("🔧 Running auto_arima to find optimal ARIMA order...")
124
+ auto_model = pm.auto_arima(
125
+ ts_data,
126
+ seasonal=bool(seasonal_period),
127
+ m=seasonal_period or 1,
128
+ stepwise=True,
129
+ suppress_warnings=True,
130
+ error_action='ignore',
131
+ max_p=5, max_q=5, max_d=2,
132
+ max_P=2, max_Q=2, max_D=1,
133
+ trace=False
134
+ )
135
+
136
+ # Forecast
137
+ forecast_vals, conf_int = auto_model.predict(
138
+ n_periods=forecast_horizon,
139
+ return_conf_int=True
140
+ )
141
+ forecast_index = pd.date_range(start=ts_data.index[-1], periods=forecast_horizon+1, freq='D')[1:]
142
+
143
+ result = {
144
+ 'method': 'auto_arima',
145
+ 'order': str(auto_model.order),
146
+ 'seasonal_order': str(auto_model.seasonal_order) if seasonal_period else None,
147
+ 'forecast': [
148
+ {
149
+ 'date': str(date),
150
+ 'value': float(val),
151
+ 'lower_ci': float(ci[0]),
152
+ 'upper_ci': float(ci[1])
153
+ }
154
+ for date, val, ci in zip(forecast_index, forecast_vals, conf_int)
155
+ ],
156
+ 'aic': float(auto_model.aic()),
157
+ 'bic': float(auto_model.bic()),
158
+ 'model_summary': str(auto_model.summary())
159
+ }
160
+ print(f" ✅ Best order: {auto_model.order} | AIC: {auto_model.aic():.2f}")
161
+
162
  elif method == "arima":
163
  # ARIMA model
164
  ts_data = df_pd.set_index(time_col)[target_col]
src/tools/tools_registry.py CHANGED
@@ -1067,6 +1067,40 @@ TOOLS = [
1067
  }
1068
  }
1069
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1070
 
1071
  # ============================================
1072
  # TIME SERIES (3)
@@ -1449,6 +1483,55 @@ TOOLS = [
1449
  }
1450
  }
1451
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1452
  # ========================================
1453
  # CODE INTERPRETER - THE GAME CHANGER 🚀
1454
  # ========================================
@@ -1632,6 +1715,390 @@ TOOLS = [
1632
  "required": ["project_id", "query"]
1633
  }
1634
  }
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1635
  }
1636
  ]
1637
 
 
1067
  }
1068
  }
1069
  },
1070
+ {
1071
+ "type": "function",
1072
+ "function": {
1073
+ "name": "monitor_drift_evidently",
1074
+ "description": "Generate comprehensive data drift report using Evidently AI. Provides statistical tests per feature, data quality metrics, and interactive HTML dashboard.",
1075
+ "parameters": {
1076
+ "type": "object",
1077
+ "properties": {
1078
+ "reference_data_path": {"type": "string", "description": "Path to training/reference dataset"},
1079
+ "current_data_path": {"type": "string", "description": "Path to production/current dataset"},
1080
+ "output_path": {"type": "string", "description": "Path to save HTML drift report"}
1081
+ },
1082
+ "required": ["reference_data_path", "current_data_path"]
1083
+ }
1084
+ }
1085
+ },
1086
+ {
1087
+ "type": "function",
1088
+ "function": {
1089
+ "name": "explain_with_dtreeviz",
1090
+ "description": "Generate publication-quality decision tree visualizations using dtreeviz. Shows decision path, feature distributions at each node, and split thresholds.",
1091
+ "parameters": {
1092
+ "type": "object",
1093
+ "properties": {
1094
+ "model_path": {"type": "string", "description": "Path to trained tree-based model (.pkl)"},
1095
+ "data_path": {"type": "string", "description": "Path to dataset"},
1096
+ "target_col": {"type": "string", "description": "Target column name"},
1097
+ "instance_index": {"type": "integer", "description": "Index of instance to trace through tree (default: 0)"},
1098
+ "output_path": {"type": "string", "description": "Path to save SVG visualization"}
1099
+ },
1100
+ "required": ["model_path", "data_path", "target_col"]
1101
+ }
1102
+ }
1103
+ },
1104
 
1105
  # ============================================
1106
  # TIME SERIES (3)
 
1483
  }
1484
  }
1485
  },
1486
+ {
1487
+ "type": "function",
1488
+ "function": {
1489
+ "name": "generate_sweetviz_report",
1490
+ "description": "Generate interactive EDA report using Sweetviz. Provides feature-by-feature analysis, target associations, and dataset comparison. Great for train vs test comparison.",
1491
+ "parameters": {
1492
+ "type": "object",
1493
+ "properties": {
1494
+ "file_path": {"type": "string", "description": "Path to the dataset CSV/Parquet file"},
1495
+ "target_col": {"type": "string", "description": "Optional target column for supervised analysis"},
1496
+ "compare_file_path": {"type": "string", "description": "Optional second dataset for comparison (e.g., test set)"},
1497
+ "output_path": {"type": "string", "description": "Where to save HTML report (default: ./outputs/reports/sweetviz_report.html)"}
1498
+ },
1499
+ "required": ["file_path"]
1500
+ }
1501
+ }
1502
+ },
1503
+ {
1504
+ "type": "function",
1505
+ "function": {
1506
+ "name": "detect_label_errors",
1507
+ "description": "Detect potential label errors in classification datasets using cleanlab. Uses confident learning to find mislabeled examples by cross-validating classifiers and identifying disagreements.",
1508
+ "parameters": {
1509
+ "type": "object",
1510
+ "properties": {
1511
+ "file_path": {"type": "string", "description": "Path to classification dataset"},
1512
+ "target_col": {"type": "string", "description": "Target/label column name"},
1513
+ "features": {"type": "array", "items": {"type": "string"}, "description": "Feature columns (None = all numeric)"},
1514
+ "output_path": {"type": "string", "description": "Path to save flagged rows"}
1515
+ },
1516
+ "required": ["file_path", "target_col"]
1517
+ }
1518
+ }
1519
+ },
1520
+ {
1521
+ "type": "function",
1522
+ "function": {
1523
+ "name": "validate_schema_pandera",
1524
+ "description": "Validate a DataFrame against a pandera schema. Check column types, nullability, value ranges, and custom constraints.",
1525
+ "parameters": {
1526
+ "type": "object",
1527
+ "properties": {
1528
+ "file_path": {"type": "string", "description": "Path to dataset to validate"},
1529
+ "schema_config": {"type": "object", "description": "Schema configuration with column definitions"}
1530
+ },
1531
+ "required": ["file_path", "schema_config"]
1532
+ }
1533
+ }
1534
+ },
1535
  # ========================================
1536
  # CODE INTERPRETER - THE GAME CHANGER 🚀
1537
  # ========================================
 
1715
  "required": ["project_id", "query"]
1716
  }
1717
  }
1718
+ },
1719
+
1720
+ # ============================================
1721
+ # AUTOGLUON TRAINING (3) - AutoML at Scale
1722
+ # ============================================
1723
+ {
1724
+ "type": "function",
1725
+ "function": {
1726
+ "name": "train_with_autogluon",
1727
+ "description": "Train ML models using AutoGluon AutoML. Automatically trains and ensembles 10+ models (LightGBM, XGBoost, CatBoost, RandomForest, etc.) with stacking. Handles raw data directly - no need to manually encode categoricals or impute missing values. Supports classification (binary/multiclass) and regression. Use this instead of train_baseline_models for best performance.",
1728
+ "parameters": {
1729
+ "type": "object",
1730
+ "properties": {
1731
+ "file_path": {
1732
+ "type": "string",
1733
+ "description": "Path to CSV/Parquet dataset"
1734
+ },
1735
+ "target_col": {
1736
+ "type": "string",
1737
+ "description": "Column to predict"
1738
+ },
1739
+ "task_type": {
1740
+ "type": "string",
1741
+ "enum": ["classification", "regression", "auto"],
1742
+ "description": "Type of ML task. 'auto' to detect automatically."
1743
+ },
1744
+ "time_limit": {
1745
+ "type": "integer",
1746
+ "description": "Max training time in seconds (default: 120). Higher = better models."
1747
+ },
1748
+ "presets": {
1749
+ "type": "string",
1750
+ "enum": ["medium_quality", "good_quality", "best_quality"],
1751
+ "description": "Quality preset. medium_quality=fast, best_quality=slower but better."
1752
+ },
1753
+ "eval_metric": {
1754
+ "type": "string",
1755
+ "description": "Metric to optimize. Classification: 'accuracy','f1','roc_auc'. Regression: 'rmse','mae','r2'. Auto-selected if None."
1756
+ },
1757
+ "output_dir": {
1758
+ "type": "string",
1759
+ "description": "Directory to save trained model (default: ./outputs/autogluon_model)"
1760
+ },
1761
+ "infer_limit": {
1762
+ "type": "number",
1763
+ "description": "Max inference time per row in seconds. Only models meeting this speed constraint are kept. E.g. 0.01 = 10ms/row."
1764
+ }
1765
+ },
1766
+ "required": ["file_path", "target_col"]
1767
+ }
1768
+ }
1769
+ },
1770
+ {
1771
+ "type": "function",
1772
+ "function": {
1773
+ "name": "predict_with_autogluon",
1774
+ "description": "Make predictions on new data using a trained AutoGluon model. Returns predictions and probability scores for classification tasks.",
1775
+ "parameters": {
1776
+ "type": "object",
1777
+ "properties": {
1778
+ "model_path": {
1779
+ "type": "string",
1780
+ "description": "Path to saved AutoGluon model directory"
1781
+ },
1782
+ "data_path": {
1783
+ "type": "string",
1784
+ "description": "Path to new data CSV/Parquet for prediction"
1785
+ },
1786
+ "output_path": {
1787
+ "type": "string",
1788
+ "description": "Path to save predictions CSV"
1789
+ }
1790
+ },
1791
+ "required": ["model_path", "data_path"]
1792
+ }
1793
+ }
1794
+ },
1795
+ {
1796
+ "type": "function",
1797
+ "function": {
1798
+ "name": "forecast_with_autogluon",
1799
+ "description": "Forecast time series using AutoGluon TimeSeriesPredictor. Trains and ensembles multiple models including DeepAR, ETS, ARIMA, Theta, and Chronos. Supports covariates, holiday features, model selection, and probabilistic forecasts. Much more powerful than basic ARIMA/Prophet.",
1800
+ "parameters": {
1801
+ "type": "object",
1802
+ "properties": {
1803
+ "file_path": {
1804
+ "type": "string",
1805
+ "description": "Path to time series CSV/Parquet"
1806
+ },
1807
+ "target_col": {
1808
+ "type": "string",
1809
+ "description": "Column with values to forecast"
1810
+ },
1811
+ "time_col": {
1812
+ "type": "string",
1813
+ "description": "Column with timestamps/dates"
1814
+ },
1815
+ "forecast_horizon": {
1816
+ "type": "integer",
1817
+ "description": "Number of future periods to predict (default: 30)"
1818
+ },
1819
+ "id_col": {
1820
+ "type": "string",
1821
+ "description": "Column identifying different series (for multi-series forecasting)"
1822
+ },
1823
+ "freq": {
1824
+ "type": "string",
1825
+ "description": "Frequency: 'D'=daily, 'h'=hourly, 'W'=weekly, 'MS'=monthly. Auto-detected if omitted."
1826
+ },
1827
+ "time_limit": {
1828
+ "type": "integer",
1829
+ "description": "Max training time in seconds (default: 120)"
1830
+ },
1831
+ "presets": {
1832
+ "type": "string",
1833
+ "enum": ["fast_training", "medium_quality", "best_quality"],
1834
+ "description": "Quality preset for forecasting models"
1835
+ },
1836
+ "output_path": {
1837
+ "type": "string",
1838
+ "description": "Path to save forecast CSV"
1839
+ },
1840
+ "static_features_path": {
1841
+ "type": "string",
1842
+ "description": "CSV with per-series metadata (one row per series). Improves cross-series learning."
1843
+ },
1844
+ "known_covariates_cols": {
1845
+ "type": "array",
1846
+ "items": {"type": "string"},
1847
+ "description": "Columns with future-known values (holidays, promotions, day_of_week)"
1848
+ },
1849
+ "holiday_country": {
1850
+ "type": "string",
1851
+ "description": "Country code for auto holiday features: 'US', 'UK', 'IN', 'DE', etc."
1852
+ },
1853
+ "fill_missing": {
1854
+ "type": "boolean",
1855
+ "description": "Auto-fill missing values in time series (default: true)"
1856
+ },
1857
+ "models": {
1858
+ "type": "array",
1859
+ "items": {"type": "string"},
1860
+ "description": "Specific models to train: 'ETS', 'AutoARIMA', 'Theta', 'DeepAR', 'PatchTST', 'DLinear', 'TFT', 'SeasonalNaive'"
1861
+ },
1862
+ "quantile_levels": {
1863
+ "type": "array",
1864
+ "items": {"type": "number"},
1865
+ "description": "Quantile levels for probabilistic forecasts. E.g. [0.1, 0.5, 0.9] for 10th/50th/90th percentile."
1866
+ }
1867
+ },
1868
+ "required": ["file_path", "target_col", "time_col"]
1869
+ }
1870
+ }
1871
+ },
1872
+
1873
+ # ============================================
1874
+ # AUTOGLUON ADVANCED (6) - Post-Training, Analysis, Multi-Label, Backtesting
1875
+ # ============================================
1876
+ {
1877
+ "type": "function",
1878
+ "function": {
1879
+ "name": "optimize_autogluon_model",
1880
+ "description": "Post-training optimization on a trained AutoGluon model. Operations: refit_full (re-train on 100% data for deployment), distill (compress ensemble into single model), calibrate_threshold (optimize binary classification threshold), deploy_optimize (strip artifacts for minimal deployment), delete_models (remove specific models to free resources).",
1881
+ "parameters": {
1882
+ "type": "object",
1883
+ "properties": {
1884
+ "model_path": {
1885
+ "type": "string",
1886
+ "description": "Path to saved AutoGluon model directory"
1887
+ },
1888
+ "operation": {
1889
+ "type": "string",
1890
+ "enum": ["refit_full", "distill", "calibrate_threshold", "deploy_optimize", "delete_models"],
1891
+ "description": "Optimization operation to perform"
1892
+ },
1893
+ "data_path": {
1894
+ "type": "string",
1895
+ "description": "Path to dataset (required for distill, calibrate_threshold)"
1896
+ },
1897
+ "metric": {
1898
+ "type": "string",
1899
+ "enum": ["f1", "balanced_accuracy", "precision", "recall"],
1900
+ "description": "Metric for calibrate_threshold optimization"
1901
+ },
1902
+ "models_to_delete": {
1903
+ "type": "array",
1904
+ "items": {"type": "string"},
1905
+ "description": "Model names to delete (for delete_models operation)"
1906
+ },
1907
+ "output_dir": {
1908
+ "type": "string",
1909
+ "description": "Output directory for deploy_optimize"
1910
+ }
1911
+ },
1912
+ "required": ["model_path", "operation"]
1913
+ }
1914
+ }
1915
+ },
1916
+ {
1917
+ "type": "function",
1918
+ "function": {
1919
+ "name": "analyze_autogluon_model",
1920
+ "description": "Inspect and analyze a trained AutoGluon model. Operations: summary (extended leaderboard with stack levels, memory, inference speed), transform_features (get internally transformed feature matrix), info (comprehensive model metadata and training summary).",
1921
+ "parameters": {
1922
+ "type": "object",
1923
+ "properties": {
1924
+ "model_path": {
1925
+ "type": "string",
1926
+ "description": "Path to saved AutoGluon model directory"
1927
+ },
1928
+ "data_path": {
1929
+ "type": "string",
1930
+ "description": "Path to dataset (required for transform_features)"
1931
+ },
1932
+ "operation": {
1933
+ "type": "string",
1934
+ "enum": ["summary", "transform_features", "info"],
1935
+ "description": "Analysis operation to perform"
1936
+ }
1937
+ },
1938
+ "required": ["model_path"]
1939
+ }
1940
+ }
1941
+ },
1942
+ {
1943
+ "type": "function",
1944
+ "function": {
1945
+ "name": "extend_autogluon_training",
1946
+ "description": "Add models or re-fit ensemble on an existing AutoGluon predictor without retraining from scratch. Operations: fit_extra (train additional models/hyperparameters), fit_weighted_ensemble (re-fit ensemble weights on existing base models).",
1947
+ "parameters": {
1948
+ "type": "object",
1949
+ "properties": {
1950
+ "model_path": {
1951
+ "type": "string",
1952
+ "description": "Path to saved AutoGluon model directory"
1953
+ },
1954
+ "operation": {
1955
+ "type": "string",
1956
+ "enum": ["fit_extra", "fit_weighted_ensemble"],
1957
+ "description": "Extension operation to perform"
1958
+ },
1959
+ "data_path": {
1960
+ "type": "string",
1961
+ "description": "Path to training data (required for fit_extra)"
1962
+ },
1963
+ "time_limit": {
1964
+ "type": "integer",
1965
+ "description": "Additional training time in seconds (default: 60)"
1966
+ },
1967
+ "hyperparameters": {
1968
+ "type": "object",
1969
+ "description": "Model hyperparameters dict. E.g. {\"GBM\": {\"num_boost_round\": 500}, \"RF\": {}}"
1970
+ }
1971
+ },
1972
+ "required": ["model_path"]
1973
+ }
1974
+ }
1975
+ },
1976
+ {
1977
+ "type": "function",
1978
+ "function": {
1979
+ "name": "train_multilabel_autogluon",
1980
+ "description": "Train multi-label prediction model. Predicts multiple target columns simultaneously by training separate AutoGluon TabularPredictors per label with shared feature engineering. Use when dataset has multiple columns to predict.",
1981
+ "parameters": {
1982
+ "type": "object",
1983
+ "properties": {
1984
+ "file_path": {
1985
+ "type": "string",
1986
+ "description": "Path to CSV/Parquet dataset"
1987
+ },
1988
+ "target_cols": {
1989
+ "type": "array",
1990
+ "items": {"type": "string"},
1991
+ "description": "List of columns to predict (e.g. ['label1', 'label2'])"
1992
+ },
1993
+ "time_limit": {
1994
+ "type": "integer",
1995
+ "description": "Max training time per label in seconds (default: 120)"
1996
+ },
1997
+ "presets": {
1998
+ "type": "string",
1999
+ "enum": ["medium_quality", "good_quality", "best_quality"],
2000
+ "description": "Quality preset"
2001
+ },
2002
+ "output_dir": {
2003
+ "type": "string",
2004
+ "description": "Where to save trained model"
2005
+ }
2006
+ },
2007
+ "required": ["file_path", "target_cols"]
2008
+ }
2009
+ }
2010
+ },
2011
+ {
2012
+ "type": "function",
2013
+ "function": {
2014
+ "name": "backtest_timeseries",
2015
+ "description": "Backtest time series models using multiple validation windows. More robust performance estimation than single train/test split. Trains models with multi-window cross-validation and returns per-window evaluation.",
2016
+ "parameters": {
2017
+ "type": "object",
2018
+ "properties": {
2019
+ "file_path": {
2020
+ "type": "string",
2021
+ "description": "Path to time series CSV/Parquet"
2022
+ },
2023
+ "target_col": {
2024
+ "type": "string",
2025
+ "description": "Column with values to forecast"
2026
+ },
2027
+ "time_col": {
2028
+ "type": "string",
2029
+ "description": "Column with timestamps/dates"
2030
+ },
2031
+ "forecast_horizon": {
2032
+ "type": "integer",
2033
+ "description": "Periods to predict per window (default: 30)"
2034
+ },
2035
+ "id_col": {
2036
+ "type": "string",
2037
+ "description": "Column identifying different series"
2038
+ },
2039
+ "freq": {
2040
+ "type": "string",
2041
+ "description": "Frequency string"
2042
+ },
2043
+ "num_val_windows": {
2044
+ "type": "integer",
2045
+ "description": "Number of backtesting windows (default: 3)"
2046
+ },
2047
+ "time_limit": {
2048
+ "type": "integer",
2049
+ "description": "Max training time in seconds"
2050
+ },
2051
+ "presets": {
2052
+ "type": "string",
2053
+ "enum": ["fast_training", "medium_quality", "best_quality"],
2054
+ "description": "Quality preset"
2055
+ },
2056
+ "output_path": {
2057
+ "type": "string",
2058
+ "description": "Path to save backtest predictions CSV"
2059
+ }
2060
+ },
2061
+ "required": ["file_path", "target_col", "time_col"]
2062
+ }
2063
+ }
2064
+ },
2065
+ {
2066
+ "type": "function",
2067
+ "function": {
2068
+ "name": "analyze_timeseries_model",
2069
+ "description": "Analyze a trained AutoGluon time series model. Operations: feature_importance (permutation importance of covariates), plot (forecast vs actuals visualization), make_future_dataframe (generate future timestamp skeleton for prediction with covariates).",
2070
+ "parameters": {
2071
+ "type": "object",
2072
+ "properties": {
2073
+ "model_path": {
2074
+ "type": "string",
2075
+ "description": "Path to saved AutoGluon TimeSeriesPredictor"
2076
+ },
2077
+ "data_path": {
2078
+ "type": "string",
2079
+ "description": "Path to time series data"
2080
+ },
2081
+ "time_col": {
2082
+ "type": "string",
2083
+ "description": "Column with timestamps/dates"
2084
+ },
2085
+ "id_col": {
2086
+ "type": "string",
2087
+ "description": "Column identifying different series"
2088
+ },
2089
+ "operation": {
2090
+ "type": "string",
2091
+ "enum": ["feature_importance", "plot", "make_future_dataframe"],
2092
+ "description": "Analysis operation to perform"
2093
+ },
2094
+ "output_path": {
2095
+ "type": "string",
2096
+ "description": "Path to save output (plot image or CSV)"
2097
+ }
2098
+ },
2099
+ "required": ["model_path", "data_path", "time_col"]
2100
+ }
2101
+ }
2102
  }
2103
  ]
2104
 
src/tools/visualization_engine.py CHANGED
@@ -181,7 +181,7 @@ def generate_data_quality_plots(file_path: str, output_dir: str) -> Dict[str, An
181
  return {"plot_paths": plots, "figures": figures, "n_plots": len(plots)}
182
 
183
 
184
- def generate_eda_plots(file_path: str, target_col: Optional[str], output_dir: str) -> Dict[str, Any]:
185
  """Generate exploratory data analysis plots using Matplotlib."""
186
  df = load_dataframe(file_path).to_pandas()
187
  plots = []
 
181
  return {"plot_paths": plots, "figures": figures, "n_plots": len(plots)}
182
 
183
 
184
+ def generate_eda_plots(file_path: str, target_col: Optional[str] = None, output_dir: str = "./outputs/plots/eda") -> Dict[str, Any]:
185
  """Generate exploratory data analysis plots using Matplotlib."""
186
  df = load_dataframe(file_path).to_pandas()
187
  plots = []
src/utils/schema_extraction.py CHANGED
@@ -22,13 +22,27 @@ def extract_schema_local(file_path: str, sample_rows: int = 5) -> Dict[str, Any]
22
  try:
23
  # Read with Polars (faster than pandas)
24
  if file_path.endswith('.csv'):
25
- df = pl.read_csv(file_path)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  elif file_path.endswith('.parquet'):
27
  df = pl.read_parquet(file_path)
28
  else:
29
  # Fallback to pandas
30
  import pandas as pd
31
- pdf = pd.read_csv(file_path)
32
  df = pl.from_pandas(pdf)
33
 
34
  # Basic metadata
 
22
  try:
23
  # Read with Polars (faster than pandas)
24
  if file_path.endswith('.csv'):
25
+ # 🔥 FIX: Use infer_schema_length and ignore_errors to handle mixed-type columns
26
+ # This prevents failures like: could not parse `835.159865` as dtype `i64`
27
+ try:
28
+ df = pl.read_csv(file_path, infer_schema_length=10000, ignore_errors=True)
29
+ except Exception:
30
+ # Final fallback: read everything as strings, then let Polars infer
31
+ try:
32
+ import pandas as pd
33
+ pdf = pd.read_csv(file_path, low_memory=False)
34
+ df = pl.from_pandas(pdf)
35
+ except Exception as e2:
36
+ return {
37
+ 'error': f"Failed to read CSV: {str(e2)}",
38
+ 'file_path': file_path
39
+ }
40
  elif file_path.endswith('.parquet'):
41
  df = pl.read_parquet(file_path)
42
  else:
43
  # Fallback to pandas
44
  import pandas as pd
45
+ pdf = pd.read_csv(file_path, low_memory=False)
46
  df = pl.from_pandas(pdf)
47
 
48
  # Basic metadata
src/utils/validation.py CHANGED
@@ -268,3 +268,110 @@ def validate_strategy_config(strategy: Dict[str, Any],
268
  raise ValidationError(
269
  f"Missing required strategy keys: {', '.join(missing)}"
270
  )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
268
  raise ValidationError(
269
  f"Missing required strategy keys: {', '.join(missing)}"
270
  )
271
+
272
+
273
def validate_schema_pandera(
    df: pl.DataFrame,
    schema_config: Dict[str, Any]
) -> Dict[str, Any]:
    """
    Validate a DataFrame against a pandera schema built from a plain dict config.

    Schema config format:
        {
            "columns": {
                "age": {"dtype": "int", "nullable": False, "checks": {"ge": 0, "le": 150}},
                "name": {"dtype": "str", "nullable": False},
                "salary": {"dtype": "float", "nullable": True, "checks": {"ge": 0}}
            },
            "coerce": True
        }

    Args:
        df: Polars DataFrame to validate (converted to pandas internally,
            since pandera validates pandas frames).
        schema_config: Dictionary defining the expected schema. Unknown dtype
            strings fall back to ``None`` (pandera then skips dtype checking
            for that column); unknown check names are silently ignored.

    Returns:
        Dictionary with validation results:
        - on success: ``{'status': 'success', 'valid': True, ...}``
        - on failed checks: ``{'status': 'success', 'valid': False, 'errors': [...]}``
          (validation *ran*, the data just failed — hence status 'success')
        - on missing dependency: ``{'status': 'error', ...}``
    """
    try:
        import pandera as pa
        import pandas as pd  # used below to handle NaN indices in failure cases
    except ImportError:
        return {
            'status': 'error',
            'message': 'pandera not installed. Install with: pip install pandera>=0.18'
        }

    columns_config = schema_config.get("columns", {})
    coerce = schema_config.get("coerce", True)

    # Map config dtype strings to pandera dtypes.
    dtype_map = {
        "int": pa.Int,
        "float": pa.Float,
        "str": pa.String,
        "bool": pa.Bool,
        "datetime": pa.DateTime,
    }

    # Map config check names to pandera Check factories.
    # NOTE(review): "str_length" assumes the config value is a max length —
    # confirm against callers if min-length configs are expected.
    check_map = {
        "ge": lambda v: pa.Check.ge(v),
        "le": lambda v: pa.Check.le(v),
        "gt": lambda v: pa.Check.gt(v),
        "lt": lambda v: pa.Check.lt(v),
        "in_range": lambda v: pa.Check.in_range(v[0], v[1]),
        "isin": lambda v: pa.Check.isin(v),
        "str_matches": lambda v: pa.Check.str_matches(v),
        "str_length": lambda v: pa.Check.str_length(max_value=v),
    }

    # Build pandera Column objects from the plain-dict config.
    schema_columns = {}
    for col_name, col_config in columns_config.items():
        col_dtype = dtype_map.get(col_config.get("dtype", ""), None)
        nullable = col_config.get("nullable", True)
        checks_config = col_config.get("checks", {})

        checks = []
        for check_name, check_val in checks_config.items():
            if check_name in check_map:
                checks.append(check_map[check_name](check_val))

        schema_columns[col_name] = pa.Column(
            dtype=col_dtype,
            nullable=nullable,
            checks=checks if checks else None,
            coerce=coerce
        )

    schema = pa.DataFrameSchema(columns=schema_columns, coerce=coerce)

    # Convert Polars to Pandas for pandera validation
    df_pd = df.to_pandas()

    try:
        # lazy=True collects ALL failures instead of raising on the first one.
        schema.validate(df_pd, lazy=True)
        return {
            'status': 'success',
            'valid': True,
            'message': 'DataFrame passed all schema validations',
            'columns_validated': list(columns_config.keys())
        }
    except pa.errors.SchemaErrors as err:
        errors = []
        for _, row in err.failure_cases.iterrows():
            # 🔥 FIX: failure_cases uses NaN (a float, not None) for the
            # 'index' of dataframe-level failures; int(NaN) raises ValueError
            # and would crash the error-reporting path itself.
            raw_index = row.get('index')
            safe_index = None
            if raw_index is not None and not pd.isna(raw_index):
                safe_index = int(raw_index)
            errors.append({
                'column': str(row.get('column', '')),
                'check': str(row.get('check', '')),
                'failure_case': str(row.get('failure_case', '')),
                'index': safe_index
            })

        return {
            'status': 'success',
            'valid': False,
            'message': f'Schema validation failed with {len(errors)} errors',
            'errors': errors[:50],  # Limit to 50 errors
            'total_errors': len(errors),
            'columns_validated': list(columns_config.keys())
        }
test_data/sample.csv DELETED
@@ -1,16 +0,0 @@
1
- age,income,score,purchased
2
- 25,50000,75,1
3
- 30,60000,82,1
4
- 22,45000,68,0
5
- 35,75000,88,1
6
- 28,55000,79,1
7
- 40,90000,92,1
8
- 23,42000,65,0
9
- 32,68000,85,1
10
- 27,52000,76,1
11
- 38,82000,90,1
12
- 24,48000,71,0
13
- 31,65000,84,1
14
- 26,51000,77,1
15
- 29,58000,80,1
16
- 33,72000,87,1