feature: nicer chat ui (#126)

marcellodebernardi · web-flow · commit fad9f2747cae · 2025-05-27T22:21:24.000-07:00
* chore: bump to 0.23.2

* feat: add some observability methods to registry

* fix: add fileio tests to ensure backwards comp

* feat: add 0.23.2 legacy model loading test

* refactor: tools for object registry entities

* fix: convert tags that can't be written with safe_dump

* feat: add dataset listing tool to manager

* fix: simplify schema resolver tool use

* fix: schema resolution before proper dataset processing

* feat: add ui for local testing of chat

* fix: encourage schema resolver to be more 'minimal'

* fix: rename get_raw_dataset_schema for clarity

* fix: memory flushed between messages

* chore: bump to 0.23.3

* fix: transformed dataset not marked immutable

* fix: schema resolver adds unnecessary fields

* chore: poetry lock
diff --git a/plexe/agents/agents.py b/plexe/agents/agents.py
@@ -2,12 +2,13 @@
 This module defines a multi-agent ML engineering system for building machine learning models.
 """
 
+import json
 import logging
 import types
 from dataclasses import dataclass, field
 from typing import List, Dict, Optional, Callable
 
-from smolagents import CodeAgent, LiteLLMModel
+from smolagents import CodeAgent, LiteLLMModel, AgentText
 
 from plexe.agents.dataset_analyser import EdaAgent
 from plexe.agents.dataset_splitter import DatasetSplitterAgent
@@ -206,6 +207,9 @@ def run(self, task, additional_args: dict) -> ModelGenerationResult:
             if logger.isEnabledFor(logging.DEBUG):
                 logger.debug("Agent result: %s", result)
 
+            if isinstance(result, AgentText):
+                result = json.loads(str(result))
+
             # Extract data from the agent result
             training_code_id = result.get("training_code_id", "")
             inference_code_id = result.get("inference_code_id", "")
diff --git a/plexe/agents/dataset_analyser.py b/plexe/agents/dataset_analyser.py
@@ -13,7 +13,7 @@
 from plexe.config import config, prompt_templates
 from plexe.internal.common.utils.agents import get_prompt_templates
 from plexe.tools.datasets import register_eda_report, drop_null_columns, get_latest_datasets
-from plexe.tools.schemas import get_raw_dataset_schema
+from plexe.tools.schemas import get_dataset_schema
 
 logger = logging.getLogger(__name__)
 
@@ -58,7 +58,7 @@ def __init__(
                 "- the name of the dataset to be analysed"
             ),
             model=LiteLLMModel(model_id=self.model_id),
-            tools=[drop_null_columns, register_eda_report, get_raw_dataset_schema, get_latest_datasets],
+            tools=[drop_null_columns, register_eda_report, get_dataset_schema, get_latest_datasets],
             add_base_tools=False,
             verbosity_level=self.verbosity,
             # planning_interval=3,
diff --git a/plexe/agents/model_trainer.py b/plexe/agents/model_trainer.py
@@ -12,7 +12,7 @@
 from plexe.internal.common.utils.agents import get_prompt_templates
 from plexe.tools.execution import get_executor_tool
 from plexe.tools.response_formatting import format_final_mle_agent_response
-from plexe.tools.schemas import get_raw_dataset_schema, get_model_schemas
+from plexe.tools.schemas import get_dataset_schema, get_model_schemas
 from plexe.tools.training import get_training_code_generation_tool, get_training_code_fixing_tool
 from plexe.tools.validation import validate_training_code
 from plexe.tools.datasets import get_training_datasets
@@ -58,7 +58,7 @@ def __init__(
             tools=[
                 get_training_code_generation_tool(tool_model_id),
                 validate_training_code,
-                get_raw_dataset_schema,
+                get_dataset_schema,
                 get_training_code_fixing_tool(tool_model_id),
                 get_executor_tool(distributed),
                 format_final_mle_agent_response,
diff --git a/plexe/main.py b/plexe/main.py
@@ -2,13 +2,61 @@
 Application entry point for using the plexe package as a conversational agent.
 """
 
-from smolagents import GradioUI
-from plexe.agents.conversational import ConversationalAgent
+import threading
+import time
+import webbrowser
+import logging
+
+import uvicorn
+
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
 
 
 def main():
-    ui = GradioUI(ConversationalAgent().agent)
-    ui.launch()
+    """
+    Launch the Plexe assistant with a web UI.
+
+    Starts the FastAPI app in a background uvicorn thread, opens the browser once the server
+    reports it has started, then blocks until the server stops or the user presses Ctrl+C.
+    """
+    host = "127.0.0.1"
+    port = 8000
+    startup_timeout = 30.0  # seconds to wait for uvicorn to come up
+
+    # Configure uvicorn to run in a thread
+    config = uvicorn.Config("plexe.server:app", host=host, port=port, log_level="info", reload=False)
+    server = uvicorn.Server(config)
+
+    # Start server in a background thread
+    thread = threading.Thread(target=server.run, daemon=True)
+    thread.start()
+
+    # Wait until uvicorn reports startup instead of sleeping for a fixed time; bail out if the
+    # server thread dies (e.g. the port is already in use) or startup takes too long
+    deadline = time.monotonic() + startup_timeout
+    while not server.started:
+        if not thread.is_alive() or time.monotonic() > deadline:
+            logger.error(f"Server failed to start on {host}:{port}")
+            server.should_exit = True
+            return
+        time.sleep(0.1)
+
+    # Open the browser
+    url = f"http://{host}:{port}"
+    logger.info(f"Opening browser at {url}")
+    webbrowser.open(url)
+
+    # Keep the main thread alive while the server is running
+    try:
+        logger.info("Plexe Assistant is running. Press Ctrl+C to stop.")
+        while thread.is_alive():
+            time.sleep(1)
+    except KeyboardInterrupt:
+        logger.info("\nShutting down Plexe Assistant...")
+        server.should_exit = True
+        # Wait briefly so uvicorn can shut down cleanly before the daemon thread is killed
+        thread.join(timeout=5)
 
 
 if __name__ == "__main__":
diff --git a/plexe/server.py b/plexe/server.py
@@ -0,0 +1,113 @@
+"""
+FastAPI server for the Plexe conversational agent.
+
+This module provides a lightweight WebSocket API for the conversational agent
+and serves the assistant-ui frontend for local execution.
+"""
+
+import json
+import logging
+import uuid
+from pathlib import Path
+
+from fastapi import FastAPI, WebSocket, WebSocketDisconnect
+from fastapi.concurrency import run_in_threadpool
+from fastapi.staticfiles import StaticFiles
+from fastapi.responses import FileResponse
+
+from plexe.agents.conversational import ConversationalAgent
+
+logger = logging.getLogger(__name__)
+
+app = FastAPI(title="Plexe Assistant", version="1.0.0")
+
+# Serve static files from the ui directory
+ui_dir = Path(__file__).parent / "ui"
+if ui_dir.exists():
+    app.mount("/static", StaticFiles(directory=str(ui_dir)), name="static")
+
+
+@app.get("/")
+async def root():
+    """Serve the main HTML page."""
+    index_path = ui_dir / "index.html"
+    if index_path.exists():
+        return FileResponse(str(index_path))
+    return {"error": "Frontend not found. Please ensure plexe/ui/index.html exists."}
+
+
+def _extract_user_message(data: str) -> str:
+    """
+    Extract the user's message text from a raw WebSocket frame.
+
+    A JSON object yields its "content" field (empty string if absent). Anything else,
+    i.e. plain text or JSON that is not an object, is treated as the message itself.
+    """
+    try:
+        payload = json.loads(data)
+    except json.JSONDecodeError:
+        return data
+    if not isinstance(payload, dict):
+        return data
+    content = payload.get("content", "")
+    return content if isinstance(content, str) else str(content)
+
+
+@app.websocket("/ws")
+async def websocket_endpoint(websocket: WebSocket):
+    """
+    WebSocket endpoint for real-time chat communication.
+
+    Each connection gets its own ConversationalAgent. Every received frame is passed to the
+    agent and the reply is sent back as a JSON message with "role", "content" and "id" keys;
+    failures while handling a message are reported to the client with an extra "error" flag.
+    """
+    await websocket.accept()
+    session_id = str(uuid.uuid4())
+    logger.info(f"New WebSocket connection: {session_id}")
+
+    # Create a new agent instance for this session
+    agent = ConversationalAgent()
+
+    try:
+        while True:
+            # Receive message from client
+            data = await websocket.receive_text()
+
+            try:
+                user_message = _extract_user_message(data)
+                logger.debug(f"Processing message: {user_message[:100]}...")
+
+                # The agent run is synchronous and can take a long time; run it in a worker
+                # thread so the event loop keeps serving other requests in the meantime
+                response = await run_in_threadpool(agent.agent.run, user_message, reset=False)
+
+                # Send response back to client
+                await websocket.send_json({"role": "assistant", "content": response, "id": str(uuid.uuid4())})
+
+            except WebSocketDisconnect:
+                # Let the outer handler deal with a client that went away
+                raise
+
+            except Exception as e:
+                logger.exception(f"Error processing message: {e}")
+                await websocket.send_json(
+                    {
+                        "role": "assistant",
+                        "content": f"I encountered an error: {str(e)}. Please try again.",
+                        "id": str(uuid.uuid4()),
+                        "error": True,
+                    }
+                )
+
+    except WebSocketDisconnect:
+        logger.info(f"WebSocket disconnected: {session_id}")
+    except Exception as e:
+        logger.error(f"WebSocket error for session {session_id}: {e}")
+        await websocket.close()
+
+
+@app.get("/health")
+async def health_check():
+    """Health check endpoint."""
+    return {"status": "healthy", "service": "plexe-assistant"}
diff --git a/plexe/templates/prompts/agent/eda_prompt_templates.yaml b/plexe/templates/prompts/agent/eda_prompt_templates.yaml
@@ -14,7 +14,7 @@ managed_agent:
     ## Available Tools:
     - `get_latest_datasets`: Returns all available datasets with their roles (raw, transformed, train, val, test)
     - `drop_null_columns`: Clean datasets by removing problematic columns
-    - `get_raw_dataset_schema`: Get column names and types for a dataset
+    - `get_dataset_schema`: Get column names and types for a dataset
     - `register_eda_report`: Store your analysis findings
     
     To access datasets, USE EXACTLY THIS PATTERN:
diff --git a/plexe/templates/prompts/agent/mle_prompt_templates.yaml b/plexe/templates/prompts/agent/mle_prompt_templates.yaml
@@ -10,7 +10,7 @@ managed_agent:
     ## Available Tools:
     - `get_training_datasets`: Get training and validation dataset names automatically
     - `get_model_schemas`: Get input/output schemas directly
-    - `get_raw_dataset_schema`: Understand dataset structure
+    - `get_dataset_schema`: Understand dataset structure
     - `get_feature_transformer_code`: Retrieve feature transformation code (if exists) if you need to review it
     - `generate_training_code`: Generate ML training code
     - `validate_training_code`: Validate generated code
diff --git a/plexe/templates/prompts/agent/schema_resolver_prompt_templates.yaml b/plexe/templates/prompts/agent/schema_resolver_prompt_templates.yaml
@@ -31,13 +31,15 @@ managed_agent:
     5. Call register_final_model_schemas with your determined schemas and reasoning
     
     ## Key requirements:
-    1. IMPORTANT: keep schemas aligned with dataset structure unless the task clearly requires otherwise
+    1. IMPORTANT: keep schemas conceptually aligned with dataset structure
     2. Use only Python types: "int", "float", "str", "bool"
     3. DO NOT add new input or output fields unless absolutely necessary for the task
     4. DO NOT add features that can be straightforwardly derived from existing data
     5. Schemas should include only necessary fields for the model's purpose
     6. You can REMOVE fields that are unnecessary, irrelevant, redundant, or contain bad data; this is highly encouraged
-    6. Include reasoning for any deviations from the dataset structure
+    7. Include reasoning for any deviations from the dataset structure
+    8. Ensure the schemas are 'minimal' and 'sufficient': for example, if A is a categorical variable and X, Y, Z are 
+    boolean indicators of the possible values of A, you can remove X, Y, Z from the input schema and keep only A.
     
     When calling register_final_model_schemas, use this format:
     - input_schema: dictionary mapping field names to types
diff --git a/plexe/tools/execution.py b/plexe/tools/execution.py
@@ -283,7 +283,7 @@ def apply_feature_transformer(dataset_name: str) -> Dict:
         # Register transformed dataset
         transformed_name = f"{dataset_name}_transformed"
         transformed_ds = DatasetAdapter.coerce(transformed_df)
-        object_registry.register(TabularConvertible, transformed_name, transformed_ds, overwrite=True)
+        object_registry.register(TabularConvertible, transformed_name, transformed_ds, overwrite=True, immutable=True)
 
         logger.debug(f"✅ Applied feature transformer to {dataset_name} → {transformed_name}")
 
diff --git a/plexe/tools/schemas.py b/plexe/tools/schemas.py
@@ -74,9 +74,10 @@ def register_final_model_schemas(
 
 
 @tool
-def get_raw_dataset_schema(dataset_name: str) -> Dict[str, Any]:
+def get_dataset_schema(dataset_name: str) -> Dict[str, Any]:
     """
-    Extract the schema (column names and types) from a raw dataset.
+    Extract the schema (column names and types) from a dataset. This is useful for understanding the structure
+    of the dataset and how it can be used in model training.
 
     Args:
         dataset_name: Name of the dataset in the registry
diff --git a/plexe/ui/index.html b/plexe/ui/index.html
diff --git a/poetry.lock b/poetry.lock
diff --git a/pyproject.toml b/pyproject.toml