feat: add "blocked for human input" feature across full stack

Agents can now request structured human input when they encounter genuine blockers (API keys, design choices, external configs). The request is displayed in the UI with a dynamic form, and the human's response is stored and made available when the agent resumes. Changes span 21 files + 1 new component: - Database: 3 new columns (needs_human_input, human_input_request, human_input_response) with migration - MCP: new feature_request_human_input tool + guards on existing tools - API: new resolve-human-input endpoint, 4th feature bucket - Orchestrator: skip needs_human_input features in scheduling - Progress: 4-tuple return from count_passing_tests - WebSocket: needs_human_input count in progress messages - UI: conditional 4th Kanban column, HumanInputForm component, amber status indicators, dependency graph support Co-Authored-By: Claude Opus 4.6 <noreply@anthropic.com>
2026-03-17 10:53:09 +00:00 · 2026-02-08 14:11:35 -05:00
parent 9eb08d3f71
commit 656df0fd9a
21 changed files with 570 additions and 53 deletions
--- a/server/routers/features.py
+++ b/server/routers/features.py
@@ -23,6 +23,7 @@ from ..schemas import (
    FeatureListResponse,
    FeatureResponse,
    FeatureUpdate,
+    HumanInputResponse,
 )
 from ..utils.project_helpers import get_project_path as _get_project_path
 from ..utils.validation import validate_project_name
@@ -104,6 +105,9 @@ def feature_to_response(f, passing_ids: set[int] | None = None) -> FeatureRespon
        in_progress=f.in_progress if f.in_progress is not None else False,
        blocked=blocked,
        blocking_dependencies=blocking,
+        needs_human_input=getattr(f, 'needs_human_input', False) or False,
+        human_input_request=getattr(f, 'human_input_request', None),
+        human_input_response=getattr(f, 'human_input_response', None),
    )


@@ -143,11 +147,14 @@ async def list_features(project_name: str):
            pending = []
            in_progress = []
            done = []
+            needs_human_input_list = []

            for f in all_features:
                feature_response = feature_to_response(f, passing_ids)
                if f.passes:
                    done.append(feature_response)
+                elif getattr(f, 'needs_human_input', False):
+                    needs_human_input_list.append(feature_response)
                elif f.in_progress:
                    in_progress.append(feature_response)
                else:
@@ -157,6 +164,7 @@ async def list_features(project_name: str):
                pending=pending,
                in_progress=in_progress,
                done=done,
+                needs_human_input=needs_human_input_list,
            )
    except HTTPException:
        raise
@@ -341,9 +349,11 @@ async def get_dependency_graph(project_name: str):
                deps = f.dependencies or []
                blocking = [d for d in deps if d not in passing_ids]

-                status: Literal["pending", "in_progress", "done", "blocked"]
+                status: Literal["pending", "in_progress", "done", "blocked", "needs_human_input"]
                if f.passes:
                    status = "done"
+                elif getattr(f, 'needs_human_input', False):
+                    status = "needs_human_input"
                elif blocking:
                    status = "blocked"
                elif f.in_progress:
@@ -564,6 +574,71 @@ async def skip_feature(project_name: str, feature_id: int):
        raise HTTPException(status_code=500, detail="Failed to skip feature")


+@router.post("/{feature_id}/resolve-human-input", response_model=FeatureResponse)
+async def resolve_human_input(project_name: str, feature_id: int, response: HumanInputResponse):
+    """Resolve a human input request for a feature.
+
+    Validates all required fields have values, stores the response,
+    and returns the feature to the pending queue for agents to pick up.
+    """
+    project_name = validate_project_name(project_name)
+    project_dir = _get_project_path(project_name)
+
+    if not project_dir:
+        raise HTTPException(status_code=404, detail=f"Project '{project_name}' not found in registry")
+
+    if not project_dir.exists():
+        raise HTTPException(status_code=404, detail="Project directory not found")
+
+    _, Feature = _get_db_classes()
+
+    try:
+        with get_db_session(project_dir) as session:
+            feature = session.query(Feature).filter(Feature.id == feature_id).first()
+
+            if not feature:
+                raise HTTPException(status_code=404, detail=f"Feature {feature_id} not found")
+
+            if not getattr(feature, 'needs_human_input', False):
+                raise HTTPException(status_code=400, detail="Feature is not waiting for human input")
+
+            # Validate required fields
+            request_data = feature.human_input_request
+            if request_data and isinstance(request_data, dict):
+                for field_def in request_data.get("fields", []):
+                    if field_def.get("required", True):
+                        field_id = field_def.get("id")
+                        if field_id not in response.fields or response.fields[field_id] in (None, ""):
+                            raise HTTPException(
+                                status_code=400,
+                                detail=f"Required field '{field_def.get('label', field_id)}' is missing"
+                            )
+
+            # Store response and return to pending queue
+            from datetime import datetime, timezone
+            response_data = {
+                "fields": {k: v for k, v in response.fields.items()},
+                "responded_at": datetime.now(timezone.utc).isoformat(),
+            }
+            feature.human_input_response = response_data
+            feature.needs_human_input = False
+            # Keep in_progress=False, passes=False so it returns to pending
+
+            session.commit()
+            session.refresh(feature)
+
+            # Compute passing IDs for response
+            all_features = session.query(Feature).all()
+            passing_ids = {f.id for f in all_features if f.passes}
+
+            return feature_to_response(feature, passing_ids)
+    except HTTPException:
+        raise
+    except Exception:
+        logger.exception("Failed to resolve human input")
+        raise HTTPException(status_code=500, detail="Failed to resolve human input")
+
+
 # ============================================================================
 # Dependency Management Endpoints
 # ============================================================================
--- a/server/routers/projects.py
+++ b/server/routers/projects.py
@@ -102,7 +102,7 @@ def get_project_stats(project_dir: Path) -> ProjectStats:
    """Get statistics for a project."""
    _init_imports()
    assert _count_passing_tests is not None  # guaranteed by _init_imports()
-    passing, in_progress, total = _count_passing_tests(project_dir)
+    passing, in_progress, total, _needs_human_input = _count_passing_tests(project_dir)
    percentage = (passing / total * 100) if total > 0 else 0.0
    return ProjectStats(
        passing=passing,
--- a/server/schemas.py
+++ b/server/schemas.py
@@ -120,16 +120,41 @@ class FeatureResponse(FeatureBase):
    in_progress: bool
    blocked: bool = False  # Computed: has unmet dependencies
    blocking_dependencies: list[int] = Field(default_factory=list)  # Computed
+    needs_human_input: bool = False
+    human_input_request: dict | None = None
+    human_input_response: dict | None = None

    class Config:
        from_attributes = True


+class HumanInputField(BaseModel):
+    """Schema for a single human input field."""
+    id: str
+    label: str
+    type: Literal["text", "textarea", "select", "boolean"] = "text"
+    required: bool = True
+    placeholder: str | None = None
+    options: list[dict] | None = None  # For select: [{value, label}]
+
+
+class HumanInputRequest(BaseModel):
+    """Schema for an agent's human input request."""
+    prompt: str
+    fields: list[HumanInputField]
+
+
+class HumanInputResponse(BaseModel):
+    """Schema for a human's response to an input request."""
+    fields: dict[str, str | bool | list[str]]
+
+
 class FeatureListResponse(BaseModel):
    """Response containing list of features organized by status."""
    pending: list[FeatureResponse]
    in_progress: list[FeatureResponse]
    done: list[FeatureResponse]
+    needs_human_input: list[FeatureResponse] = Field(default_factory=list)


 class FeatureBulkCreate(BaseModel):
@@ -153,7 +178,7 @@ class DependencyGraphNode(BaseModel):
    id: int
    name: str
    category: str
-    status: Literal["pending", "in_progress", "done", "blocked"]
+    status: Literal["pending", "in_progress", "done", "blocked", "needs_human_input"]
    priority: int
    dependencies: list[int]

@@ -257,6 +282,7 @@ class WSProgressMessage(BaseModel):
    in_progress: int
    total: int
    percentage: float
+    needs_human_input: int = 0


 class WSFeatureUpdateMessage(BaseModel):
--- a/server/services/process_manager.py
+++ b/server/services/process_manager.py
@@ -255,7 +255,10 @@ class AgentProcessManager:
                ).all()
                if stuck:
                    for f in stuck:
-                        f.in_progress = False
+                        # Don't clear in_progress for features blocked for human input -
+                        # they should stay in needs_human_input state even after crash
+                        if not getattr(f, 'needs_human_input', False):
+                            f.in_progress = False
                    session.commit()
                    logger.info(
                        "Cleaned up %d stuck feature(s) for %s",
--- a/server/websocket.py
+++ b/server/websocket.py
@@ -689,15 +689,19 @@ async def poll_progress(websocket: WebSocket, project_name: str, project_dir: Pa
    last_in_progress = -1
    last_total = -1

+    last_needs_human_input = -1
+
    while True:
        try:
-            passing, in_progress, total = count_passing_tests(project_dir)
+            passing, in_progress, total, needs_human_input = count_passing_tests(project_dir)

            # Only send if changed
-            if passing != last_passing or in_progress != last_in_progress or total != last_total:
+            if (passing != last_passing or in_progress != last_in_progress
+                    or total != last_total or needs_human_input != last_needs_human_input):
                last_passing = passing
                last_in_progress = in_progress
                last_total = total
+                last_needs_human_input = needs_human_input
                percentage = (passing / total * 100) if total > 0 else 0

                await websocket.send_json({
@@ -706,6 +710,7 @@ async def poll_progress(websocket: WebSocket, project_name: str, project_dir: Pa
                    "in_progress": in_progress,
                    "total": total,
                    "percentage": round(percentage, 1),
+                    "needs_human_input": needs_human_input,
                })

            await asyncio.sleep(2)  # Poll every 2 seconds
@@ -858,7 +863,7 @@ async def project_websocket(websocket: WebSocket, project_name: str):

        # Send initial progress
        count_passing_tests = _get_count_passing_tests()
-        passing, in_progress, total = count_passing_tests(project_dir)
+        passing, in_progress, total, needs_human_input = count_passing_tests(project_dir)
        percentage = (passing / total * 100) if total > 0 else 0
        await websocket.send_json({
            "type": "progress",
@@ -866,6 +871,7 @@ async def project_websocket(websocket: WebSocket, project_name: str):
            "in_progress": in_progress,
            "total": total,
            "percentage": round(percentage, 1),
+            "needs_human_input": needs_human_input,
        })

        # Keep connection alive and handle incoming messages