refactor example project so each agent does its job in turn

2026-01-09 21:27:53 -05:00 · 2024-06-13 10:48:37 +02:00
parent 1645cdd277
commit 7d225bbfe2
11 changed files with 185 additions and 111 deletions
--- a/core/agents/architect.py
+++ b/core/agents/architect.py
@@ -4,10 +4,12 @@ from pydantic import BaseModel, Field

 from core.agents.base import BaseAgent
 from core.agents.convo import AgentConvo
-from core.agents.mixins import SystemDependencyCheckerMixin
 from core.agents.response import AgentResponse
+from core.db.models import Specification
 from core.llm.parser import JSONParser
+from core.log import get_logger
 from core.telemetry import telemetry
+from core.templates.example_project import EXAMPLE_PROJECTS
 from core.templates.registry import PROJECT_TEMPLATES, ProjectTemplateEnum
 from core.ui.base import ProjectStage

@@ -16,6 +18,8 @@ WARN_SYSTEM_DEPS = ["docker", "kubernetes", "microservices"]
 WARN_FRAMEWORKS = ["next.js", "vue", "vue.js", "svelte", "angular"]
 WARN_FRAMEWORKS_URL = "https://github.com/Pythagora-io/gpt-pilot/wiki/Using-GPT-Pilot-with-frontend-frameworks"

+log = get_logger(__name__)
+

 # FIXME: all the reponse pydantic models should be strict (see config._StrictModel), also check if we
 # can disallow adding custom Python attributes to the model
@@ -68,33 +72,41 @@ class Architecture(BaseModel):
    )


-class Architect(SystemDependencyCheckerMixin, BaseAgent):
+class Architect(BaseAgent):
    agent_type = "architect"
    display_name = "Architect"

    async def run(self) -> AgentResponse:
        await self.ui.send_project_stage(ProjectStage.ARCHITECTURE)

+        spec = self.current_state.specification.clone()
+
+        if spec.example_project:
+            self.prepare_example_project(spec)
+        else:
+            await self.plan_architecture(spec)
+
+        await self.check_system_dependencies(spec)
+
+        self.next_state.specification = spec
+        telemetry.set("template", spec.template)
+        self.next_state.action = ARCHITECTURE_STEP_NAME
+        return AgentResponse.done(self)
+
+    async def plan_architecture(self, spec: Specification):
+        await self.send_message("Planning project architecture ...")
+
        llm = self.get_llm()
        convo = AgentConvo(self).template("technologies", templates=PROJECT_TEMPLATES).require_schema(Architecture)
-
-        await self.send_message("Planning project architecture ...")
        arch: Architecture = await llm(convo, parser=JSONParser(Architecture))

        await self.check_compatibility(arch)

-        spec = self.current_state.specification.clone()
        spec.architecture = arch.architecture
        spec.system_dependencies = [d.model_dump() for d in arch.system_dependencies]
        spec.package_dependencies = [d.model_dump() for d in arch.package_dependencies]
        spec.template = arch.template.value if arch.template else None

-        self.next_state.specification = spec
-        await self.check_system_dependencies(spec)
-        telemetry.set("template", spec.template)
-        self.next_state.action = ARCHITECTURE_STEP_NAME
-        return AgentResponse.done(self)
-
    async def check_compatibility(self, arch: Architecture) -> bool:
        warn_system_deps = [dep.name for dep in arch.system_dependencies if dep.name.lower() in WARN_SYSTEM_DEPS]
        warn_package_deps = [dep.name for dep in arch.package_dependencies if dep.name.lower() in WARN_FRAMEWORKS]
@@ -122,3 +134,51 @@ class Architect(SystemDependencyCheckerMixin, BaseAgent):
        # return AgentResponse.revise_spec()
        # that SpecWriter should catch and allow the user to reword the initial spec.
        return True
+
+    def prepare_example_project(self, spec: Specification):
+        log.debug(f"Setting architecture for example project: {spec.example_project}")
+        arch = EXAMPLE_PROJECTS[spec.example_project]["architecture"]
+
+        spec.architecture = arch["architecture"]
+        spec.system_dependencies = arch["system_dependencies"]
+        spec.package_dependencies = arch["package_dependencies"]
+        spec.template = arch["template"]
+        telemetry.set("template", spec.template)
+
+    async def check_system_dependencies(self, spec: Specification):
+        """
+        Check whether the required system dependencies are installed.
+
+        This also stores the app architecture telemetry data, including the
+        information about whether each system dependency is installed.
+
+        :param spec: Project specification.
+        """
+        deps = spec.system_dependencies
+
+        for dep in deps:
+            status_code, _, _ = await self.process_manager.run_command(dep["test"])
+            dep["installed"] = bool(status_code == 0)
+            if status_code != 0:
+                if dep["required_locally"]:
+                    remedy = "Please install it before proceeding with your app."
+                else:
+                    remedy = "If you would like to use it locally, please install it before proceeding."
+                await self.send_message(f"❌ {dep['name']} is not available. {remedy}")
+                await self.ask_question(
+                    f"Once you have installed {dep['name']}, please press Continue.",
+                    buttons={"continue": "Continue"},
+                    buttons_only=True,
+                    default="continue",
+                )
+            else:
+                await self.send_message(f"✅ {dep['name']} is available.")
+
+        telemetry.set(
+            "architecture",
+            {
+                "description": spec.architecture,
+                "system_dependencies": deps,
+                "package_dependencies": spec.package_dependencies,
+            },
+        )
--- a/core/agents/external_docs.py
+++ b/core/agents/external_docs.py
@@ -26,7 +26,7 @@ class SelectedDocsets(BaseModel):
 class ExternalDocumentation(BaseAgent):
    """Agent in charge of collecting and storing additional documentation.

-    Docs are per task and are stores in the `tasks` variable in the project state.
+    Docs are per task and are stores in the `docs` variable in the project state.
    This agent ensures documentation is collected only once per task.

    Agent does 2 LLM interactions:
@@ -44,7 +44,12 @@ class ExternalDocumentation(BaseAgent):
    display_name = "Documentation"

    async def run(self) -> AgentResponse:
-        available_docsets = await self._get_available_docsets()
+        if self.current_state.specification.example_project:
+            log.debug("Example project detected, no documentation selected.")
+            available_docsets = []
+        else:
+            available_docsets = await self._get_available_docsets()
+
        selected_docsets = await self._select_docsets(available_docsets)
        await telemetry.trace_code_event("docsets_used", selected_docsets)

@@ -149,6 +154,8 @@ class ExternalDocumentation(BaseAgent):
        Documentation snippets are stored as a list of dictionaries:
        {"key": docset-key, "desc": documentation-description, "snippets": list-of-snippets}

+        :param snippets: List of tuples: (docset_key, snippets)
+        :param available_docsets: List of available docsets from the API.
        """

        docsets_dict = dict(available_docsets)
@@ -157,4 +164,3 @@ class ExternalDocumentation(BaseAgent):
            docs.append({"key": docset_key, "desc": docsets_dict[docset_key], "snippets": snip})

        self.next_state.docs = docs
-        self.next_state.flag_tasks_as_modified()
--- a/core/agents/mixins.py
+++ b/core/agents/mixins.py
@@ -1,8 +1,6 @@
 from typing import Optional

 from core.agents.convo import AgentConvo
-from core.db.models.specification import Specification
-from core.telemetry import telemetry


 class IterationPromptMixin:
@@ -37,54 +35,3 @@ class IterationPromptMixin:
        )
        llm_solution: str = await llm(convo)
        return llm_solution
-
-
-class SystemDependencyCheckerMixin:
-    """
-    Provides a method to check whether the required system dependencies are installed.
-
-    Used by Architect and SpecWriter agents. Assumes the agent has access to UI
-    and ProcessManager.
-    """
-
-    async def check_system_dependencies(self, spec: Specification):
-        """
-        Check whether the required system dependencies are installed.
-
-        This also stores the app architecture telemetry data, including the
-        information about whether each system dependency is installed.
-
-        :param spec: Project specification.
-        """
-        deps = spec.system_dependencies
-        checked = {}
-
-        for dep in deps:
-            status_code, _, _ = await self.process_manager.run_command(dep["test"])
-            dep["installed"] = bool(status_code == 0)
-            if status_code != 0:
-                if dep["required_locally"]:
-                    remedy = "Please install it before proceeding with your app."
-                else:
-                    remedy = "If you would like to use it locally, please install it before proceeding."
-                await self.send_message(f"❌ {dep['name']} is not available. {remedy}")
-                await self.ask_question(
-                    f"Once you have installed {dep['name']}, please press Continue.",
-                    buttons={"continue": "Continue"},
-                    buttons_only=True,
-                    default="continue",
-                )
-                checked[dep["name"]] = "missing"
-            else:
-                await self.send_message(f"✅ {dep['name']} is available.")
-                checked[dep["name"]] = "present"
-
-        telemetry.set(
-            "architecture",
-            {
-                "description": spec.architecture,
-                "system_dependencies": deps,
-                "package_dependencies": spec.package_dependencies,
-                "checked_system_dependencies": checked,
-            },
-        )
--- a/core/agents/spec_writer.py
+++ b/core/agents/spec_writer.py
@@ -1,14 +1,13 @@
 from core.agents.base import BaseAgent
 from core.agents.convo import AgentConvo
-from core.agents.mixins import SystemDependencyCheckerMixin
 from core.agents.response import AgentResponse
 from core.db.models import Complexity
 from core.llm.parser import StringParser
+from core.log import get_logger
 from core.telemetry import telemetry
 from core.templates.example_project import (
-    EXAMPLE_PROJECT_ARCHITECTURE,
-    EXAMPLE_PROJECT_DESCRIPTION,
-    EXAMPLE_PROJECT_PLAN,
+    DEFAULT_EXAMPLE_PROJECT,
+    EXAMPLE_PROJECTS,
 )

 # If the project description is less than this, perform an analysis using LLM
@@ -19,8 +18,10 @@ INITIAL_PROJECT_HOWTO_URL = (
 )
 SPEC_STEP_NAME = "Create specification"

+log = get_logger(__name__)

-class SpecWriter(SystemDependencyCheckerMixin, BaseAgent):
+
+class SpecWriter(BaseAgent):
    agent_type = "spec-writer"
    display_name = "Spec Writer"

@@ -42,16 +43,15 @@ class SpecWriter(SystemDependencyCheckerMixin, BaseAgent):
            return AgentResponse.import_project(self)

        if response.button == "example":
-            await self.send_message("Starting example project with description:")
-            await self.send_message(EXAMPLE_PROJECT_DESCRIPTION)
-            await self.prepare_example_project()
+            await self.prepare_example_project(DEFAULT_EXAMPLE_PROJECT)
            return AgentResponse.done(self)
+
        elif response.button == "continue":
            # FIXME: Workaround for the fact that VSCode "continue" button does
            # nothing but repeat the question. We reproduce this bug for bug here.
            return AgentResponse.done(self)

-        spec = response.text
+        spec = response.text.strip()

        complexity = await self.check_prompt_complexity(spec)
        await telemetry.trace_code_event(
@@ -82,31 +82,21 @@ class SpecWriter(SystemDependencyCheckerMixin, BaseAgent):
        llm_response: str = await llm(convo, temperature=0, parser=StringParser())
        return llm_response.lower()

-    async def prepare_example_project(self):
+    async def prepare_example_project(self, example_name: str):
+        example_description = EXAMPLE_PROJECTS[example_name]["description"].strip()
+
+        log.debug(f"Starting example project: {example_name}")
+        await self.send_message(f"Starting example project with description:\n\n{example_description}")
+
        spec = self.current_state.specification.clone()
-        spec.description = EXAMPLE_PROJECT_DESCRIPTION
-        spec.architecture = EXAMPLE_PROJECT_ARCHITECTURE["architecture"]
-        spec.system_dependencies = EXAMPLE_PROJECT_ARCHITECTURE["system_dependencies"]
-        spec.package_dependencies = EXAMPLE_PROJECT_ARCHITECTURE["package_dependencies"]
-        spec.template = EXAMPLE_PROJECT_ARCHITECTURE["template"]
-        spec.complexity = Complexity.SIMPLE
-        telemetry.set("initial_prompt", spec.description.strip())
-        telemetry.set("is_complex_app", False)
-        telemetry.set("template", spec.template)
-
-        await self.check_system_dependencies(spec)
-
+        spec.example_project = example_name
+        spec.description = example_description
+        spec.complexity = EXAMPLE_PROJECTS[example_name]["complexity"]
        self.next_state.specification = spec

-        self.next_state.epics = [
-            {
-                "name": "Initial Project",
-                "description": EXAMPLE_PROJECT_DESCRIPTION,
-                "completed": False,
-                "complexity": Complexity.SIMPLE,
-            }
-        ]
-        self.next_state.tasks = EXAMPLE_PROJECT_PLAN
+        telemetry.set("initial_prompt", spec.description)
+        telemetry.set("example_project", example_name)
+        telemetry.set("is_complex_app", spec.complexity != Complexity.SIMPLE)

    async def analyze_spec(self, spec: str) -> str:
        msg = (
--- a/core/agents/tech_lead.py
+++ b/core/agents/tech_lead.py
@@ -11,6 +11,7 @@ from core.db.models.project_state import TaskStatus
 from core.llm.parser import JSONParser
 from core.log import get_logger
 from core.telemetry import telemetry
+from core.templates.example_project import EXAMPLE_PROJECTS
 from core.templates.registry import apply_project_template, get_template_description, get_template_summary
 from core.ui.base import ProjectStage, success_source

@@ -42,8 +43,10 @@ class TechLead(BaseAgent):
            return await self.update_epic()

        if len(self.current_state.epics) == 0:
-            self.create_initial_project_epic()
-            # Orchestrator will rerun us to break down the initial project epic
+            if self.current_state.specification.example_project:
+                self.plan_example_project()
+            else:
+                self.create_initial_project_epic()
            return AgentResponse.done(self)

        await self.ui.send_project_stage(ProjectStage.CODING)
@@ -203,3 +206,18 @@ class TechLead(BaseAgent):
        ]
        log.debug(f"Updated development plan for {epic['name']}, {len(response.plan)} tasks remaining")
        return AgentResponse.done(self)
+
+    def plan_example_project(self):
+        example_name = self.current_state.specification.example_project
+        log.debug(f"Planning example project: {example_name}")
+
+        example = EXAMPLE_PROJECTS[example_name]
+        self.next_state.epics = [
+            {
+                "name": "Initial Project",
+                "description": example["description"],
+                "completed": False,
+                "complexity": example["complexity"],
+            }
+        ]
+        self.next_state.tasks = example["plan"]
--- a/core/db/migrations/README
+++ b/core/db/migrations/README
@@ -1 +1,10 @@
-Generic single-database configuration.
+Pythagora uses Alembic for database migrations.
+
+After changing any of the database models, create a new migration:
+
+    alembic -c core/db/alembic.ini revision --autogenerate -m "description"
+
+Migrations are applied automatically when the application starts, but can also be
+run manually with:
+
+    alembic -c core/db/alembic.ini upgrade head
--- a/core/db/migrations/versions/ff891d366761_add_example_project_to_spec.py
+++ b/core/db/migrations/versions/ff891d366761_add_example_project_to_spec.py
@@ -0,0 +1,34 @@
+"""add example project to spec
+
+Revision ID: ff891d366761
+Revises: b760f66138c0
+Create Date: 2024-06-13 09:38:33.329161
+
+"""
+
+from typing import Sequence, Union
+
+import sqlalchemy as sa
+from alembic import op
+
+# revision identifiers, used by Alembic.
+revision: str = "ff891d366761"
+down_revision: Union[str, None] = "b760f66138c0"
+branch_labels: Union[str, Sequence[str], None] = None
+depends_on: Union[str, Sequence[str], None] = None
+
+
+def upgrade() -> None:
+    # ### commands auto generated by Alembic - please adjust! ###
+    with op.batch_alter_table("specifications", schema=None) as batch_op:
+        batch_op.add_column(sa.Column("example_project", sa.String(), nullable=True))
+
+    # ### end Alembic commands ###
+
+
+def downgrade() -> None:
+    # ### commands auto generated by Alembic - please adjust! ###
+    with op.batch_alter_table("specifications", schema=None) as batch_op:
+        batch_op.drop_column("example_project")
+
+    # ### end Alembic commands ###
--- a/core/db/models/specification.py
+++ b/core/db/models/specification.py
@@ -31,6 +31,7 @@ class Specification(Base):
    package_dependencies: Mapped[list[dict]] = mapped_column(default=list)
    template: Mapped[Optional[str]] = mapped_column()
    complexity: Mapped[str] = mapped_column(server_default=Complexity.HARD)
+    example_project: Mapped[Optional[str]] = mapped_column()

    # Relationships
    project_states: Mapped[list["ProjectState"]] = relationship(back_populates="specification", lazy="raise")
@@ -46,6 +47,7 @@ class Specification(Base):
            package_dependencies=self.package_dependencies,
            template=self.template,
            complexity=self.complexity,
+            example_project=self.example_project,
        )
        return clone

--- a/core/telemetry/init.py
+++ b/core/telemetry/init.py
@@ -73,7 +73,7 @@ class Telemetry:
            "python_version": sys.version,
            # GPT Pilot version
            "pilot_version": get_version(),
-            # GPT Pilot Extension version
+            # Pythagora VSCode Extension version
            "extension_version": None,
            # Is extension used
            "is_extension": False,
@@ -86,6 +86,8 @@ class Telemetry:
            "is_complex_app": None,
            # Optional template used for the project
            "template": None,
+            # Optional, example project selected by the user
+            "example_project": None,
            # Optional user contact email
            "user_contact": None,
            # Unique project ID (app_id)
--- a/core/templates/example_project.py
+++ b/core/templates/example_project.py
@@ -1,3 +1,5 @@
+from core.db.models import Complexity
+
 EXAMPLE_PROJECT_DESCRIPTION = """
 The application is a simple ToDo app built using React. Its primary function is to allow users to manage a list of tasks (todos). Each task has a description and a state (open or completed, with the default state being open). The application is frontend-only, with no user sign-up or authentication process. The goal is to provide a straightforward and user-friendly interface for task management.

@@ -64,3 +66,15 @@ EXAMPLE_PROJECT_PLAN = [
        "status": "todo",
    }
 ]
+
+
+EXAMPLE_PROJECTS = {
+    "example-project": {
+        "description": EXAMPLE_PROJECT_DESCRIPTION,
+        "architecture": EXAMPLE_PROJECT_ARCHITECTURE,
+        "complexity": Complexity.SIMPLE,
+        "plan": EXAMPLE_PROJECT_PLAN,
+    }
+}
+
+DEFAULT_EXAMPLE_PROJECT = "example-project"
--- a/tests/agents/test_spec_writer.py
+++ b/tests/agents/test_spec_writer.py
@@ -23,16 +23,8 @@ async def test_start_example_project(agentcontext):
    assert response.type == ResponseType.DONE

    assert sm.current_state.specification.description != ""
-    assert sm.current_state.specification.architecture != ""
-    assert sm.current_state.specification.system_dependencies != []
-    assert sm.current_state.specification.package_dependencies != []
    assert sm.current_state.specification.complexity == Complexity.SIMPLE
-    assert sm.current_state.epics != []
-    assert sm.current_state.tasks != []
-    pm.run_command.assert_awaited_once_with("node --version")
-
-    assert telemetry.data["initial_prompt"] == sm.current_state.specification.description.strip()
-    assert telemetry.data["architecture"]["system_dependencies"][0]["installed"] is True
+    assert telemetry.data["initial_prompt"] == sm.current_state.specification.description


@pytest.mark.asyncio