Human handoff #1084

Closed
wants to merge 13 commits into from
222 changes: 189 additions & 33 deletions core/agents/bug_hunter.py
@@ -30,6 +30,21 @@ class HuntConclusionOptions(BaseModel):
)


class ImportantLog(BaseModel):
logCode: str = Field(description="Actual line of code that prints the log.")
shouldBeDifferent: bool = Field(
description="Whether the current output should be different from the expected output."
)
filePath: str = Field(description="Path to the file in which the log exists.")
currentOutput: str = Field(description="Current output of the log.")
expectedOutput: str = Field(description="Expected output of the log.")
explanation: str = Field(description="A brief explanation of the log.")


class ImportantLogsForDebugging(BaseModel):
logs: list[ImportantLog] = Field(description="Important logs that will help the human debug the current bug.")


class BugHunter(BaseAgent):
agent_type = "bug-hunter"
display_name = "Bug Hunter"
@@ -46,6 +61,8 @@ async def run(self) -> AgentResponse:
return await self.ask_user_to_test(False, True)
elif current_iteration["status"] == IterationStatus.AWAITING_BUG_REPRODUCTION:
return await self.ask_user_to_test(True, False)
elif current_iteration["status"] == IterationStatus.START_PAIR_PROGRAMMING:
return await self.start_pair_programming()

async def get_bug_reproduction_instructions(self):
llm = self.get_llm()
@@ -62,24 +79,7 @@ async def get_bug_reproduction_instructions(self):

async def check_logs(self, logs_message: str = None):
llm = self.get_llm(CHECK_LOGS_AGENT_NAME)
convo = AgentConvo(self).template(
"iteration",
current_task=self.current_state.current_task,
user_feedback=self.current_state.current_iteration["user_feedback"],
user_feedback_qa=self.current_state.current_iteration["user_feedback_qa"],
docs=self.current_state.docs,
magic_words=magic_words,
next_solution_to_try=None,
)

for hunting_cycle in self.current_state.current_iteration.get("bug_hunting_cycles", []):
convo = convo.assistant(hunting_cycle["human_readable_instructions"]).template(
"log_data",
backend_logs=hunting_cycle["backend_logs"],
frontend_logs=hunting_cycle["frontend_logs"],
fix_attempted=hunting_cycle["fix_attempted"],
)

convo = self.generate_iteration_convo_so_far()
human_readable_instructions = await llm(convo, temperature=0.5)

convo = (
@@ -93,23 +93,13 @@ async def check_logs(self, logs_message: str = None):
llm = self.get_llm()
hunt_conclusion = await llm(convo, parser=JSONParser(HuntConclusionOptions), temperature=0)

self.next_state.current_iteration["description"] = human_readable_instructions
self.next_state.current_iteration["bug_hunting_cycles"] += [
{
"human_readable_instructions": human_readable_instructions,
"fix_attempted": any(
c["fix_attempted"] for c in self.current_state.current_iteration["bug_hunting_cycles"]
),
}
]

if hunt_conclusion.conclusion == magic_words.PROBLEM_IDENTIFIED:
# if no need for logs, implement iteration same as before
self.next_state.current_iteration["status"] = IterationStatus.AWAITING_BUG_FIX
self.set_data_for_next_hunting_cycle(human_readable_instructions, IterationStatus.AWAITING_BUG_FIX)
await self.send_message("The bug is found - I'm attempting to fix it.")
else:
# if logs are needed, add logging steps
self.next_state.current_iteration["status"] = IterationStatus.AWAITING_LOGGING
self.set_data_for_next_hunting_cycle(human_readable_instructions, IterationStatus.AWAITING_LOGGING)
await self.send_message("Adding more logs to identify the bug.")

self.next_state.flag_iterations_as_modified()
@@ -121,14 +111,22 @@ async def ask_user_to_test(self, awaiting_bug_reproduction: bool = False, awaiti
+ self.current_state.current_iteration["bug_reproduction_description"]
)

buttons = {}

last_iteration = self.current_state.iterations[-1] if len(self.current_state.iterations) >= 3 else None
if last_iteration:
buttons["start_pair_programming"] = "Start Pair Programming"

if self.current_state.run_command:
await self.ui.send_run_command(self.current_state.run_command)

if awaiting_user_test:
buttons["yes"] = "Yes, the issue is fixed"
buttons["no"] = "No"
user_feedback = await self.ask_question(
"Is the bug you reported fixed now?",
buttons={"yes": "Yes, the issue is fixed", "no": "No"},
default="continue",
buttons=buttons,
default="yes",
buttons_only=True,
hint="Instructions for testing:\n\n"
+ self.current_state.current_iteration["bug_reproduction_description"],
@@ -137,21 +135,31 @@ async def ask_user_to_test(self, awaiting_bug_reproduction: bool = False, awaiti

if user_feedback.button == "yes":
self.next_state.complete_iteration()
elif user_feedback.button == "start_pair_programming":
self.next_state.current_iteration["status"] = IterationStatus.START_PAIR_PROGRAMMING
# TODO: Leon check if this is needed
self.next_state.flag_iterations_as_modified()
else:
awaiting_bug_reproduction = True

if awaiting_bug_reproduction:
# TODO how can we get FE and BE logs automatically?
buttons["continue"] = "Continue"
buttons["done"] = "Bug is fixed"
backend_logs = await self.ask_question(
"Please do exactly what you did in the last iteration, paste **BACKEND** logs here and click CONTINUE.",
buttons={"continue": "Continue", "done": "Bug is fixed"},
buttons=buttons,
default="continue",
hint="Instructions for testing:\n\n"
+ self.current_state.current_iteration["bug_reproduction_description"],
)

if backend_logs.button == "done":
self.next_state.complete_iteration()
elif backend_logs.button == "start_pair_programming":
self.next_state.current_iteration["status"] = IterationStatus.START_PAIR_PROGRAMMING
# TODO: Leon check if this is needed
self.next_state.flag_iterations_as_modified()
else:
frontend_logs = await self.ask_question(
"Please paste **frontend** logs here and click CONTINUE.",
@@ -170,3 +178,151 @@ async def ask_user_to_test(self, awaiting_bug_reproduction: bool = False, awaiti
self.next_state.complete_iteration()

return AgentResponse.done(self)

async def start_pair_programming(self):
llm = self.get_llm()
convo = self.generate_iteration_convo_so_far(True)
convo.remove_last_x_messages(1)
convo = convo.template("problem_explanation")
await self.ui.start_important_stream()
initial_explanation = await llm(convo, temperature=0.5)

convo = convo.template("data_about_logs").require_schema(ImportantLogsForDebugging)

data_about_logs = await llm(convo, parser=JSONParser(ImportantLogsForDebugging), temperature=0.5)

await self.ui.send_data_about_logs(
{
"logs": [
{
"currentLog": d.currentOutput,
"expectedLog": d.expectedOutput,
"explanation": d.explanation,
"filePath": d.filePath,
"logCode": d.logCode,
"shouldBeDifferent": d.shouldBeDifferent,
}
for d in data_about_logs.logs
]
}
)

while True:
self.next_state.current_iteration["initial_explanation"] = initial_explanation
next_step = await self.ask_question(
"What do you want to do?",
buttons={
"question": "I have a question",
"done": "I fixed the bug myself",
"tell_me_more": "Tell me more about the bug",
"solution_hint": "I think I know where the problem is",
"other": "Other",
},
buttons_only=True,
default="continue",
hint="Instructions for testing:\n\n"
+ self.current_state.current_iteration["bug_reproduction_description"],
)

# TODO: remove when Leon checks
convo.remove_last_x_messages(2)

if len(convo.messages) > 10:
convo.trim(1, 2)

# TODO: in the future improve with a separate conversation that parses the user info and goes into an appropriate if statement
if next_step.button == "done":
self.next_state.complete_iteration()
break
elif next_step.button == "question":
user_response = await self.ask_question("Oh, cool, what would you like to know?")
convo = convo.template("ask_a_question", question=user_response.text)
await self.ui.start_important_stream()
llm_answer = await llm(convo, temperature=0.5)
await self.send_message(llm_answer)
elif next_step.button == "tell_me_more":
convo.template("tell_me_more")
await self.ui.start_important_stream()
response = await llm(convo, temperature=0.5)
await self.send_message(response)
elif next_step.button == "other":
                # same handling as "question"; we keep a separate "Other" option so users can tell us what the existing options are missing
user_response = await self.ask_question("Let me know what you think...")
convo = convo.template("ask_a_question", question=user_response.text)
await self.ui.start_important_stream()
llm_answer = await llm(convo, temperature=0.5)
await self.send_message(llm_answer)
elif next_step.button == "solution_hint":
human_hint_label = "Amazing!!! How do you think we can solve this bug?"
while True:
human_hint = await self.ask_question(human_hint_label)
convo = convo.template("instructions_from_human_hint", human_hint=human_hint.text)
await self.ui.start_important_stream()
llm = self.get_llm(CHECK_LOGS_AGENT_NAME)
human_readable_instructions = await llm(convo, temperature=0.5)
human_approval = await self.ask_question(
"Can I implement this solution?", buttons={"yes": "Yes", "no": "No"}, buttons_only=True
)
llm = self.get_llm()
if human_approval.button == "yes":
self.set_data_for_next_hunting_cycle(
human_readable_instructions, IterationStatus.AWAITING_BUG_FIX
)
self.next_state.flag_iterations_as_modified()
break
else:
human_hint_label = "Oh, my bad, what did I misunderstand?"
break
elif next_step.button == "tell_me_more":
convo.template("tell_me_more")
await self.ui.start_important_stream()
response = await llm(convo, temperature=0.5)
await self.send_message(response)
continue

        # TODO: send telemetry so we know what users mostly click here!
return AgentResponse.done(self)
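
For the telemetry TODO above, here is a minimal sketch of what the call could look like, mirroring the existing `await telemetry.trace_code_event(...)` usage in `core/agents/troubleshooter.py` below. The event name and payload keys are assumptions for illustration, not part of this PR; the call would go right after `ask_question` inside the loop:

# Hypothetical sketch for the telemetry TODO; event name and payload keys are invented.
await telemetry.trace_code_event(
    "pair-programming-choice",
    {
        "button": next_step.button,
        "task_index": self.current_state.tasks.index(self.current_state.current_task) + 1,
    },
)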

def generate_iteration_convo_so_far(self, omit_last_cycle=False):
convo = AgentConvo(self).template(
"iteration",
current_task=self.current_state.current_task,
user_feedback=self.current_state.current_iteration["user_feedback"],
user_feedback_qa=self.current_state.current_iteration["user_feedback_qa"],
docs=self.current_state.docs,
magic_words=magic_words,
next_solution_to_try=None,
)

hunting_cycles = self.current_state.current_iteration.get("bug_hunting_cycles", [])[
0 : (-1 if omit_last_cycle else None)
]

for hunting_cycle in hunting_cycles:
convo = convo.assistant(hunting_cycle["human_readable_instructions"]).template(
"log_data",
backend_logs=hunting_cycle.get("backend_logs"),
frontend_logs=hunting_cycle.get("frontend_logs"),
fix_attempted=hunting_cycle.get("fix_attempted"),
)

return convo

def set_data_for_next_hunting_cycle(self, human_readable_instructions, new_status):
self.next_state.current_iteration["description"] = human_readable_instructions
self.next_state.current_iteration["bug_hunting_cycles"] += [
{
"human_readable_instructions": human_readable_instructions,
"fix_attempted": any(
c["fix_attempted"] for c in self.current_state.current_iteration["bug_hunting_cycles"]
),
}
]

self.next_state.current_iteration["status"] = new_status

    async def continue_on(self, convo, button_value, user_response):
        # Note: `button_value` and `user_response` are currently unused here.
        llm = self.get_llm()
        convo = convo.template("continue_on")
        continue_on = await llm(convo, temperature=0.5)
        return continue_on
16 changes: 16 additions & 0 deletions core/agents/convo.py
@@ -88,6 +88,22 @@
child.prompt_log = deepcopy(self.prompt_log)
return child

    def trim(self, trim_index: int, trim_count: int) -> "AgentConvo":
        """
        Remove `trim_count` messages from the conversation, starting at index `trim_index`.

        :param trim_index: Index of the first message to remove.
        :param trim_count: Number of messages to remove.
        :return: The conversation instance.
        """
        self.messages = self.messages[:trim_index] + self.messages[trim_index + trim_count :]
        return self

    def remove_last_x_messages(self, count: int) -> "AgentConvo":
        """
        Remove the last `count` messages from the conversation.
        """
        # Guard against count == 0, where messages[:-0] would drop everything.
        if count > 0:
            self.messages = self.messages[:-count]
        return self
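
For clarity, a quick self-contained sanity check of the slicing semantics of the two helpers above, using a plain list as a stand-in for `self.messages` (a sketch for illustration, not part of this PR):

# Stand-in for AgentConvo.messages, to show the slice semantics.
messages = ["m0", "m1", "m2", "m3", "m4"]

# trim(1, 2): drop two messages starting at index 1.
trim_index, trim_count = 1, 2
assert messages[:trim_index] + messages[trim_index + trim_count :] == ["m0", "m3", "m4"]

# remove_last_x_messages(2): drop the last two messages.
count = 2
assert (messages[:-count] if count > 0 else messages) == ["m0", "m1", "m2"]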

def require_schema(self, model: BaseModel) -> "AgentConvo":
def remove_defs(d):
if isinstance(d, dict):
@@ -106,6 +122,6 @@
)
return self

    def remove_last_x_messages(self, x: int) -> "AgentConvo":

Check failure on line 125 in core/agents/convo.py (GitHub Actions / build, Ruff F811; reported identically on all six matrix jobs, Python 3.9 and 3.12 on ubuntu, macos, and windows):

core/agents/convo.py:125:9: F811 Redefinition of unused `remove_last_x_messages` from line 100

        self.messages = self.messages[:-x]
        return self
2 changes: 1 addition & 1 deletion core/agents/developer.py
@@ -119,7 +119,7 @@ async def breakdown_current_iteration(self, task_review_feedback: Optional[str]
source = "bug_hunt"
n_tasks = len(self.next_state.iterations)
log.debug(f"Breaking down the logging cycle {description}")
await self.send_message("Breaking down the current iteration logging cycle ...")
await self.send_message("Breaking down the current bug hunting cycle ...")
else:
iteration = self.current_state.current_iteration
current_task["task_review_feedback"] = None
3 changes: 3 additions & 0 deletions core/agents/orchestrator.py
@@ -233,6 +233,9 @@ def create_agent(self, prev_response: Optional[AgentResponse]) -> BaseAgent:
if current_iteration_status == IterationStatus.HUNTING_FOR_BUG:
# Triggering the bug hunter to start the hunt
return BugHunter(self.state_manager, self.ui)
elif current_iteration_status == IterationStatus.START_PAIR_PROGRAMMING:
# Pythagora cannot solve the issue so we're starting pair programming
return BugHunter(self.state_manager, self.ui)
elif current_iteration_status == IterationStatus.AWAITING_LOGGING:
# Get the developer to implement logs needed for debugging
return Developer(self.state_manager, self.ui)
8 changes: 4 additions & 4 deletions core/agents/troubleshooter.py
@@ -216,7 +216,7 @@ async def get_user_feedback(
If "is_loop" is True, Pythagora is stuck in a loop and needs to consider alternative solutions.

The last element in the tuple is the user feedback, which may be empty if the user provided no
feedback (eg. if they just clicked on "Continue" or "I'm stuck in a loop").
feedback (e.g. if they just clicked on "Continue" or "Start Pair Programming").
"""

bug_report = None
@@ -233,17 +233,17 @@

buttons = {"continue": "Everything works", "change": "I want to make a change", "bug": "There is an issue"}
if last_iteration:
buttons["loop"] = "I'm stuck in a loop"
buttons["start_pair_programming"] = "Start Pair Programming"

user_response = await self.ask_question(
test_message, buttons=buttons, default="continue", buttons_only=True, hint=hint
)
if user_response.button == "continue" or user_response.cancelled:
should_iterate = False

elif user_response.button == "loop":
elif user_response.button == "start_pair_programming":
await telemetry.trace_code_event(
"stuck-in-loop",
"pair-programming-started",
{
"clicked": True,
"task_index": self.current_state.tasks.index(self.current_state.current_task) + 1,
1 change: 1 addition & 0 deletions core/db/models/project_state.py
@@ -42,6 +42,7 @@ class IterationStatus:
FIND_SOLUTION = "find_solution"
PROBLEM_SOLVER = "problem_solver"
NEW_FEATURE_REQUESTED = "new_feature_requested"
START_PAIR_PROGRAMMING = "start_pair_programming"
DONE = "done"


4 changes: 4 additions & 0 deletions core/prompts/bug-hunter/ask_a_question.prompt
@@ -0,0 +1,4 @@
The developer wants to ask you a question. Here is the question:
{{question}}

Please answer with reference to all the files in the repository and everything we've talked about so far, but do not format your answer in any way that was asked for before; just answer the question as if you're talking to a colleague.
7 changes: 7 additions & 0 deletions core/prompts/bug-hunter/data_about_logs.prompt
@@ -0,0 +1,7 @@
Tell me the most important logs that are relevant for this issue. For each log, tell me the following:
1. the line in the code (e.g. `print(...)`, `console.log(...)`, etc.) that generated the log
2. the file the log is in (e.g. `index.js`, `routes/users.js`, etc. - make sure to put the entire path as listed above)
3. the current output of that log (make sure not to put the entire log output but a maximum of 5-10 lines of it)
4. the expected output of that log (also a maximum of 5-10 lines)
5. whether the log output should be different from the current output, or whether the current and expected outputs are the same
6. a brief explanation of why the output is incorrect and what should be different here (use a maximum of 2-3 sentences)
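
For reference, the Bug Hunter's `start_pair_programming` parses this answer with `JSONParser(ImportantLogsForDebugging)` (see `core/agents/bug_hunter.py` above), so the model's response reduces to data shaped roughly like the following sketch. All values are invented for illustration:

# Illustrative only: a payload that validates against the pydantic models
# defined in core/agents/bug_hunter.py (assumed importable here).
from core.agents.bug_hunter import ImportantLog, ImportantLogsForDebugging

example = ImportantLogsForDebugging(
    logs=[
        ImportantLog(
            logCode='console.log("user:", user)',
            filePath="routes/users.js",
            currentOutput="user: undefined",
            expectedOutput="user: { id: 1, name: 'Ada' }",
            shouldBeDifferent=True,
            explanation="The user lookup returns undefined, so the route renders an empty profile.",
        )
    ]
)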
6 changes: 6 additions & 0 deletions core/prompts/bug-hunter/instructions_from_human_hint.prompt
@@ -0,0 +1,6 @@
The human is sending you a hint about how to solve this bug. Here is what the human said:
```
{{ human_hint }}
```

Now, based on this hint, break down exactly what the problem is, what the solution to this problem is, and how we can implement this solution so that the bug is fixed.
4 changes: 4 additions & 0 deletions core/prompts/bug-hunter/problem_explanation.prompt
@@ -0,0 +1,4 @@
This also didn't help solve the issue, so we can conclude that you are unable to solve this problem yourself. I've brought in a human who will help you out.

First, focus on the problem you're facing and explain it to the human. Explain what the issue is that you're working on and what the human should try to do to solve this problem. Is there anything the human can look at that you don't have access to - a database, an API response, etc.? If so, specify exactly how the human can obtain this information. Keep the answer short and to the point.

1 change: 1 addition & 0 deletions core/prompts/bug-hunter/tell_me_more.prompt
@@ -0,0 +1 @@
Please tell me more about the problem we're working on. Don't repeat things you've said before; tell me something I don't know.