Merge pull request Pythagora-io#775 from Pythagora-io/development

LeonOstrez · web-flow · commit 06a21b916757 · 2024-03-21T15:36:01.000-07:00
Development
diff --git a/pilot/.env.example b/pilot/.env.example
@@ -10,10 +10,12 @@ AZURE_ENDPOINT=
 
 OPENROUTER_API_KEY=
 
+# Set this to use Anthropic API directly
+# If using via OpenRouter, OPENROUTER_API_KEY should be set instead
 ANTHROPIC_API_KEY=
 
 # You only need to set this if not using Anthropic API directly (eg. via proxy or AWS Bedrock)
-ANTHROPIC_ENDPOINT=
+# ANTHROPIC_ENDPOINT=
 
 # In case of Azure/OpenRouter endpoint, change this to your deployed model name
 MODEL_NAME=gpt-4-turbo-preview
diff --git a/pilot/const/function_calls.py b/pilot/const/function_calls.py
@@ -496,7 +496,7 @@ def command_definition(description_command='A single command that needs to be ex
                             "decision": {
                                 "type": "string",
                                 "enum": ["apply", "ignore", "rework"],
-                                "description": "Whether to apply this hunk (if it's a valid change with no problems), rework (a valid change but does something incorrectly), or ignore it (unwanted change)."
+                                "description": "Whether to apply this hunk, rework, or ignore it."
                             }
                         },
                         "required": ["number", "reason", "decision"],
diff --git a/pilot/helpers/agents/CodeMonkey.py b/pilot/helpers/agents/CodeMonkey.py
@@ -19,7 +19,7 @@
 # Regular expression pattern for matching hunk headers
 PATCH_HEADER_PATTERN = re.compile(r"^@@ -(\d+),?(\d+)? \+(\d+),?(\d+)? @@")
 
-MAX_REVIEW_RETRIES = 3
+MAX_REVIEW_RETRIES = 2
 
 class CodeMonkey(Agent):
     save_dev_steps = True
@@ -80,6 +80,8 @@ def implement_code_changes(
         :param convo: conversation to continue (must contain file coding/modification instructions)
         :param step: information about the step being implemented
         """
+        previous_temperature = convo.temperature
+        convo.temperature = 0.0
         code_change_description = step.get('code_change_description')
 
         files = self.project.get_all_coded_files()
@@ -121,6 +123,7 @@ def implement_code_changes(
             })
             if content:
                 content = self.remove_backticks(content)
+            convo.remove_last_x_messages(2)
 
         # If we have changes, update the file
         if content and content != file_content:
@@ -133,6 +136,7 @@ def implement_code_changes(
                 'content': content,
             })
 
+        convo.temperature = previous_temperature
         return convo
 
     def replace_complete_file(
@@ -157,10 +161,15 @@ def replace_complete_file(
 
         Note: if even this fails for any reason, the original content is returned instead.
         """
+        prev_message = convo.messages[-1]['content']
+        prev_message_prefix = " ".join(prev_message.split()[:5])
+        prev_message_postfix = " ".join(prev_message.split()[-5:])
         llm_response = convo.send_message('development/implement_changes.prompt', {
             "file_content": file_content,
             "file_name": file_name,
             "files": files,
+            "prev_message_prefix": prev_message_prefix,
+            "prev_message_postfix": prev_message_postfix,
         })
         convo.remove_last_x_messages(2)
         return self.remove_backticks(llm_response)
diff --git a/pilot/prompts/development/implement_changes.prompt b/pilot/prompts/development/implement_changes.prompt
@@ -3,17 +3,33 @@ I need to modify file `{{ file_name }}` that currently looks like this:
 {{ file_content }}
 ```
 
-I want you to implement changes described in previous message and show me the COMPLETE NEW VERSION of this file in this format:
+**IMPORTANT**
+I want you to implement the changes described in the previous message, which starts with `{{ prev_message_prefix }}` and ends with `{{ prev_message_postfix }}`. Make sure you don't make any mistakes, especially ones that could affect the rest of the project. Your changes will be reviewed by a very detailed reviewer. Because of that, it is extremely important that you STRICTLY follow ALL of the following rules while implementing the changes:
+
+**IMPORTANT** Output format
+You must output the COMPLETE NEW VERSION of this file in the following format:
 -----------------------format----------------------------
 ```
 the full contents of the updated file, without skipping over any content
 ```
 ------------------------end_of_format---------------------------
 
-**IMPORTANT**:If the instructions have comments like `// ..add code here...` or `# placeholder for code`, instead of copying the comment, interpret the instructions and output the relevant code.
+**IMPORTANT** Comprehensive Codebase Insight
+It's crucial to grasp the full scope of the codebase related to your tasks to avert mistakes. Check the initial conversation message for a list of files. Pay a lot of attention to files that are directly included in the file you are currently modifying or that are importing your file.
+Consider these examples to guide your approach and thought process:
+-----------------------start_of_examples----------------------------
+- UI components or templates: Instead of placing scripts directly on specific pages, integrating them in the <head> section or as reusable partials enhances application-wide consistency and reusability.
+- Database operations: Be careful not to execute an action, like password hashing, both in a routing function and a model's pre('save') hook, which could lead to redundancy and errors.
+- Adding backend logic: Prior to creating new functions, verify if an equivalent function exists in the codebase that you could import and use, preventing unnecessary code duplication and keeping the project efficient.
+-----------------------end_of_examples----------------------------
+
+**IMPORTANT** Coding principles
+Write high-quality code: first, organize it logically, with clear, meaningful names for variables, functions, and classes. Aim for simplicity and adhere to the DRY (Don't Repeat Yourself) principle to avoid code duplication. Ensure your codebase is structured and modular for easy navigation and updates.
+
+**IMPORTANT** If the instructions have comments like `// ..add code here...` or `# placeholder for code`, instead of copying the comment, interpret the instructions and output the relevant code.
 
-**IMPORTANT**: Your reply MUST NOT omit any code in the new implementation or substitute anything with comments like `// .. rest of the code goes here ..` or `# insert existing code here`, because I will overwrite the existing file with the content you provide. Output ONLY the content for this file, without additional explanation, suggestions or notes. Your output MUST start with ``` and MUST end with ``` and include only the complete file contents.
+**IMPORTANT** Your reply MUST NOT omit any code in the new implementation or substitute anything with comments like `// .. rest of the code goes here ..` or `# insert existing code here`, because I will overwrite the existing file with the content you provide. Output ONLY the content for this file, without additional explanation, suggestions or notes. Your output MUST start with ``` and MUST end with ``` and include only the complete file contents.
 
-**IMPORTANT**: For hardcoded configuration values that the user needs to change, mark the line that needs user configuration with `INPUT_REQUIRED {config_description}` comment,  where `config_description` is a description of the value that needs to be set by the user. Use appropriate syntax for comments in the file you're saving (for example `// INPUT_REQUIRED {config_description}` in JavaScript). NEVER ask the user to write code or provide implementation, even if the instructions suggest it! If the file type doesn't support comments (eg JSON), don't add any.
+**IMPORTANT** For hardcoded configuration values that the user needs to change, mark the line that needs user configuration with `INPUT_REQUIRED {config_description}` comment,  where `config_description` is a description of the value that needs to be set by the user. Use appropriate syntax for comments in the file you're saving (for example `// INPUT_REQUIRED {config_description}` in JavaScript). NEVER ask the user to write code or provide implementation, even if the instructions suggest it! If the file type doesn't support comments (eg JSON), don't add any.
 
 {{ logs_and_error_handling }}
diff --git a/pilot/prompts/development/review_changes.prompt b/pilot/prompts/development/review_changes.prompt
@@ -15,42 +15,15 @@ Here is the diff of the changes:
 
 As you can see, there {% if hunks|length == 1 %}is only one hunk in this diff, and it{% else %}are {{hunks|length}} hunks in this diff, and each{% endif %} starts with the `@@` header line.
 
-Think carefully about the instructions and review the proposed changes. For each hunk of change, provide a detailed rationale, and decide whether it should be:
-* applied - if the change is correct
-* ignored - for example if it is a code deletion or change that wasn't asked for
-* reworked - if the change does something correctly but also makes a serious mistake, in which case both applying and ignoring the entire hunk would be incorrect
+When reviewing the code changes, apply these principles to decide on each hunk:
+- Apply: Approve and integrate the hunk into our core codebase if it accurately delivers the intended functionality or enhancement, aligning with our project objectives. This action confirms the change is beneficial and meets our quality standards.
+- Ignore: Use this option sparingly, only when you're certain the entire hunk is incorrect or will introduce errors (logical, syntax, etc.) that could negatively impact the project. Ignoring means the hunk will be completely removed. This should be reserved for cases where the inclusion of the code is definitively more harmful than its absence. Emphasize careful consideration before choosing 'Ignore.' It's crucial for situations where the hunk's removal is the only option to prevent significant issues. Otherwise, 'Rework' might be the better choice to ensure the code's integrity and functionality.
+- Rework: Suggest this option if the concept behind the change is valid and necessary but is implemented in a way that introduces problems. This indicates a need for a revision of the hunk to refine its integration without fully discarding the underlying idea.
 
-Finally, if the changes miss something that was in the instructions, mention that. Keep in mind you're just reviewing one file, `{{ file_name }}`. You don't need to consider if other files are created, dependent packages installed, etc. Focus only on reviewing the changes in this file based on the instructions in the previous message.
+When deciding what should be done with the hunk you are currently reviewing, pick an option that most reviewers of your skill would choose. Your decisions have to be consistent.
 
-Note that the developer may add, modify or delete logging (including `gpt_pilot_debugging_log`) or error handling that's not explicitly asked for, but is a part of good development practice. Unless these logging and error handling additions break something, your decision to apply, ignore or rework the hunk should not be based on this. Base your decision only on functional changes - comments or logging are less important. Importantly, don't ask for a rework just because of logging or error handling changes. Also, take into account this is a junior developer and while the approach they take may not be the best practice, if it's not *wrong*, let it pass. Ask for rework only if the change is clearly bad and would break something.
+Keep in mind you're just reviewing the current file. You don't need to consider if other files are created, dependent packages installed, etc. Focus only on reviewing the changes in this file based on the instructions in the previous message.
 
-Here is an example output if 2 of 4 hunks in the change should be applied, one of them should be ignored, one should be reworked, and no other changes are needed:
-```
-{
-    "hunks": [
-        {
-            "number": 1,
-            "reason": "Some explanation why this part of the change is important. The reasoning here should be as detailed as possible as that will help you reach the correct conclusion.",
-            "decision": "apply"
-        },
-        {
-            "number": 2,
-            "reason": "Another explanation, for the 2nd hunk",
-            "decision": "apply"
-        },
-        {
-            "number": 3,
-            "reason": "This hunk accidentally deletes important code without any useful change",
-            "decision": "ignore"
-        },
-        {
-            "number": 4,
-            "reason": "This hunk does something correctly but also does something really wrong. It would be incorrect to either apply or ignore it fully, so it should be reworked.",
-            "decision": "rework"
-        },
-    ],
-    "review_notes": "General review notes, if something is missing from the change you can comment about it here"
-}
-```
+Note that the developer may add, modify or delete logging (including `gpt_pilot_debugging_log`) or error handling that's not explicitly asked for, but is a part of good development practice. Unless these logging and error handling additions break something, your decision to apply, ignore or rework the hunk should not be based on this. Base your decision only on functional changes - comments or logging are less important. Importantly, don't ask for a rework just because of logging or error handling changes. Also, take into account this is a junior developer and while the approach they take may not be the best practice, if it's not *wrong*, let it pass. Ask for rework only if the change is clearly bad and would break something.
 
-IMPORTANT: The developer that wrote this is sloppy and has probably deleted some parts of the code that should not be deleted. Pay special attention to that in your review!
+The developer that wrote this is sometimes sloppy and could have deleted some parts of the code that contain important functionality and should not be deleted. Pay special attention to that in your review.
diff --git a/pilot/prompts/development/review_feedback.prompt b/pilot/prompts/development/review_feedback.prompt
@@ -1,6 +1,6 @@
 Your changes have been reviewed.
 {% if content != original_content %}
-THe reviewer approved and applied some of your changes, but requested you rework the others.
+The reviewer approved and applied some of your changes, but requested you rework the others.
 
 Here's the file with the approved changes already applied:
 ```
diff --git a/pilot/utils/llm_connection.py b/pilot/utils/llm_connection.py
@@ -140,7 +140,7 @@ def create_gpt_chat_completion(messages: List[dict], req_type, project,
         model_provider = 'openai'
 
     try:
-        if model_provider == 'anthropic':
+        if model_provider == 'anthropic' and os.getenv('ENDPOINT') != 'OPENROUTER':
             if not os.getenv('ANTHROPIC_API_KEY'):
                 os.environ['ANTHROPIC_API_KEY'] = os.getenv('OPENAI_API_KEY')
             response = stream_anthropic(messages, function_call_message, gpt_data, model_name)
@@ -486,14 +486,14 @@ def return_result(result_data, lines_printed):
             try:
                 json_line = json.loads(line)
 
-                if len(json_line['choices']) == 0:
-                    continue
-
                 if 'error' in json_line:
                     logger.error(f'Error in LLM response: {json_line}')
                     telemetry.record_llm_request(token_count, time.time() - request_start_time, is_error=True)
                     raise ValueError(f'Error in LLM response: {json_line["error"]["message"]}')
 
+                if 'choices' not in json_line or len(json_line['choices']) == 0:
+                    continue
+
                 choice = json_line['choices'][0]
 
                 # if 'finish_reason' in choice and choice['finish_reason'] == 'function_call':
@@ -609,7 +609,7 @@ def stream_anthropic(messages, function_call_message, gpt_data, model_name = "cl
         raise RuntimeError("The 'anthropic' package is required to use the Anthropic Claude LLM.") from err
 
     client = anthropic.Anthropic(
-        base_url=os.getenv('ANTHROPIC_ENDPOINT'),
+        base_url=os.getenv('ANTHROPIC_ENDPOINT') or None,
     )
 
     claude_system = "You are a software development AI assistant."

Original file line number	Diff line number	Diff line change
`@@ -496,7 +496,7 @@ def command_definition(description_command='A single command that needs to be ex`
`496`	`496`	`"decision": {`
`497`	`497`	`"type": "string",`
`498`	`498`	`"enum": ["apply", "ignore", "rework"],`
`499`		`- "description": "Whether to apply this hunk (if it's a valid change with no problems), rework (a valid change but does something incorrectly), or ignore it (unwanted change)."`
	`499`	`+ "description": "Whether to apply this hunk, rework, or ignore it."`
`500`	`500`	`}`
`501`	`501`	`},`
`502`	`502`	`"required": ["number", "reason", "decision"],`