Merge pull request #35 from nervousapps/patch-1

Add VALIDATE_JSON_RETRY environment variable, and tests
clean-reqs
biobootloader 2023-04-26 17:26:43 -07:00 zatwierdzone przez GitHub
commit 756ddbdd61
Nie znaleziono w bazie danych klucza dla tego podpisu
ID klucza GPG: 4AEE18F83AFDEB23
7 zmienionych plików z 151 dodań i 56 usunięć

Wyświetl plik

@ -37,6 +37,13 @@ You can also use flag `--confirm=True` which will ask you `yes or no` before mak
python -m wolverine examples/buggy_script.py "subtract" 20 3 --confirm=True python -m wolverine examples/buggy_script.py "subtract" 20 3 --confirm=True
## :label: Environment variables
| env name | description | default value |
| -------------------------------| ----------------| -------------------|
| OPENAI_API_KEY | OpenAI API key | None |
| DEFAULT_MODEL | GPT model to use | "gpt-4" |
| VALIDATE_JSON_RETRY | Number of retries when requesting OpenAI API (-1 means unlimited) | -1 |
## Future Plans ## Future Plans
This is just a quick prototype I threw together in a few hours. There are many possible extensions and contributions are welcome: This is just a quick prototype I threw together in a few hours. There are many possible extensions and contributions are welcome:

Wyświetl plik

@ -14,3 +14,5 @@ example response:
{"operation": "Replace", "line": 18, "content": " x += 1"}, {"operation": "Replace", "line": 18, "content": " x += 1"},
{"operation": "Delete", "line": 20, "content": ""} {"operation": "Delete", "line": 20, "content": ""}
] ]
From now on, your response must be only the json object, no talking, no comments.

31
tests/conftest.py 100644
Wyświetl plik

@ -0,0 +1,31 @@
"""
Conftest
"""
import os
import pytest
import tempfile
TEST_FILES_DIR = os.path.join(os.path.dirname(__file__), "test_files")
@pytest.fixture(scope='function')
def temp_file():
    """Provide the path of a disposable file holding three known lines.

    The file is written up front, its path handed to the test, and the
    file removed again during fixture teardown.
    """
    tmp = tempfile.NamedTemporaryFile(mode="w", delete=False)
    with tmp as handle:
        handle.write("first line\nsecond line\nthird line")
    path = tmp.name
    yield path
    # Teardown: drop the scratch file created above.
    os.remove(path)
def mock_open_ai_response_object(mocker, content: str):
    """
    Build a stand-in for an openai ChatCompletion response.

    ``mocker`` only needs to expose ``MagicMock``; the returned object
    mimics ``response.choices[0].message.content`` == ``content``.
    """
    message = mocker.MagicMock()
    # Dotted name sets the nested ``message.content`` attribute in one call.
    message.configure_mock(**{"message.content": content})
    wrapper = mocker.MagicMock()
    wrapper.configure_mock(**{"choices": [message]})
    return wrapper

Wyświetl plik

@ -0,0 +1,8 @@
Explanation: The function `subtract_numbers` is never defined in the script, causing a `NameError` when it is called in the `calculate` function.
[
{"explanation": "The 'subtract_numbers' function is never defined in the script."},
{"operation": "InsertAfter", "line": 12, "content": "\n# Define subtract_numbers function\ndef subtract_numbers(a, b):\n return a - b\n"},
{"operation": "Replace", "line": 18, "content": " if operation == \"add\":\n result = add_numbers(num1, num2)\n elif operation == \"subtract\":\n result = subtract_numbers(num1, num2)\n elif operation == \"multiply\":\n result = multiply_numbers(num1, num2)\n elif operation == \"divide\":\n result = divide_numbers(num1, num2)\n else:\n print(\"Invalid operation\")\n"},
{"operation": "Replace", "line": 30, "content": " return result\n"}
]

Wyświetl plik

@ -0,0 +1,7 @@
Explanation: The function `subtract_numbers` is never defined in the script, causing a `NameError` when it is called in the `calculate` function.
[
{"explanation": "The 'subtract_numbers' function is never defined in the script."},
{"operation": "InsertAfter", "line": 12, "content": "\n# Define subtract_numbers function\ndef subtract_numbers(a, b):\n return a - b\n"},
{"operation": "Replace", "line": 18, "content": " if operation == \"add\":\n result = add_numbers(num1, num2)\n elif operation == \"subtract\":\n result = subtract_numbers(num1, num2)\n elif operation == \"multiply\":\n result = multiply_numbers(num1, num2)\n elif operation == \"divide\":\n result = divide_numbers(num1, num2)\n else:\n print(\"Invalid operation\")\n"},
{"operation": "Replace", "line": 30, "content": " return result\n"}

Wyświetl plik

@ -1,18 +1,12 @@
import os import os
import pytest import pytest
import tempfile import tempfile
from wolverine import apply_changes from wolverine import apply_changes, json_validated_response
from .conftest import (
@pytest.fixture(scope='function') mock_open_ai_response_object,
def temp_file(): TEST_FILES_DIR
# Create a temporary file )
with tempfile.NamedTemporaryFile(mode="w", delete=False) as f:
f.write("first line\nsecond line\nthird line")
file_path = f.name
yield file_path
# Clean up the temporary file
os.remove(file_path)
def test_apply_changes_replace(temp_file): def test_apply_changes_replace(temp_file):
@ -53,3 +47,40 @@ def test_apply_changes_insert(temp_file):
content = f.read() content = f.read()
assert content == 'first line\nsecond line\ninserted line\nthird line' assert content == 'first line\nsecond line\ninserted line\nthird line'
@pytest.mark.parametrize("chat_completion_response, nb_retry, fail", [
    (os.path.join(TEST_FILES_DIR, "cc_resp.txt"), 3, False),
    (os.path.join(TEST_FILES_DIR, "cc_resp_fail.txt"), 3, True),
    (os.path.join(TEST_FILES_DIR, "cc_resp_fail.txt"), 10, True),
])
def test_json_validated_response(mocker, chat_completion_response, nb_retry, fail):
    """json_validated_response parses a valid payload, or raises after nb_retry tries."""
    # Load the canned ChatCompletion payload for this case.
    with open(chat_completion_response, 'r') as file:
        response = file.read()
    # Mock the openAI chat completion API call
    mocker.patch(
        "openai.ChatCompletion.create",
        return_value=mock_open_ai_response_object(mocker=mocker, content=response))
    messages = [
        {
            "role": "user",
            "content": "prompt"
        }
    ]
    # ChatCompletion returned an invalid response
    if fail:
        with pytest.raises(Exception) as err:
            json_validated_response("gpt-4", messages, nb_retry=nb_retry)
        # BUG FIX: the previous assert compared the Exception *object* against a
        # string (always False, so this test could never pass) and hard-coded
        # "3 tries" although nb_retry is parametrized as 3 and 10. Check the
        # exception message text instead.
        assert "No valid json response found" in str(err.value)
    else:
        json_response = json_validated_response("gpt-4", messages, nb_retry=nb_retry)
        assert json_response

Wyświetl plik

@ -6,6 +6,9 @@ import subprocess
import sys import sys
import openai import openai
from typing import List, Dict
from termcolor import cprint
from dotenv import load_dotenv from dotenv import load_dotenv
from termcolor import cprint from termcolor import cprint
@ -13,14 +16,18 @@ from termcolor import cprint
load_dotenv() load_dotenv()
openai.api_key = os.getenv("OPENAI_API_KEY") openai.api_key = os.getenv("OPENAI_API_KEY")
# Default model is GPT-4
DEFAULT_MODEL = os.environ.get("DEFAULT_MODEL", "gpt-4") DEFAULT_MODEL = os.environ.get("DEFAULT_MODEL", "gpt-4")
# Nb retries for json_validated_response, default to -1, infinite
VALIDATE_JSON_RETRY = int(os.getenv("VALIDATE_JSON_RETRY", -1))
with open("prompt.txt", encoding="utf-8") as file: # Read the system prompt
SYSTEM_PROMPT = file.read() with open(os.path.join(os.path.dirname(__file__), "..", "prompt.txt"), 'r') as f:
SYSTEM_PROMPT = f.read()
def run_script(script_name, script_args): def run_script(script_name: str, script_args: List) -> str:
""" """
If script_name.endswith(".py") then run with python If script_name.endswith(".py") then run with python
else run with node else run with node
@ -42,53 +49,55 @@ def run_script(script_name, script_args):
return result.decode("utf-8"), 0 return result.decode("utf-8"), 0
def json_validated_response(model, messages): def json_validated_response(model: str, messages: List[Dict], nb_retry: int = VALIDATE_JSON_RETRY) -> Dict:
""" """
This function is needed because the API can return a non-json response. This function is needed because the API can return a non-json response.
This will run recursively until a valid json response is returned. This will run recursively VALIDATE_JSON_RETRY times.
todo: might want to stop after a certain number of retries If VALIDATE_JSON_RETRY is -1, it will run recursively until a valid json response is returned.
""" """
response = openai.ChatCompletion.create( json_response = {}
model=model, if nb_retry != 0:
messages=messages, response = openai.ChatCompletion.create(
temperature=0.5, model=model,
) messages=messages,
messages.append(response.choices[0].message) temperature=0.5,
content = response.choices[0].message.content
# see if json can be parsed
try:
json_start_index = content.index(
"["
) # find the starting position of the JSON data
json_data = content[
json_start_index:
] # extract the JSON data from the response string
json_response = json.loads(json_data)
except (json.decoder.JSONDecodeError, ValueError) as error:
cprint(f"{error}. Re-running the query.", "red")
# debug
cprint(f"\nGPT RESPONSE:\n\n{content}\n\n", "yellow")
# append a user message that says the json is invalid
messages.append(
{
"role": "user",
"content": (
"Your response could not be parsed by json.loads. "
"Please restate your last message as pure JSON."
),
}
) )
# rerun the api call messages.append(response.choices[0].message)
return json_validated_response(model, messages) content = response.choices[0].message.content
except Exception as error: # see if json can be parsed
cprint(f"Unknown error: {error}", "red") try:
cprint(f"\nGPT RESPONSE:\n\n{content}\n\n", "yellow") json_start_index = content.index(
raise error "["
return json_response ) # find the starting position of the JSON data
json_data = content[
json_start_index:
] # extract the JSON data from the response string
json_response = json.loads(json_data)
return json_response
except (json.decoder.JSONDecodeError, ValueError) as e:
cprint(f"{e}. Re-running the query.", "red")
# debug
cprint(f"\nGPT RESPONSE:\n\n{content}\n\n", "yellow")
# append a user message that says the json is invalid
messages.append(
{
"role": "user",
"content": "Your response could not be parsed by json.loads. Please restate your last message as pure JSON.",
}
)
# dec nb_retry
nb_retry-=1
# rerun the api call
return json_validated_response(model, messages, nb_retry)
except Exception as e:
cprint(f"Unknown error: {e}", "red")
cprint(f"\nGPT RESPONSE:\n\n{content}\n\n", "yellow")
raise e
raise Exception(f"No valid json response found after {VALIDATE_JSON_RETRY} tries. Exiting.")
def send_error_to_gpt(file_path, args, error_message, model=DEFAULT_MODEL): def send_error_to_gpt(file_path: str, args: List, error_message: str, model: str = DEFAULT_MODEL) -> Dict:
with open(file_path) as f: with open(file_path, "r") as f:
file_lines = f.readlines() file_lines = f.readlines()
file_with_lines = [] file_with_lines = []
@ -122,7 +131,7 @@ def send_error_to_gpt(file_path, args, error_message, model=DEFAULT_MODEL):
return json_validated_response(model, messages) return json_validated_response(model, messages)
def apply_changes(file_path, changes: list, confirm=False): def apply_changes(file_path: str, changes: List, confirm: bool = False):
""" """
Pass changes as loaded json (list of dicts) Pass changes as loaded json (list of dicts)
""" """