import json import re import subprocess from enum import Enum from typing import Callable, TypeVar from gpt_engineer.ai import AI from gpt_engineer.chat_to_files import to_files from gpt_engineer.db import DBs def setup_sys_prompt(dbs): return ( dbs.preprompts["generate"] + "\nUseful to know:\n" + dbs.preprompts["philosophy"] ) Step = TypeVar("Step", bound=Callable[[AI, DBs], list[dict]]) def simple_gen(ai: AI, dbs: DBs): """Run the AI on the main prompt and save the results""" messages = ai.start( setup_sys_prompt(dbs), dbs.input["main_prompt"], ) to_files(messages[-1]["content"], dbs.workspace) return messages def clarify(ai: AI, dbs: DBs): """ Ask the user if they want to clarify anything and save the results to the workspace """ messages = [ai.fsystem(dbs.preprompts["qa"])] user = dbs.input["main_prompt"] while True: messages = ai.next(messages, user) if messages[-1]["content"].strip().lower().startswith("no"): break print() user = input('(answer in text, or "c" to move on)\n') print() if not user or user == "c": break user += ( "\n\n" "Is anything else unclear? If yes, only answer in the form:\n" "{remaining unclear areas} remaining questions.\n" "{Next question}\n" 'If everything is sufficiently clear, only answer "no".' ) print() return messages def gen_spec(ai: AI, dbs: DBs): """ Generate a spec from the main prompt + clarifications and save the results to the workspace """ messages = [ ai.fsystem(setup_sys_prompt(dbs)), ai.fsystem(f"Instructions: {dbs.input['main_prompt']}"), ] messages = ai.next(messages, dbs.preprompts["spec"]) dbs.memory["specification"] = messages[-1]["content"] return messages def respec(ai: AI, dbs: DBs): messages = json.loads(dbs.logs[gen_spec.__name__]) messages += [ai.fsystem(dbs.preprompts["respec"])] messages = ai.next(messages) messages = ai.next( messages, ( "Based on the conversation so far, please reiterate the specification for " "the program. " "If there are things that can be improved, please incorporate the " "improvements. " "If you are satisfied with the specification, just write out the " "specification word by word again." ), ) dbs.memory["specification"] = messages[-1]["content"] return messages def gen_unit_tests(ai: AI, dbs: DBs): """ Generate unit tests based on the specification, that should work. """ messages = [ ai.fsystem(setup_sys_prompt(dbs)), ai.fuser(f"Instructions: {dbs.input['main_prompt']}"), ai.fuser(f"Specification:\n\n{dbs.memory['specification']}"), ] messages = ai.next(messages, dbs.preprompts["unit_tests"]) dbs.memory["unit_tests"] = messages[-1]["content"] to_files(dbs.memory["unit_tests"], dbs.workspace) return messages def gen_clarified_code(ai: AI, dbs: DBs): # get the messages from previous step messages = json.loads(dbs.logs[clarify.__name__]) messages = [ ai.fsystem(setup_sys_prompt(dbs)), ] + messages[1:] messages = ai.next(messages, dbs.preprompts["use_qa"]) to_files(messages[-1]["content"], dbs.workspace) return messages def gen_code(ai: AI, dbs: DBs): # get the messages from previous step messages = [ ai.fsystem(setup_sys_prompt(dbs)), ai.fuser(f"Instructions: {dbs.input['main_prompt']}"), ai.fuser(f"Specification:\n\n{dbs.memory['specification']}"), ai.fuser(f"Unit tests:\n\n{dbs.memory['unit_tests']}"), ] messages = ai.next(messages, dbs.preprompts["use_qa"]) to_files(messages[-1]["content"], dbs.workspace) return messages def execute_entrypoint(ai, dbs): command = dbs.workspace["run.sh"] print("Do you want to execute this code?") print() print(command) print() print('If yes, press enter. Otherwise, type "no"') print() if input() not in ["", "y", "yes"]: print("Ok, not executing the code.") return [] print("Executing the code...") print( "\033[92m" # green color + "Note: If it does not work as expected, please consider running the code'" + " in another way than above." + "\033[0m" ) print() subprocess.run("bash run.sh", shell=True, cwd=dbs.workspace.path) return [] def gen_entrypoint(ai, dbs): messages = ai.start( system=( "You will get information about a codebase that is currently on disk in " "the current folder.\n" "From this you will answer with code blocks that includes all the necessary " "unix terminal commands to " "a) install dependencies " "b) run all necessary parts of the codebase (in parallell if necessary).\n" "Do not install globally. Do not use sudo.\n" "Do not explain the code, just give the commands.\n" "Do not use placeholders, use example values (like . for a folder argument) " "if necessary.\n" ), user="Information about the codebase:\n\n" + dbs.workspace["all_output.txt"], ) print() regex = r"```\S*\n(.+?)```" matches = re.finditer(regex, messages[-1]["content"], re.DOTALL) dbs.workspace["run.sh"] = "\n".join(match.group(1) for match in matches) return messages def use_feedback(ai: AI, dbs: DBs): messages = [ ai.fsystem(setup_sys_prompt(dbs)), ai.fuser(f"Instructions: {dbs.input['main_prompt']}"), ai.fassistant(dbs.workspace["all_output.txt"]), ai.fsystem(dbs.preprompts["use_feedback"]), ] messages = ai.next(messages, dbs.input["feedback"]) to_files(messages[-1]["content"], dbs.workspace) return messages def fix_code(ai: AI, dbs: DBs): code_output = json.loads(dbs.logs[gen_code.__name__])[-1]["content"] messages = [ ai.fsystem(setup_sys_prompt(dbs)), ai.fuser(f"Instructions: {dbs.input['main_prompt']}"), ai.fuser(code_output), ai.fsystem(dbs.preprompts["fix_code"]), ] messages = ai.next(messages, "Please fix any errors in the code above.") to_files(messages[-1]["content"], dbs.workspace) return messages class Config(str, Enum): DEFAULT = "default" BENCHMARK = "benchmark" SIMPLE = "simple" TDD = "tdd" TDD_PLUS = "tdd+" CLARIFY = "clarify" RESPEC = "respec" EXECUTE_ONLY = "execute_only" USE_FEEDBACK = "use_feedback" # Different configs of what steps to run STEPS = { Config.DEFAULT: [ clarify, gen_clarified_code, gen_entrypoint, execute_entrypoint, ], Config.BENCHMARK: [simple_gen, gen_entrypoint], Config.SIMPLE: [simple_gen, gen_entrypoint, execute_entrypoint], Config.TDD: [ gen_spec, gen_unit_tests, gen_code, gen_entrypoint, execute_entrypoint, ], Config.TDD_PLUS: [ gen_spec, gen_unit_tests, gen_code, fix_code, gen_entrypoint, execute_entrypoint, ], Config.CLARIFY: [ clarify, gen_clarified_code, gen_entrypoint, execute_entrypoint, ], Config.RESPEC: [ gen_spec, respec, gen_unit_tests, gen_code, fix_code, gen_entrypoint, execute_entrypoint, ], Config.USE_FEEDBACK: [use_feedback, gen_entrypoint, execute_entrypoint], Config.EXECUTE_ONLY: [gen_entrypoint, execute_entrypoint], } # Future steps that can be added: # run_tests_and_fix_files # execute_entrypoint_and_fix_files_if_needed