diff --git a/gpt_engineer/chat_to_files.py b/gpt_engineer/chat_to_files.py
deleted file mode 100644
index ca8d6766ff..0000000000
--- a/gpt_engineer/chat_to_files.py
+++ /dev/null
@@ -1,163 +0,0 @@
-import os
-import re
-
-from typing import List, Tuple
-
-
-def parse_chat(chat) -> List[Tuple[str, str]]:
-    """
-    Extracts all code blocks from a chat and returns them
-    as a list of (filename, codeblock) tuples.
-
-    Parameters
-    ----------
-    chat : str
-        The chat to extract code blocks from.
-
-    Returns
-    -------
-    List[Tuple[str, str]]
-        A list of tuples, where each tuple contains a filename and a code block.
-    """
-    # Get all ``` blocks and preceding filenames
-    regex = r"(\S+)\n\s*```[^\n]*\n(.+?)```"
-    matches = re.finditer(regex, chat, re.DOTALL)
-
-    files = []
-    for match in matches:
-        # Strip the filename of any non-allowed characters and convert / to \
-        path = re.sub(r'[\:<>"|?*]', "", match.group(1))
-
-        # Remove leading and trailing brackets
-        path = re.sub(r"^\[(.*)\]$", r"\1", path)
-
-        # Remove leading and trailing backticks
-        path = re.sub(r"^`(.*)`$", r"\1", path)
-
-        # Remove trailing ]
-        path = re.sub(r"[\]\:]$", "", path)
-
-        # Get the code
-        code = match.group(2)
-
-        # Add the file to the list
-        files.append((path, code))
-
-    # Get all the text before the first ``` block
-    readme = chat.split("```")[0]
-    files.append(("LAST_MODIFICATION_README.md", readme))
-
-    # Return the files
-    return files
-
-
-def to_files(chat, workspace):
-    """
-    Parse the chat and add all extracted files to the workspace.
-
-    Parameters
-    ----------
-    chat : str
-        The chat to parse.
-    workspace : dict
-        The workspace to add the files to.
-    """
-    workspace["all_output.txt"] = chat
-
-    files = parse_chat(chat)
-    for file_name, file_content in files:
-        workspace[file_name] = file_content
-
-
-def to_files_(chat, dbs):
-    """
-    Parse the chat and add all extracted files to the workspace.
-
-    Parameters
-    ----------
-    chat : str
-        The chat to parse.
-    workspace : dict
-        The workspace to add the files to.
-    """
-    dbs.project_metadata["all_output.txt"] = chat
-
-    files = parse_chat(chat)
-    for file_name, file_content in files:
-        dbs.workspace[file_name] = file_content
-
-
-def overwrite_files(chat, dbs):
-    """
-    Replace the AI files with the older local files.
-
-    Parameters
-    ----------
-    chat : str
-        The chat containing the AI files.
-    dbs : DBs
-        The database containing the workspace.
-    replace_files : dict
-        A dictionary mapping file names to file paths of the local files.
-    """
-    dbs.project_metadata[
-        "all_output.txt"
-    ] = chat  # files_info = get_code_strings(dbs.project_metadata)
-
-    files = parse_chat(chat)
-    for file_name, file_content in files:
-        if file_name == "LAST_MODIFICATION_README.md":
-            dbs.project_metadata["LAST_MODIFICATION_README.md"] = file_content
-        else:
-            dbs.workspace[file_name] = file_content
-
-
-def get_code_strings(input) -> dict[str, str]:
-    """
-    Read file_list.txt and return file names and their content.
-
-    Parameters
-    ----------
-    input : dict
-        A dictionary containing the file_list.txt.
-
-    Returns
-    -------
-    dict[str, str]
-        A dictionary mapping file names to their content.
-    """
-    files_paths = input["file_list.txt"].strip().split("\n")
-    files_dict = {}
-    for full_file_path in files_paths:
-        with open(full_file_path, "r") as file:
-            file_data = file.read()
-        if file_data:
-            # TODO: Should below be the full path?
-            file_name = os.path.relpath(full_file_path, input.path)
-            files_dict[file_name] = file_data
-    return files_dict
-
-
-def format_file_to_input(file_name: str, file_content: str) -> str:
-    """
-    Format a file string to use as input to the AI agent.
-
-    Parameters
-    ----------
-    file_name : str
-        The name of the file.
-    file_content : str
-        The content of the file.
-
-    Returns
-    -------
-    str
-        The formatted file string.
-    """
-    file_str = f"""
-    {file_name}
-    ```
-    {file_content}
-    ```
-    """
-    return file_str
diff --git a/gpt_engineer/main.py b/gpt_engineer/main.py
deleted file mode 100644
index 4d78203a47..0000000000
--- a/gpt_engineer/main.py
+++ /dev/null
@@ -1,108 +0,0 @@
-import logging
-import os
-
-from pathlib import Path
-
-import openai
-import typer
-
-from dotenv import load_dotenv
-
-from gpt_engineer.ai import AI
-from gpt_engineer.collect import collect_learnings
-from gpt_engineer.db import DB, DBs, archive
-from gpt_engineer.learning import collect_consent
-from gpt_engineer.steps import STEPS, Config as StepsConfig
-
-app = typer.Typer()  # creates a CLI app
-
-
-def load_env_if_needed():
-    if os.getenv("OPENAI_API_KEY") is None:
-        load_dotenv()
-    openai.api_key = os.getenv("OPENAI_API_KEY")
-
-
-@app.command()
-def main(
-    project_path: str = typer.Argument("projects/example", help="path"),
-    model: str = typer.Argument("gpt-4", help="model id string"),
-    temperature: float = 0.1,
-    steps_config: StepsConfig = typer.Option(
-        StepsConfig.DEFAULT, "--steps", "-s", help="decide which steps to run"
-    ),
-    improve_option: bool = typer.Option(
-        False,
-        "--improve",
-        "-i",
-        help="Improve code from existing project.",
-    ),
-    azure_endpoint: str = typer.Option(
-        "",
-        "--azure",
-        "-a",
-        help="""Endpoint for your Azure OpenAI Service (https://xx.openai.azure.com).
-            In that case, the given model is the deployment name chosen in the Azure AI Studio.""",
-    ),
-    verbose: bool = typer.Option(False, "--verbose", "-v"),
-):
-    logging.basicConfig(level=logging.DEBUG if verbose else logging.INFO)
-
-    # For the improve option take current project as path and add .gpteng folder
-    if improve_option:
-        # The default option for the --improve is the IMPROVE_CODE, not DEFAULT
-        if steps_config == StepsConfig.DEFAULT:
-            steps_config = StepsConfig.IMPROVE_CODE
-
-    load_env_if_needed()
-
-    ai = AI(
-        model_name=model,
-        temperature=temperature,
-        azure_endpoint=azure_endpoint,
-    )
-
-    input_path = Path(project_path).absolute()
-    workspace_path = input_path
-    base_metadata_path = input_path / ".gpteng"
-    memory_path = base_metadata_path / "memory"
-    archive_path = base_metadata_path / "archive"
-
-    dbs = DBs(
-        memory=DB(memory_path),
-        logs=DB(memory_path / "logs"),
-        input=DB(workspace_path),
-        workspace=DB(workspace_path),
-        preprompts=DB(
-            Path(__file__).parent / "preprompts"
-        ),  # Loads preprompts from the preprompts directory
-        archive=DB(archive_path),
-        project_metadata=DB(base_metadata_path),
-    )
-
-    if steps_config not in [
-        StepsConfig.EXECUTE_ONLY,
-        StepsConfig.USE_FEEDBACK,
-        StepsConfig.EVALUATE,
-        StepsConfig.IMPROVE_CODE,
-    ]:
-        archive(dbs)
-
-    if not dbs.input.get("prompt"):
-        dbs.input["prompt"] = input(
-            "\nWhat application do you want gpt-engineer to generate?\n"
-        )
-
-    steps = STEPS[steps_config]
-    for step in steps:
-        messages = step(ai, dbs)
-        dbs.logs[step.__name__] = AI.serialize_messages(messages)
-
-    if collect_consent():
-        collect_learnings(model, temperature, steps, dbs)
-
-    dbs.logs["token_usage"] = ai.format_token_usage_log()
-
-
-if __name__ == "__main__":
-    app()
diff --git a/gpt_engineer/steps.py b/gpt_engineer/steps.py
deleted file mode 100644
index b0be9425a8..0000000000
--- a/gpt_engineer/steps.py
+++ /dev/null
@@ -1,503 +0,0 @@
-import inspect
-import os
-import re
-import subprocess
-
-from enum import Enum
-from typing import List, Union
-
-from langchain.schema import AIMessage, HumanMessage, SystemMessage
-from termcolor import colored
-
-from gpt_engineer.ai import AI
-from gpt_engineer.chat_to_files import (
-    format_file_to_input,
-    get_code_strings,
-    overwrite_files,
-    to_files,
-    to_files_,
-)
-from gpt_engineer.db import DBs
-from gpt_engineer.file_selector import FILE_LIST_NAME, ask_for_files
-from gpt_engineer.learning import human_review_input
-
-Message = Union[AIMessage, HumanMessage, SystemMessage]
-
-
-def setup_sys_prompt(dbs: DBs) -> str:
-    """
-    Primes the AI with instructions as to how it should
-    generate code and the philosophy to follow
-    """
-    return (
-        dbs.preprompts["roadmap"]
-        + dbs.preprompts["generate"]
-        + "\nUseful to know:\n"
-        + dbs.preprompts["philosophy"]
-    )
-
-
-def setup_sys_prompt_existing_code(dbs: DBs) -> str:
-    """
-    Similar to code generation, but using an existing code base.
-    """
-    return (
-        dbs.preprompts["implement_on_existing"]
-        + "\nUseful to know:\n"
-        + dbs.preprompts["philosophy"]
-    )
-
-
-def get_prompt(dbs: DBs) -> str:
-    """
-    Loads the user's prompt for the project from prompt file
-    (While we migrate we have this fallback getter)
-    """
-    assert (
-        "prompt" in dbs.input or "main_prompt" in dbs.input
-    ), "Please put your prompt in the file `prompt` in the project directory"
-
-    if "prompt" not in dbs.input:
-        print(
-            colored("Please put the prompt in the file `prompt`, not `main_prompt", "red")
-        )
-        print()
-        return dbs.input["main_prompt"]
-
-    return dbs.input["prompt"]
-
-
-def curr_fn() -> str:
-    """
-    Get the name of the current function
-    NOTE: This will be the name of the function that called this function,
-    so it serves to ensure we don't hardcode the function name in the step,
-    but allow the step names to be refactored
-    """
-    return inspect.stack()[1].function
-
-
-# All steps below have the Step signature
-
-
-def simple_gen(ai: AI, dbs: DBs) -> List[Message]:
-    """Run the AI on the main prompt and save the results"""
-    messages = ai.start(setup_sys_prompt(dbs), get_prompt(dbs), step_name=curr_fn())
-
-    SERVICE_MODE = os.environ.get("SERVICE_MODE", False)
-
-    if SERVICE_MODE:
-        to_files_(messages[-1].content.strip(), dbs)
-    else:
-        to_files(messages[-1].content.strip(), dbs.workspace)
-
-    return messages
-
-
-def clarify(ai: AI, dbs: DBs) -> List[Message]:
-    """
-    Ask the user if they want to clarify anything and save the results to the workspace
-    """
-    messages: List[Message] = [ai.fsystem(dbs.preprompts["clarify"])]
-    user_input = get_prompt(dbs)
-    while True:
-        messages = ai.next(messages, user_input, step_name=curr_fn())
-        msg = messages[-1].content.strip()
-
-        if msg == "Nothing more to clarify.":
-            break
-
-        if msg.lower().startswith("no"):
-            print("Nothing more to clarify.")
-            break
-
-        print()
-        user_input = input('(answer in text, or "c" to move on)\n')
-        print()
-
-        if not user_input or user_input == "c":
-            print("(letting gpt-engineer make its own assumptions)")
-            print()
-            messages = ai.next(
-                messages,
-                "Make your own assumptions and state them explicitly before starting",
-                step_name=curr_fn(),
-            )
-            print()
-            return messages
-
-        user_input += (
-            "\n\n"
-            "Is anything else unclear? If yes, only answer in the form:\n"
-            "{remaining unclear areas} remaining questions.\n"
-            "{Next question}\n"
-            'If everything is sufficiently clear, only answer "Nothing more to clarify.".'
-        )
-
-    print()
-    return messages
-
-
-def gen_spec(ai: AI, dbs: DBs) -> List[Message]:
-    """
-    Generate a spec from the main prompt + clarifications and save the results to
-    the workspace
-    """
-    messages = [
-        ai.fsystem(setup_sys_prompt(dbs)),
-        ai.fsystem(f"Instructions: {dbs.input['prompt']}"),
-    ]
-
-    messages = ai.next(messages, dbs.preprompts["spec"], step_name=curr_fn())
-
-    dbs.memory["specification"] = messages[-1].content.strip()
-
-    return messages
-
-
-def respec(ai: AI, dbs: DBs) -> List[Message]:
-    """Asks the LLM to review the specs so far and reiterate them if necessary"""
-    messages = AI.deserialize_messages(dbs.logs[gen_spec.__name__])
-    messages += [ai.fsystem(dbs.preprompts["respec"])]
-
-    messages = ai.next(messages, step_name=curr_fn())
-    messages = ai.next(
-        messages,
-        (
-            "Based on the conversation so far, please reiterate the specification for "
-            "the program. "
-            "If there are things that can be improved, please incorporate the "
-            "improvements. "
-            "If you are satisfied with the specification, just write out the "
-            "specification word by word again."
-        ),
-        step_name=curr_fn(),
-    )
-
-    dbs.memory["specification"] = messages[-1].content.strip()
-    return messages
-
-
-def gen_unit_tests(ai: AI, dbs: DBs) -> List[dict]:
-    """
-    Generate unit tests based on the specification, that should work.
-    """
-    messages = [
-        ai.fsystem(setup_sys_prompt(dbs)),
-        ai.fuser(f"Instructions: {dbs.input['prompt']}"),
-        ai.fuser(f"Specification:\n\n{dbs.memory['specification']}"),
-    ]
-
-    messages = ai.next(messages, dbs.preprompts["unit_tests"], step_name=curr_fn())
-
-    dbs.memory["unit_tests"] = messages[-1].content.strip()
-    to_files(dbs.memory["unit_tests"], dbs.workspace)
-
-    return messages
-
-
-def gen_clarified_code(ai: AI, dbs: DBs) -> List[dict]:
-    """Takes clarification and generates code"""
-    messages = AI.deserialize_messages(dbs.logs[clarify.__name__])
-
-    messages = [
-        ai.fsystem(setup_sys_prompt(dbs)),
-    ] + messages[
-        1:
-    ]  # skip the first clarify message, which was the original clarify priming prompt
-    messages = ai.next(messages, dbs.preprompts["generate"], step_name=curr_fn())
-
-    to_files(messages[-1].content.strip(), dbs.workspace)
-    return messages
-
-
-def gen_code_after_unit_tests(ai: AI, dbs: DBs) -> List[dict]:
-    """Generates project code after unit tests have been produced"""
-    messages = [
-        ai.fsystem(setup_sys_prompt(dbs)),
-        ai.fuser(f"Instructions: {dbs.input['prompt']}"),
-        ai.fuser(f"Specification:\n\n{dbs.memory['specification']}"),
-        ai.fuser(f"Unit tests:\n\n{dbs.memory['unit_tests']}"),
-    ]
-    messages = ai.next(messages, dbs.preprompts["generate"], step_name=curr_fn())
-    to_files(messages[-1].content.strip(), dbs.workspace)
-    return messages
-
-
-def execute_entrypoint(ai: AI, dbs: DBs) -> List[dict]:
-    command = dbs.workspace["run.sh"]
-
-    print()
-    print(
-        colored(
-            "Do you want to execute this code? (y/n)",
-            "red",
-        )
-    )
-    print()
-    print(command)
-    print()
-    print("To execute, you can also press enter.")
-    print()
-    if input() not in ["", "y", "yes"]:
-        print("Ok, not executing the code.")
-        return []
-    print("Executing the code...")
-    print()
-    print(
-        colored(
-            "Note: If it does not work as expected, consider running the code"
-            + " in another way than above.",
-            "green",
-        )
-    )
-    print()
-    print("You can press ctrl+c *once* to stop the execution.")
-    print()
-
-    p = subprocess.Popen("bash run.sh", shell=True, cwd=dbs.workspace.path)
-    try:
-        p.wait()
-    except KeyboardInterrupt:
-        print()
-        print("Stopping execution.")
-        print("Execution stopped.")
-        p.kill()
-        print()
-
-    return []
-
-
-def gen_entrypoint(ai: AI, dbs: DBs) -> List[dict]:
-    messages = ai.start(
-        system=(
-            "You will get information about a codebase that is currently on disk in "
-            "the current folder.\n"
-            "From this you will answer with code blocks that includes all the necessary "
-            "unix terminal commands to "
-            "a) install dependencies "
-            "b) run all necessary parts of the codebase (in parallel if necessary).\n"
-            "Do not install globally. Do not use sudo.\n"
-            "Do not explain the code, just give the commands.\n"
-            "Do not use placeholders, use example values (like . for a folder argument) "
-            "if necessary.\n"
-        ),
-        user="Information about the codebase:\n\n"
-        + dbs.project_metadata["all_output.txt"],
-        step_name=curr_fn(),
-    )
-    print()
-
-    regex = r"```\S*\n(.+?)```"
-    matches = re.finditer(regex, messages[-1].content.strip(), re.DOTALL)
-    dbs.workspace["run.sh"] = "\n".join(match.group(1) for match in matches)
-    return messages
-
-
-def use_feedback(ai: AI, dbs: DBs):
-    messages = [
-        ai.fsystem(setup_sys_prompt(dbs)),
-        ai.fuser(f"Instructions: {dbs.input['prompt']}"),
-        ai.fassistant(
-            dbs.workspace["all_output.txt"]
-        ),  # reload previously generated code
-    ]
-    if dbs.input["feedback"]:
-        messages = ai.next(messages, dbs.input["feedback"], step_name=curr_fn())
-        to_files(messages[-1].content.strip(), dbs.workspace)
-        return messages
-    else:
-        print(
-            "No feedback was found in the input folder. Please create a file "
-            + "called 'feedback' in the same folder as the prompt file."
-        )
-        exit(1)
-
-
-def set_improve_filelist(ai: AI, dbs: DBs):
-    """Sets the file list for files to work with in existing code mode."""
-    ask_for_files(dbs.input)  # stores files as full paths.
-    return []
-
-
-def assert_files_ready(ai: AI, dbs: DBs):
-    """Checks that the required files are present for headless
-    improve code execution."""
-    assert (
-        "file_list.txt" in dbs.input
-    ), "For auto_mode file_list.txt need to be in your project folder."
-    assert "prompt" in dbs.input, "For auto_mode a prompt file must exist."
-    return []
-
-
-def get_improve_prompt(ai: AI, dbs: DBs):
-    """
-    Asks the user what they would like to fix.
-    """
-
-    if not dbs.input.get("prompt"):
-        dbs.input["prompt"] = input(
-            "\nWhat do you need to improve with the selected files?\n"
-        )
-
-    confirm_str = "\n".join(
-        [
-            "-----------------------------",
-            "The following files will be used in the improvement process:",
-            f"{FILE_LIST_NAME}:",
-            str(dbs.input["file_list.txt"]),
-            "",
-            "The inserted prompt is the following:",
-            f"'{dbs.input['prompt']}'",
-            "-----------------------------",
-            "",
-            "You can change these files in your project before proceeding.",
-            "",
-            "Press enter to proceed with modifications.",
-            "",
-        ]
-    )
-    input(confirm_str)
-    return []
-
-
-def improve_existing_code(ai: AI, dbs: DBs):
-    """
-    After the file list and prompt have been aquired, this function is called
-    to sent the formatted prompt to the LLM.
-    """
-
-    files_info = get_code_strings(dbs.input)
-
-    messages = [
-        ai.fsystem(setup_sys_prompt_existing_code(dbs)),
-        ai.fuser(f"Instructions: {dbs.input['prompt']}"),
-    ]
-    # Add files as input
-    for file_name, file_str in files_info.items():
-        code_input = format_file_to_input(file_name, file_str)
-        messages.append(ai.fuser(f"{code_input}"))
-
-    output_format_str = """
-    Make sure the output of any files is in the following format where
-    FILENAME is the file name including the file extension, and the file path. Do not
-    forget to include the file path.
-    LANG is the markup code block language for the code's language, and CODE is the code:
-
-    FILENAME
-    ```LANG
-    CODE
-    ```
-    """
-
-    messages = ai.next(messages, output_format_str, step_name=curr_fn())
-    # Maybe we should add another step called "replace" or "overwrite"
-    overwrite_files(messages[-1].content.strip(), dbs)
-    return messages
-
-
-def fix_code(ai: AI, dbs: DBs):
-    messages = AI.deserialize_messages(dbs.logs[gen_code_after_unit_tests.__name__])
-    code_output = messages[-1].content.strip()
-    messages = [
-        ai.fsystem(setup_sys_prompt(dbs)),
-        ai.fuser(f"Instructions: {dbs.input['prompt']}"),
-        ai.fuser(code_output),
-        ai.fsystem(dbs.preprompts["fix_code"]),
-    ]
-    messages = ai.next(
-        messages, "Please fix any errors in the code above.", step_name=curr_fn()
-    )
-    to_files(messages[-1].content.strip(), dbs.workspace)
-    return messages
-
-
-def human_review(ai: AI, dbs: DBs):
-    """Collects and stores human review of the code"""
-    review = human_review_input()
-    if review is not None:
-        dbs.memory["review"] = review.to_json()  # type: ignore
-    return []
-
-
-class Config(str, Enum):
-    DEFAULT = "default"
-    BENCHMARK = "benchmark"
-    SIMPLE = "simple"
-    TDD = "tdd"
-    TDD_PLUS = "tdd+"
-    CLARIFY = "clarify"
-    RESPEC = "respec"
-    EXECUTE_ONLY = "execute_only"
-    EVALUATE = "evaluate"
-    USE_FEEDBACK = "use_feedback"
-    IMPROVE_CODE = "improve_code"
-    EVAL_IMPROVE_CODE = "eval_improve_code"
-
-
-# Define the steps to run for different configs
-STEPS = {
-    Config.DEFAULT: [
-        clarify,
-        gen_clarified_code,
-        gen_entrypoint,
-        execute_entrypoint,
-        human_review,
-    ],
-    Config.BENCHMARK: [
-        simple_gen,
-        gen_entrypoint,
-    ],
-    Config.SIMPLE: [
-        simple_gen,
-        gen_entrypoint,
-        # execute_entrypoint,
-    ],
-    Config.TDD: [
-        gen_spec,
-        gen_unit_tests,
-        gen_code_after_unit_tests,
-        gen_entrypoint,
-        execute_entrypoint,
-        human_review,
-    ],
-    Config.TDD_PLUS: [
-        gen_spec,
-        gen_unit_tests,
-        gen_code_after_unit_tests,
-        fix_code,
-        gen_entrypoint,
-        execute_entrypoint,
-        human_review,
-    ],
-    Config.CLARIFY: [
-        clarify,
-        gen_clarified_code,
-        gen_entrypoint,
-        execute_entrypoint,
-        human_review,
-    ],
-    Config.RESPEC: [
-        gen_spec,
-        respec,
-        gen_unit_tests,
-        gen_code_after_unit_tests,
-        fix_code,
-        gen_entrypoint,
-        execute_entrypoint,
-        human_review,
-    ],
-    Config.USE_FEEDBACK: [use_feedback, gen_entrypoint, execute_entrypoint, human_review],
-    Config.EXECUTE_ONLY: [execute_entrypoint],
-    Config.EVALUATE: [execute_entrypoint, human_review],
-    Config.IMPROVE_CODE: [
-        set_improve_filelist,
-        get_improve_prompt,
-        improve_existing_code,
-    ],
-    Config.EVAL_IMPROVE_CODE: [assert_files_ready, improve_existing_code],
-}
-
-# Future steps that can be added:
-# run_tests_and_fix_files
-# execute_entrypoint_and_fix_files_if_it_results_in_error