# workflows/merico/unit_tests/write_tests.py
from functools import partial
from typing import List, Optional

from devchat.llm.chat import chat_completion_stream_out

from find_context import Context
from llm_conf import (
    CONTEXT_SIZE,
    DEFAULT_CONTEXT_SIZE,
    DEFAULT_ENCODING,
    USE_USER_MODEL,
    USER_LLM_MODEL,
)
from model import FuncToTest, TokenBudgetExceededException
from openai_util import create_chat_completion_chunks
from prompts import WRITE_TESTS_PROMPT
from tools.file_util import retrieve_file_content
from tools.tiktoken_util import get_encoding
MODEL = USER_LLM_MODEL if USE_USER_MODEL else "gpt-4-turbo-preview"
ENCODING = (
get_encoding(DEFAULT_ENCODING) # Use default encoding as an approximation
if USE_USER_MODEL
else get_encoding("cl100k_base")
)
TOKEN_BUDGET = int(CONTEXT_SIZE.get(MODEL, DEFAULT_CONTEXT_SIZE) * 0.9)
2023-12-18 20:46:16 +08:00
def _mk_write_tests_msg(
2023-12-18 20:46:16 +08:00
root_path: str,
func_to_test: FuncToTest,
2023-12-18 20:46:16 +08:00
test_cases: List[str],
chat_language: str,
2023-12-18 20:46:16 +08:00
reference_files: Optional[List[str]] = None,
# context_files: Optional[List[str]] = None,
2024-03-06 15:35:21 +08:00
symbol_contexts: Optional[List[Context]] = None,
user_requirements: str = "",
) -> Optional[str]:
additional_requirements = ""
if user_requirements:
additional_requirements = f"Additional requirements\n\n{user_requirements}\n\n"
2023-12-18 20:46:16 +08:00
test_cases_str = ""
for i, test_case in enumerate(test_cases, 1):
test_cases_str += f"{i}. {test_case}\n"
reference_content = "\nContent of reference test code:\n\n"
2023-12-18 20:46:16 +08:00
if reference_files:
for i, fp in enumerate(reference_files, 1):
2023-12-24 20:13:30 +08:00
reference_test_content = retrieve_file_content(fp, root_path)
reference_content += f"{i}. {fp}\n\n"
reference_content += f"```{reference_test_content}```\n\n"
2023-12-18 20:46:16 +08:00
else:
reference_content += "No reference test cases provided.\n\n"
2023-12-18 20:46:16 +08:00
func_content = f"\nfunction code\n```\n{func_to_test.func_content}\n```\n"
class_content = ""
if func_to_test.container_content is not None:
class_content = f"\nclass code\n```\n{func_to_test.container_content}\n```\n"
context_content = ""
2024-03-06 15:35:21 +08:00
if symbol_contexts:
context_content += "\n\nrelevant context\n\n"
context_content += "\n\n".join([str(c) for c in symbol_contexts])
context_content += "\n\n"
# if context_files:
# context_content += "\n\nrelevant context files\n\n"
# for i, fp in enumerate(context_files, 1):
# context_file_content = retrieve_file_content(fp, root_path)
# context_content += f"{i}. {fp}\n\n"
# context_content += f"```{context_file_content}```\n\n"
# Prepare a list of user messages to fit the token budget
# by adjusting the relevant content and reference content
content_fmt = partial(
WRITE_TESTS_PROMPT.format,
function_name=func_to_test.func_name,
file_path=func_to_test.file_path,
2023-12-18 20:46:16 +08:00
test_cases_str=test_cases_str,
chat_language=chat_language,
additional_requirements=additional_requirements,
2023-12-18 20:46:16 +08:00
)
# NOTE: adjust symbol_context content more flexibly if needed
msg_0 = content_fmt(
relevant_content="\n".join([func_content, class_content, context_content]),
reference_content=reference_content,
)
# 1. func content & class content & reference file content
msg_1 = content_fmt(
relevant_content="\n".join([func_content, class_content]),
reference_content=reference_content,
)
# 2. func content & class content
msg_2 = content_fmt(
relevant_content="\n".join([func_content, class_content]),
reference_content="",
)
# 3. func content only
msg_3 = content_fmt(
relevant_content=func_content,
reference_content="",
)
prioritized_msgs = [msg_0, msg_1, msg_2, msg_3]
for msg in prioritized_msgs:
tokens = len(ENCODING.encode(msg, disallowed_special=()))
if tokens <= TOKEN_BUDGET:
return msg
2023-12-18 20:46:16 +08:00
# 3. even func content exceeds the token budget
raise TokenBudgetExceededException(
f"Token budget exceeded while writing test cases for <{func_to_test}>. "
f"({tokens}/{TOKEN_BUDGET})"
)
def write_and_print_tests(
root_path: str,
func_to_test: FuncToTest,
test_cases: List[str],
reference_files: Optional[List[str]] = None,
2024-03-06 15:35:21 +08:00
symbol_contexts: Optional[List[Context]] = None,
user_requirements: str = "",
chat_language: str = "English",
2023-12-24 20:13:30 +08:00
) -> None:
user_msg = _mk_write_tests_msg(
root_path=root_path,
func_to_test=func_to_test,
test_cases=test_cases,
reference_files=reference_files,
2024-03-06 15:35:21 +08:00
symbol_contexts=symbol_contexts,
user_requirements=user_requirements,
chat_language=chat_language,
2023-12-18 20:46:16 +08:00
)
if USE_USER_MODEL:
# Use the wrapped api
response = chat_completion_stream_out(
messages=[{"role": "user", "content": user_msg}],
llm_config={"model": MODEL, "temperature": 0.1},
)
if not response.get("content", None):
raise response["error"]
2023-12-18 20:46:16 +08:00
else:
# Use the openai api parameters
chunks = create_chat_completion_chunks(
model=MODEL,
messages=[{"role": "user", "content": user_msg}],
temperature=0.1,
)
for chunk in chunks:
if chunk.choices[0].finish_reason == "stop":
break
2024-03-13 10:58:07 +08:00
content = chunk.choices[0].delta.content
if content is not None:
print(content, flush=True, end="")