workflows/gen_ut/propose_test.py

from typing import List
import tiktoken
import json

from openai_util import create_chat_completion_content
from prompts import PROPOSE_TEST_PROMPT
from model import FuncToTest, TokenBudgetExceededException


# Chat model used for proposing test cases. The same name is used to look up
# the tiktoken encoding when counting prompt tokens.
# Alternative model: "gpt-4-1106-preview"
MODEL = "gpt-3.5-turbo-1106"
# Upper bound (in tokens) for the user message: 90% of 16000.
# NOTE(review): 16000 presumably approximates the model's context size - confirm.
TOKEN_BUDGET = int(0.9 * 16_000)


def _mk_user_msg(
    user_prompt: str,
    func_to_test: FuncToTest,
    chat_language: str,
) -> str:
    """
    Create a user message to be sent to the model within the token budget.

    Candidate messages are tried from most to least context: the function
    code together with its container (class) code first, then the function
    code alone. The first candidate whose token count does not exceed
    TOKEN_BUDGET is returned.

    Args:
        user_prompt (str): Text inserted into PROPOSE_TEST_PROMPT as `user_prompt`.
        func_to_test (FuncToTest): The target function; its `func_name`,
            `file_path`, `func_content` and (optional) `container_content`
            are embedded in the message.
        chat_language (str): Value inserted into PROPOSE_TEST_PROMPT as
            `chat_language`.

    Returns:
        str: The formatted prompt that fits within TOKEN_BUDGET.

    Raises:
        TokenBudgetExceededException: If even the message containing only the
            function code exceeds TOKEN_BUDGET.
    """
    encoding: tiktoken.Encoding = tiktoken.encoding_for_model(MODEL)

    func_content = f"function code\n```\n{func_to_test.func_content}\n```\n"
    class_content = ""
    if func_to_test.container_content is not None:
        class_content = f"class code\n```\n{func_to_test.container_content}\n```\n"

    # Relevant content candidates, ordered from richest to leanest:
    # 1. both func content and class content
    # 2. only func content
    candidates = (
        "\n".join([func_content, class_content]),
        func_content,
    )

    token_count = 0
    for relevant_content in candidates:
        usr_msg = PROPOSE_TEST_PROMPT.format(
            user_prompt=user_prompt,
            function_name=func_to_test.func_name,
            file_path=func_to_test.file_path,
            relevant_content=relevant_content,
            chat_language=chat_language,
        )
        # disallowed_special=() makes tiktoken count special-token look-alikes
        # (e.g. "<|endoftext|>" appearing in the code under test) as ordinary
        # text instead of raising ValueError.
        token_count = len(encoding.encode(usr_msg, disallowed_special=()))
        if token_count <= TOKEN_BUDGET:
            return usr_msg

    # 3. even func content exceeds the token budget
    raise TokenBudgetExceededException(
        f"Token budget exceeded while proposing test cases for <{func_to_test}>. "
        f"({token_count}/{TOKEN_BUDGET})"
    )


def propose_test(
    user_prompt: str,
    func_to_test: FuncToTest,
    chat_language: str = "English",
) -> List[str]:
    """Propose test cases for a specified function based on a user prompt

    Builds a budget-limited user message, sends it to MODEL requesting a JSON
    object, and collects the non-empty `description` of every entry under the
    `test_cases` key of the response.

    Args:
        user_prompt (str): The prompt or description for which test cases need to be generated.
        func_to_test (FuncToTest): The function to generate test cases for; its
            name, file path and code are embedded in the message.
        chat_language (str): Value passed to the prompt template as
            `chat_language` (presumably the language the model should answer
            in - confirm against PROPOSE_TEST_PROMPT). Defaults to "English".

    Returns:
        List[str]: A list of test case descriptions. Empty when the response
            has no usable `test_cases` entries.

    Raises:
        TokenBudgetExceededException: Propagated from `_mk_user_msg` when the
            message cannot be made to fit the token budget.
        json.JSONDecodeError: If the model response is not valid JSON.
    """
    user_msg = _mk_user_msg(
        user_prompt=user_prompt,
        func_to_test=func_to_test,
        chat_language=chat_language,
    )

    content = create_chat_completion_content(
        model=MODEL,
        messages=[{"role": "user", "content": user_msg}],
        response_format={"type": "json_object"},
        temperature=0.1,
    )

    cases = json.loads(content).get("test_cases")
    # The model output is not guaranteed to follow the requested schema:
    # treat a missing/null/non-list "test_cases" as "no proposals".
    if not isinstance(cases, list):
        cases = []

    # Keep only well-formed entries that carry a non-empty description.
    return [
        case["description"]
        for case in cases
        if isinstance(case, dict) and case.get("description")
    ]
Manage prompts in a single file and ignore line-too-long error 2023-12-24 19:43:29 +08:00			`from typing import List`
Init /gen_ut 2023-12-18 20:46:16 +08:00			`import tiktoken`
			`import json`
Use create completion wrappers in propose_test and write_tests 2023-12-24 19:15:43 +08:00
			`from openai_util import create_chat_completion_content`
Manage prompts in a single file and ignore line-too-long error 2023-12-24 19:43:29 +08:00			`from prompts import PROPOSE_TEST_PROMPT`
Adjust content to fit token budget and handle budget exceeded exception 2023-12-28 15:56:15 +08:00			`from model import FuncToTest, TokenBudgetExceededException`
Init /gen_ut 2023-12-18 20:46:16 +08:00

Extract function content when line numbers are provided 2023-12-18 22:21:12 +08:00			`MODEL = "gpt-3.5-turbo-1106"`
			`# MODEL = "gpt-4-1106-preview"`
Update token budgets 2023-12-28 17:09:06 +08:00			`TOKEN_BUDGET = int(16000 * 0.9)`
Adjust content to fit token budget and handle budget exceeded exception 2023-12-28 15:56:15 +08:00

			`def _mk_user_msg(`
			`user_prompt: str,`
			`func_to_test: FuncToTest,`
			`chat_language: str,`
			`) -> str:`
			`"""`
			`Create a user message to be sent to the model within the token budget.`
			`"""`
			`encoding: tiktoken.Encoding = tiktoken.encoding_for_model(MODEL)`

			func_content = f"function code\n```\n{func_to_test.func_content}\n```\n"
			`class_content = ""`
			`if func_to_test.container_content is not None:`
			class_content = f"class code\n```\n{func_to_test.container_content}\n```\n"

			`# Adjust relevant content to fit the token budget`

			`# 1. both func content and class content`
			`relevant_content = "\n".join([func_content, class_content])`
			`usr_msg = PROPOSE_TEST_PROMPT.format(`
			`user_prompt=user_prompt,`
			`function_name=func_to_test.func_name,`
			`file_path=func_to_test.file_path,`
			`relevant_content=relevant_content,`
			`chat_language=chat_language,`
			`)`
			`token_count = len(encoding.encode(usr_msg))`
			`if token_count <= TOKEN_BUDGET:`
			`return usr_msg`

			`# 2. only func content`
			`relevant_content = func_content`
			`usr_msg = PROPOSE_TEST_PROMPT.format(`
			`user_prompt=user_prompt,`
			`function_name=func_to_test.func_name,`
			`file_path=func_to_test.file_path,`
			`relevant_content=relevant_content,`
			`chat_language=chat_language,`
			`)`
			`token_count = len(encoding.encode(usr_msg))`
			`if token_count <= TOKEN_BUDGET:`
			`return usr_msg`

			`# 3. even func content exceeds the token budget`
			`raise TokenBudgetExceededException(`
Improve the output of token budget exception 2023-12-28 16:40:42 +08:00			`f"Token budget exceeded while proposing test cases for <{func_to_test}>. "`
Adjust content to fit token budget and handle budget exceeded exception 2023-12-28 15:56:15 +08:00			`f"({token_count}/{TOKEN_BUDGET})"`
			`)`
Init /gen_ut 2023-12-18 20:46:16 +08:00

			`def propose_test(`
			`user_prompt: str,`
Adjust content to fit token budget and handle budget exceeded exception 2023-12-28 15:56:15 +08:00			`func_to_test: FuncToTest,`
Support different languages in llm chatting 2023-12-24 17:31:35 +08:00			`chat_language: str = "English",`
Init /gen_ut 2023-12-18 20:46:16 +08:00			`) -> List[str]:`
			`"""Propose test cases for a specified function based on a user prompt`

			`Args:`
			`user_prompt (str): The prompt or description for which test cases need to be generated.`
			`function_name (str): The name of the function to generate test cases for.`
			`file_path (str): The absolute path to the file containing the target function for which`
			`test cases will be generated.`
Extract function content when line numbers are provided 2023-12-18 22:21:12 +08:00
Init /gen_ut 2023-12-18 20:46:16 +08:00			`Returns:`
			`List[str]: A list of test case descriptions.`
			`"""`
Adjust content to fit token budget and handle budget exceeded exception 2023-12-28 15:56:15 +08:00			`user_msg = _mk_user_msg(`
Init /gen_ut 2023-12-18 20:46:16 +08:00			`user_prompt=user_prompt,`
Adjust content to fit token budget and handle budget exceeded exception 2023-12-28 15:56:15 +08:00			`func_to_test=func_to_test,`
Support different languages in llm chatting 2023-12-24 17:31:35 +08:00			`chat_language=chat_language,`
Init /gen_ut 2023-12-18 20:46:16 +08:00			`)`

Use create completion wrappers in propose_test and write_tests 2023-12-24 19:15:43 +08:00			`content = create_chat_completion_content(`
Init /gen_ut 2023-12-18 20:46:16 +08:00			`model=MODEL,`
			`messages=[{"role": "user", "content": user_msg}],`
			`response_format={"type": "json_object"},`
			`temperature=0.1,`
			`)`

			`cases = json.loads(content).get("test_cases", [])`

			`descriptions = []`
			`for case in cases:`
			`description = case.get("description", None)`
			`if description:`
			`descriptions.append(description)`
Extract function content when line numbers are provided 2023-12-18 22:21:12 +08:00
Init /gen_ut 2023-12-18 20:46:16 +08:00			`return descriptions`