workflows/libs/llm_api/openai.py

# flake8: noqa: E402
import json
import os
import re
import sys
from typing import Dict, List

import openai

sys.path.append(os.path.join(os.path.dirname(__file__), ".."))

from ide_services.services import log_warn


def _try_remove_markdown_block_flag(content):
    """
    Return the body of a fenced Markdown code block found in ``content``.

    The opening fence may carry an info string (for example a language tag
    such as "json" or "c++") or be bare; the info string, if any, must sit on
    the same line as the opening fence. Text before or after the fenced block
    is ignored, and only the first fenced block is used.

    Args:
        content: Text that may contain a fenced Markdown block.

    Returns:
        The text between the fences with surrounding whitespace stripped, or
        ``content`` unchanged when no fenced block is found.
    """
    # Opening fence + optional info string limited to that line, then the
    # shortest body that is followed by a closing fence at the end of a line.
    # MULTILINE lets the fences sit on any line of a longer reply; DOTALL lets
    # the body span several lines.
    pattern = r"^\s*```[^`\n]*\n(.*?)\n\s*```\s*$"

    match = re.search(pattern, content, re.DOTALL | re.MULTILINE)
    if match is None:
        # Not a fenced block: hand the text back untouched.
        return content

    return match.group(1).strip()


def chat_completion_stream(
    messages: List[Dict],  # [{"role": "user", "content": "hello"}]
    llm_config: Dict,  # {"model": "...", ...}
    error_out: bool = True,
    stream_out=False,
) -> Dict:
    """
    Request a streamed chat completion and merge the chunks into one result.

    Connection and timeout errors are retried, up to three attempts in total.
    Any other exception ends the call immediately.

    Args:
        messages: Chat messages, e.g. [{"role": "user", "content": "hello"}].
        llm_config: Keyword arguments forwarded to
            ``client.chat.completions.create``. The dict itself is not
            modified; "stream" and "timeout" are overridden on a copy.
        error_out: When True, a non-retryable exception is printed to stderr.
            Connection/timeout errors are always reported through ``log_warn``.
        stream_out: When True, every content fragment is printed to stdout as
            soon as it arrives.

    Returns:
        A dict with the keys "content" (the concatenated text, or None when no
        text was received), "function_name" (name of the requested tool call,
        or None) and "parameters" (the concatenated tool-call arguments, ""
        when there are none). When the request fails the dict additionally
        holds the exception under "error" and "content" is None.
    """
    for try_times in range(3):
        try:
            client = openai.OpenAI(
                api_key=os.environ.get("OPENAI_API_KEY", None),
                base_url=os.environ.get("OPENAI_API_BASE", None),
            )

            # Build the request options on a copy so the caller's dict is not
            # changed as a side effect of this call.
            request_config = {**llm_config, "stream": True, "timeout": 8}
            response = client.chat.completions.create(messages=messages, **request_config)

            response_result = {"content": None, "function_name": None, "parameters": ""}
            content_parts = []
            for chunk in response:  # pylint: disable=E1133
                choices = chunk.dict().get("choices")
                if not choices:
                    # A chunk may carry no choices (for example a usage-only
                    # chunk); there is nothing to merge from it.
                    continue
                delta = choices[0].get("delta") or {}

                tool_calls = delta.get("tool_calls")
                if tool_calls:
                    # Only the first tool-call entry of each delta is read.
                    tool_call = tool_calls[0].get("function") or {}
                    if tool_call.get("name", None):
                        response_result["function_name"] = tool_call["name"]
                    if tool_call.get("arguments", None):
                        response_result["parameters"] += tool_call["arguments"]

                text = delta.get("content", None)
                if text:
                    if stream_out:
                        print(text, end="", flush=True)
                    content_parts.append(text)

            if content_parts:
                response_result["content"] = "".join(content_parts)
            return response_result
        except (openai.APIConnectionError, openai.APITimeoutError) as err:
            log_warn(f"Exception: {err.__class__.__name__}: {err}")
            if try_times >= 2:
                # Last attempt failed as well: give up and report the error.
                return {"content": None, "function_name": None, "parameters": "", "error": err}
            continue
        except Exception as err:
            # Covers openai.APIError and everything else; none of it is retried.
            if error_out:
                print("Exception:", err, file=sys.stderr, flush=True)
            return {"content": None, "function_name": None, "parameters": "", "error": err}


def chat_completion_no_stream_return_json(messages, llm_config, error_out: bool = True):
    """
    Ask the chat completion API for a reply and parse it as JSON.

    The request is made up to three times; a new request is made only when
    the previous reply could not be decoded as JSON.

    Args:
        messages: Chat messages passed on to ``chat_completion_stream``.
        llm_config: Chat configuration passed on to ``chat_completion_stream``.
        error_out: When True, failures are printed to stderr. The flag is also
            forwarded to ``chat_completion_stream`` so that a caller asking
            for silence does not get error output from the request itself.

    Returns:
        The decoded JSON value, or None when the reply has no content, when an
        unexpected error occurs, or when no attempt produced valid JSON.
    """
    for _ in range(3):
        response = chat_completion_stream(messages, llm_config, error_out=error_out)
        if not response["content"]:
            # Empty reply or failed request: retrying is left to the caller.
            return None

        try:
            # json will format as ```json ... ``` in 1106 model
            response_content = _try_remove_markdown_block_flag(response["content"])
            return json.loads(response_content)
        except json.JSONDecodeError:
            log_warn(f"JSONDecodeError: {response['content']}")
            continue
        except Exception as err:
            if error_out:
                print("Exception: ", err, file=sys.stderr, flush=True)
            return None

    # All attempts returned content that was not valid JSON.
    if error_out:
        print("Not valid json response:", response["content"], file=sys.stderr, flush=True)
    return None
-												Add log_info function to ide_services.services.py

											
										
										
											2023-12-20 21:13:05 +08:00
+								# flake8: noqa: E402
-												Sort and format import blocks

											
										
										
											2024-01-05 12:27:57 +08:00
+								import json
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								import os
-												Sort and format import blocks

											
										
										
											2024-01-05 12:27:57 +08:00
+								import re
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
+								import sys
-												chore: Correct lint errors

- Refactored language_prompt to handle Chinese characters
- Updated model_token_limit_error message formatting
- Modified function signature for chat_completion_stream

											
										
										
											2024-01-24 17:34:27 +08:00
+								from typing import Dict, List
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
 								import openai
-												Add log_info function to ide_services.services.py

											
										
										
											2023-12-20 21:13:05 +08:00
+								sys.path.append(os.path.join(os.path.dirname(__file__), ".."))
 								from ide_services.services import log_warn
-												refactor: Update LLM configs and add markdown flag removal

- Updated model version in various LLM configs to 'gpt-3.5-turbo-1106'
- Added '_try_remove_markdown_block_flag' function in openai.py

											
										
										
											2023-12-08 10:55:48 +08:00
 								def _try_remove_markdown_block_flag(content):
 								    """
 								    如果content是一个markdown块，则删除它的头部```xxx和尾部```
 								    """
 								    # 定义正则表达式模式，用于匹配markdown块的头部和尾部
-												Fix format

											
										
										
											2023-12-08 18:28:36 +08:00
+								    pattern = r"^\s*```\s*(\w+)\s*\n(.*?)\n\s*```\s*$"
-												refactor: Update LLM configs and add markdown flag removal

- Updated model version in various LLM configs to 'gpt-3.5-turbo-1106'
- Added '_try_remove_markdown_block_flag' function in openai.py

											
										
										
											2023-12-08 10:55:48 +08:00
+								    # 使用re模块进行匹配
 								    match = re.search(pattern, content, re.DOTALL | re.MULTILINE)
-												Fix format

											
										
										
											2023-12-08 18:28:36 +08:00
-												refactor: Update LLM configs and add markdown flag removal

- Updated model version in various LLM configs to 'gpt-3.5-turbo-1106'
- Added '_try_remove_markdown_block_flag' function in openai.py

											
										
										
											2023-12-08 10:55:48 +08:00
+								    if match:
 								        # 如果匹配成功，则提取出markdown块的内容并返回
-												Fix lint errors

											
										
										
											2023-12-08 18:38:12 +08:00
+								        _ = match.group(1)  # language
-												refactor: Update LLM configs and add markdown flag removal

- Updated model version in various LLM configs to 'gpt-3.5-turbo-1106'
- Added '_try_remove_markdown_block_flag' function in openai.py

											
										
										
											2023-12-08 10:55:48 +08:00
+								        markdown_content = match.group(2)
 								        return markdown_content.strip()
 								    else:
 								        # 如果匹配失败，则返回原始内容
 								        return content
-												Fix format

											
										
										
											2023-12-08 18:28:36 +08:00
-												chore: Correct lint errors

- Refactored language_prompt to handle Chinese characters
- Updated model_token_limit_error message formatting
- Modified function signature for chat_completion_stream

											
										
										
											2024-01-24 17:34:27 +08:00
+								def chat_completion_stream(
 								    messages: List[Dict],  # [{"role": "user", "content": "hello"}]
 								    llm_config: Dict,  # {"model": "...", ...}
 								    error_out: bool = True,
-												Fix commit message length limit

											
										
										
											2024-01-24 18:01:29 +08:00
+								    stream_out=False,
-												chore: Correct lint errors

- Refactored language_prompt to handle Chinese characters
- Updated model_token_limit_error message formatting
- Modified function signature for chat_completion_stream

											
										
										
											2024-01-24 17:34:27 +08:00
+								) -> str:
-												refactor: Update response format and enhance documentation

- Updated the response format to include file paths in filename keys
- Added docstrings to chat_completion functions for better clarity

											
										
										
											2023-12-08 11:08:36 +08:00
+								    """
 								    通过ChatCompletion API获取OpenAI聊天机器人的回复。
-												Fix format

											
										
										
											2023-12-08 18:28:36 +08:00
-												refactor: Update response format and enhance documentation

- Updated the response format to include file paths in filename keys
- Added docstrings to chat_completion functions for better clarity

											
										
										
											2023-12-08 11:08:36 +08:00
+								    Args:
 								        messages: 一个列表，包含用户输入的消息。
 								        llm_config: 一个字典，包含ChatCompletion API的配置信息。
 								        error_out: 如果为True，遇到异常时输出错误信息并返回None，否则返回None。
-												Fix format

											
										
										
											2023-12-08 18:28:36 +08:00
-												refactor: Update response format and enhance documentation

- Updated the response format to include file paths in filename keys
- Added docstrings to chat_completion functions for better clarity

											
										
										
											2023-12-08 11:08:36 +08:00
+								    Returns:
 								        如果成功获取到聊天机器人的回复，返回一个字符串类型的回复消息。如果连接失败，则返回None。
-												Fix format

											
										
										
											2023-12-08 18:28:36 +08:00
-												refactor: Update response format and enhance documentation

- Updated the response format to include file paths in filename keys
- Added docstrings to chat_completion functions for better clarity

											
										
										
											2023-12-08 11:08:36 +08:00
+								    """
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								    for try_times in range(3):
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
+								        try:
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								            client = openai.OpenAI(
 								                api_key=os.environ.get("OPENAI_API_KEY", None),
-												reformat

											
										
										
											2023-12-14 11:01:04 +08:00
+								                base_url=os.environ.get("OPENAI_API_BASE", None),
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								            )
-												reformat

											
										
										
											2023-12-14 11:01:04 +08:00
+								            llm_config["stream"] = True
 								            llm_config["timeout"] = 8
 								            response = client.chat.completions.create(messages=messages, **llm_config)
 								            response_result = {"content": None, "function_name": None, "parameters": ""}
 								            for chunk in response:  # pylint: disable=E1133
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								                chunk = chunk.dict()
 								                delta = chunk["choices"][0]["delta"]
-												reformat

											
										
										
											2023-12-14 11:01:04 +08:00
+								                if "tool_calls" in delta and delta["tool_calls"]:
 								                    tool_call = delta["tool_calls"][0]["function"]
 								                    if tool_call.get("name", None):
 								                        response_result["function_name"] = tool_call["name"]
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								                    if tool_call.get("arguments", None):
 								                        response_result["parameters"] += tool_call["arguments"]
-												reformat

											
										
										
											2023-12-14 11:01:04 +08:00
+								                if delta.get("content", None):
-												feat: Add stream_out parameter to chat_completion_no_stream

- Add stream_out parameter to chat_completion_no_stream function
- Print delta content when stream_out is True
- Ensure seamless streaming of chat completion response

											
										
										
											2024-01-02 21:37:02 +08:00
+								                    if stream_out:
 								                        print(delta["content"], end="", flush=True)
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								                    if response_result["content"]:
 								                        response_result["content"] += delta["content"]
 								                    else:
 								                        response_result["content"] = delta["content"]
 								            return response_result
 								        except (openai.APIConnectionError, openai.APITimeoutError) as err:
-												refactor: Improve user experience and streamline commit workflow

- Simplify and clarify user prompts and output messages
- Remove unnecessary print statements and text
- Handle commit abort and errors more gracefully
- Improve error logging in OpenAI chat stream handler

											
										
										
											2024-01-04 10:59:46 +08:00
+								            log_warn(f"Exception: {err.__class__.__name__}: {err}")
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								            if try_times >= 2:
-												fix: Improve error handling for context overflows

- Refactor error output for token limit issues to ensure clarity
- Update the error handling strategy to unify exception responses
- Remove redundant error handling blocks for streamlining

											
										
										
											2024-01-24 17:34:27 +08:00
+								                return {"content": None, "function_name": None, "parameters": "", "error": err}
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
+								            continue
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								        except openai.APIError as err:
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
+								            if error_out:
-												fix: Improve error handling for context overflows

- Refactor error output for token limit issues to ensure clarity
- Update the error handling strategy to unify exception responses
- Remove redundant error handling blocks for streamlining

											
										
										
											2024-01-24 17:34:27 +08:00
+								                print("Exception:", err, file=sys.stderr, flush=True)
 								            return {"content": None, "function_name": None, "parameters": "", "error": err}
-												fix: Resolve context overflow commit failure

- Updated commit/command.yml to use "en" language code
- Updated commit/commit.py to handle model's maximum context length error
- Updated commit/zh/command.yml to use "zh" language code
- Updated libs/llm_api/openai.py to ignore tokens limit error

Closes devchat-ai/devchat#189

											
										
										
											2024-01-24 17:34:27 +08:00
+								        except Exception as err:
 								            if error_out:
-												fix: Improve error handling for context overflows

- Refactor error output for token limit issues to ensure clarity
- Update the error handling strategy to unify exception responses
- Remove redundant error handling blocks for streamlining

											
										
										
											2024-01-24 17:34:27 +08:00
+								                print("Exception:", err, file=sys.stderr, flush=True)
 								            return {"content": None, "function_name": None, "parameters": "", "error": err}
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
-												Fix format

											
										
										
											2023-12-08 18:28:36 +08:00
 								def chat_completion_no_stream_return_json(messages, llm_config, error_out: bool = True):
-												refactor: Update response format and enhance documentation

- Updated the response format to include file paths in filename keys
- Added docstrings to chat_completion functions for better clarity

											
										
										
											2023-12-08 11:08:36 +08:00
+								    """
-												Fix lint errors

											
										
										
											2023-12-08 18:38:12 +08:00
+								    尝试三次从聊天完成API获取结果，并返回JSON对象。
 								    如果无法解析JSON，将尝试三次，直到出现错误或达到最大尝试次数。
-												Fix format

											
										
										
											2023-12-08 18:28:36 +08:00
-												refactor: Update response format and enhance documentation

- Updated the response format to include file paths in filename keys
- Added docstrings to chat_completion functions for better clarity

											
										
										
											2023-12-08 11:08:36 +08:00
+								    Args:
 								        messages (List[str]): 用户输入的消息列表。
 								        llm_config (Dict[str, Any]): 聊天配置字典。
 								        error_out (bool, optional): 如果为True，则如果出现错误将打印错误消息并返回None。默认为True。
-												Fix format

											
										
										
											2023-12-08 18:28:36 +08:00
-												refactor: Update response format and enhance documentation

- Updated the response format to include file paths in filename keys
- Added docstrings to chat_completion functions for better clarity

											
										
										
											2023-12-08 11:08:36 +08:00
+								    Returns:
-												Fix lint errors

											
										
										
											2023-12-08 18:38:12 +08:00
+								        Dict[str, Any]: 从聊天完成API获取的JSON对象。
 								            如果无法解析JSON或达到最大尝试次数，则返回None。
-												refactor: Update response format and enhance documentation

- Updated the response format to include file paths in filename keys
- Added docstrings to chat_completion functions for better clarity

											
										
										
											2023-12-08 11:08:36 +08:00
+								    """
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
+								    for _1 in range(3):
-												fix: Update chat_completion_stream function names

- Update function names in openai.py
- Modify function import in __init__.py
- Update function call in openai.py

											
										
										
											2024-01-03 11:08:38 +08:00
+								        response = chat_completion_stream(messages, llm_config)
-												fix: Improve error handling for context overflows

- Refactor error output for token limit issues to ensure clarity
- Update the error handling strategy to unify exception responses
- Remove redundant error handling blocks for streamlining

											
										
										
											2024-01-24 17:34:27 +08:00
+								        if not response["content"]:
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
+								            return None
 								        try:
-												refactor: Update LLM configs and add markdown flag removal

- Updated model version in various LLM configs to 'gpt-3.5-turbo-1106'
- Added '_try_remove_markdown_block_flag' function in openai.py

											
										
										
											2023-12-08 10:55:48 +08:00
+								            # json will format as ```json ... ``` in 1106 model
 								            response_content = _try_remove_markdown_block_flag(response["content"])
 								            response_obj = json.loads(response_content)
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
+								            return response_obj
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								        except json.JSONDecodeError:
-												Add log_info function to ide_services.services.py

											
										
										
											2023-12-20 21:13:05 +08:00
+								            log_warn(f"JSONDecodeError: {response['content']}")
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
+								            continue
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								        except Exception as err:
 								            if error_out:
-												reformat

											
										
										
											2023-12-14 11:01:04 +08:00
+								                print("Exception: ", err, file=sys.stderr, flush=True)
-												update openai to 1.0

											
										
										
											2023-12-13 14:18:08 +08:00
+								            return None
-												feat: Integrate LLM API and UI utility functions

- Added new LLM API functions for non-streaming chat completions
- Introduced UI utility functions for input/output interaction
- Implemented multi-select and single-select UI components

											
										
										
											2023-12-08 10:37:32 +08:00
+								    if error_out:
 								        print("Not valid json response:", response["content"], file=sys.stderr, flush=True)
 								    return None