Merge pull request #547 from devchat-ai/add_debug_config_for_code_completions

Refactor LLM Code for Completion Endpoint and Performance Optimization
2024-06-04 13:28:26 +08:00 · 2024-06-04 13:28:26 +08:00 · 91aa2a3e65
commit 91aa2a3e65
parent a05caa9f31 a05e6caee1
2 changed files with 29 additions and 1 deletion
--- a/src/contributes/codecomplete/llm.ts
+++ b/src/contributes/codecomplete/llm.ts
@@ -186,13 +186,19 @@ export async function * ollamaDeepseekComplete(prompt: string) : AsyncGenerator<

 export async function * devchatComplete(prompt: string) : AsyncGenerator<CodeCompletionChunk> {
    const devchatEndpoint = DevChatConfig.getInstance().get("providers.devchat.api_base");
-    const completionApiBase = devchatEndpoint + "/completions";
+    const llmApiBase = DevChatConfig.getInstance().get("complete_api_base");
+    let completionApiBase = devchatEndpoint + "/completions";
+    if (llmApiBase) {
+        completionApiBase = llmApiBase + "/completions";
+    }

    let model = DevChatConfig.getInstance().get("complete_model");
    if (!model) {
        model = "ollama/starcoder2:15b";
    }

+    const startTimeLLM = process.hrtime();
+
 	const headers = {
 	    'Content-Type': 'application/json'
 	};
@@ -217,7 +223,19 @@ export async function * devchatComplete(prompt: string) : AsyncGenerator<CodeCom
            const stream = response.body as any;
            const decoder = new TextDecoder("utf-8");

+            const endTimeLLM = process.hrtime(startTimeLLM);
+            const durationLLM = endTimeLLM[0] + endTimeLLM[1] / 1e9;
+            logger.channel()?.debug(`LLM api post took ${durationLLM} seconds`);
+
+            let hasFirstLine = false;
+            let hasFirstChunk = false;
            for await (const chunk of stream) {
+                if (!hasFirstChunk) {
+                    hasFirstChunk = true;
+                    const endTimeFirstChunk = process.hrtime(startTimeLLM);
+                    const durationFirstChunk = endTimeFirstChunk[0] + endTimeFirstChunk[1] / 1e9;
+                    logger.channel()?.debug(`LLM first chunk took ${durationFirstChunk} seconds`);
+                }
                const chunkDataText = decoder.decode(chunk).trim();
                // split chunkText by "data: ", for example:
                // data: 123 data: 456 will split to ["", "data: 123 ", "data: 456"]
@@ -245,6 +263,12 @@ export async function * devchatComplete(prompt: string) : AsyncGenerator<CodeCom

                    try {
                        const data = JSON.parse(chunkText.substring(5).trim());
+                        if (!hasFirstLine && data.choices[0].text.indexOf("\n") !== -1) {
+                            hasFirstLine = true;
+                            const endTimeLine = process.hrtime(startTimeLLM);
+                            const durationLine = endTimeLine[0] + endTimeLine[1] / 1e9;
+                            logger.channel()?.debug(`LLM first line took ${durationLine} seconds`);
+                        }
                        yield {
                            text: data.choices[0].text,
                            id: data.id
--- a/src/contributes/codecomplete/promptCreator.ts
+++ b/src/contributes/codecomplete/promptCreator.ts
@@ -677,6 +677,10 @@ export async function createPrompt(filePath: string, fileContent: string, line:
    }
    if (completeModel.indexOf("deepseek") > -1) {
        prompt = "<｜fim▁begin｜>" + taskDescriptionContextWithCommentPrefix + neighborFileContext + recentEditContext + symbolContext + callDefContext + similarBlockContext + gitDiffContext + `${commentPrefix}<filename>${filePath}\n\n` + prefix + "<｜fim▁hole｜>" + suffix + "<｜fim▁end｜>";
+    } else if (completeModel.indexOf("starcoder") > -1) {
+        prompt = "<fim_prefix>" + taskDescriptionContextWithCommentPrefix + neighborFileContext + recentEditContext + symbolContext + callDefContext + similarBlockContext + gitDiffContext + `${commentPrefix}<filename>${filePath}\n\n` + prefix + "<fim_suffix>" + suffix + "<fim_middle>";
+    } else if (completeModel.indexOf("codestral") > -1) {
+        prompt = "<s>[SUFFIX]" + suffix + "[PREFIX]" + taskDescriptionContextWithCommentPrefix + neighborFileContext + recentEditContext + symbolContext + callDefContext + similarBlockContext + gitDiffContext + `${commentPrefix}<filename>${filePath}\n\n` + prefix;
    } else {
        prompt = "<fim_prefix>" + taskDescriptionContextWithCommentPrefix + neighborFileContext + recentEditContext + symbolContext + callDefContext + similarBlockContext + gitDiffContext + `${commentPrefix}<filename>${filePath}\n\n` + prefix + "<fim_suffix>" + suffix + "<fim_middle>";
    }