Add patch for o# models on Azure

connect #3023
Note: this depends on the user naming the deployment to match the model name (e.g. "o1" or "o3-mini").
This commit is contained in:
timothycarambat 2025-02-05 11:34:03 -08:00
parent 694aa85e43
commit a5ee6121e2

View File

@ -38,6 +38,16 @@ class AzureOpenAiLLM {
);
}
/**
* Check if the model is an o# type model.
* NOTE: This is HIGHLY dependent on if the user named their deployment "o1" or "o3-mini" or something else to match the model name.
* It cannot be determined by the model name alone since model deployments can be named arbitrarily.
* @returns {boolean}
*/
get isOTypeModel() {
return this.model.startsWith("o");
}
#log(text, ...args) {
console.log(`\x1b[32m[AzureOpenAi]\x1b[0m ${text}`, ...args);
}
@ -55,6 +65,7 @@ class AzureOpenAiLLM {
}
streamingEnabled() {
if (this.isOTypeModel && this.model !== "o3-mini") return false;
return "streamGetChatCompletion" in this;
}
@ -110,7 +121,7 @@ class AzureOpenAiLLM {
attachments = [], // This is the specific attachment for only this prompt
}) {
const prompt = {
role: "system",
role: this.isOTypeModel ? "user" : "system",
content: `${systemPrompt}${this.#appendContext(contextTexts)}`,
};
return [
@ -131,7 +142,7 @@ class AzureOpenAiLLM {
const result = await LLMPerformanceMonitor.measureAsyncFunction(
this.openai.getChatCompletions(this.model, messages, {
temperature,
...(this.isOTypeModel ? {} : { temperature }),
})
);
@ -161,7 +172,7 @@ class AzureOpenAiLLM {
const measuredStreamRequest = await LLMPerformanceMonitor.measureStream(
await this.openai.streamChatCompletions(this.model, messages, {
temperature,
...(this.isOTypeModel ? {} : { temperature }),
n: 1,
}),
messages