openai-compat-endpoint

Public
Forked from will-lms/openai-compat-endpoint
Plugin
Revisions
Back
Project Files
src
config.ts
constants.ts
generator.ts
index.ts
manifest.json
package-lock.json
package.json
README.md
tsconfig.json
tsconfig.tsbuildinfo
src / generator.ts
// src/generator.ts
import { configSchematics, globalConfigSchematics } from "./config";
import { type Chat, type GeneratorController, type InferParsedConfig } from "@lmstudio/sdk";
import OpenAI from "openai";
import {
  type ChatCompletionMessageParam,
  type ChatCompletionMessageToolCall,
  type ChatCompletionTool,
  type ChatCompletionToolMessageParam,
} from "openai/resources/index";
import { FREE_MODELS } from "./constants";

/* -------------------------------------------------------------------------- */
/*                              Global Vars                                   */
/* -------------------------------------------------------------------------- */

const MAX_REQUESTS = 25;

// before 1st using of function
function getFormattedTime(): string {
  const now = new Date();
  const dateStr = now.toLocaleDateString('ru-RU');
  const timeStr = now.toLocaleTimeString('ru-RU', { hour12: false });
  return `${dateStr}, ${timeStr.split(':').slice(0, 2).join(':')} (UTC+3)`;
}

/* -------------------------------------------------------------------------- */
/*                                   Types                                    */
/* -------------------------------------------------------------------------- */

type ToolCallState = {
  id: string;
  name: string | null;
  index: number;
  arguments: string;
};

/* -------------------------------------------------------------------------- */
/*                               Build helpers                                */
/* -------------------------------------------------------------------------- */

function createOpenAI(globalConfig: any) {  //  any instead of typed
  const baseURL = globalConfig?.get("baseUrl") || "https://openrouter.ai/api/v1"; 
  const apiKey = globalConfig?.get("apiKey"); 
  return new OpenAI({
    apiKey,
    baseURL
  });
}

/** Convert internal chat history to the format expected by OpenAI. */

function toOpenAIMessages(history: Chat): ChatCompletionMessageParam[] {
  const messages: ChatCompletionMessageParam[] = [];

  for (const message of history) {
    switch (message.getRole()) {
      case "system":
        messages.push({ role: "system", content: message.getText() });
        break;

      case "user":
        messages.push({ role: "user", content: message.getText() });
        break;

      case "assistant": {
        const toolCalls: ChatCompletionMessageToolCall[] = message
          .getToolCallRequests()
          .map(toolCall => ({
            id: toolCall.id ?? "",
            type: "function",
            function: {
              name: toolCall.name,
              arguments: JSON.stringify(toolCall.arguments ?? {}),
            },
          }));

        messages.push({
          role: "assistant",
          content: message.getText(),
          ...(toolCalls.length ? { tool_calls: toolCalls } : {}),
        });
        break;
      }

      case "tool": {
        message.getToolCallResults().forEach(toolCallResult => {
          messages.push({
            role: "tool",
            tool_call_id: toolCallResult.toolCallId ?? "",
            content: toolCallResult.content,
          } as ChatCompletionToolMessageParam);
        });
        break;
      }
    }
  }

  return messages;
}

/** Convert LM Studio tool definitions to OpenAI function-tool descriptors. */
function toOpenAITools(ctl: GeneratorController): ChatCompletionTool[] | undefined {
  const tools = ctl.getToolDefinitions().map<ChatCompletionTool>(t => ({
    type: "function",
    function: {
      name: t.function.name,
      description: t.function.description,
      parameters: t.function.parameters ?? {},
    },
  }));
  return tools.length ? tools : undefined;
}

/* -------------------------------------------------------------------------- */
/*                            Stream-handling utils                           */
/* -------------------------------------------------------------------------- */

function wireAbort(ctl: GeneratorController, stream: { controller: AbortController }) {
  ctl.onAborted(() => {
    console.info("Generation aborted by user.");
    stream.controller.abort();
  });
}

async function consumeStream(stream: AsyncIterable<any>, ctl: GeneratorController) {
  let current: ToolCallState | null = null;

  function maybeFlushCurrentToolCall() {
    if (current === null || current.name === null) {
      return;
    }
    ctl.toolCallGenerationEnded({
      type: "function",
      name: current.name,
      arguments: JSON.parse(current.arguments),
      id: current.id,
    });
    current = null;
  }

  for await (const chunk of stream) {
    //console.info("Received chunk:", JSON.stringify(chunk));            //DEBUG in LOG - not my
    const delta = chunk.choices?.[0]?.delta as
      | {
          content?: string;
          tool_calls?: Array<{
            index: number;
            id?: string;
            function?: { name?: string; arguments?: string };
          }>;
        }
      | undefined;

    if (!delta) continue;

    /* Text streaming */
    if (delta.content) {
      ctl.fragmentGenerated(delta.content);
    }

    /* Tool-call streaming */
    for (const toolCall of delta.tool_calls ?? []) {
      if (toolCall.id !== undefined) {
        maybeFlushCurrentToolCall();
        current = { id: toolCall.id, name: null, index: toolCall.index, arguments: "" };
        ctl.toolCallGenerationStarted();
      }

      if (toolCall.function?.name && current) {
        current.name = toolCall.function.name;
        ctl.toolCallGenerationNameReceived(toolCall.function.name);
      }

      if (toolCall.function?.arguments && current) {
        current.arguments += toolCall.function.arguments;
        ctl.toolCallGenerationArgumentFragmentGenerated(toolCall.function.arguments);
      }
    }

    /* Finalize tool call */
    if (chunk.choices?.[0]?.finish_reason === "tool_calls" && current?.name) {
      maybeFlushCurrentToolCall();
    }
  }

  console.info("Generation completed.");
}

/* -------------------------------------------------------------------------- */
/*                                     API                                    */
/* -------------------------------------------------------------------------- */

export async function generate(ctl: GeneratorController, history: Chat) {
 console.log(`[DEBUG] [ENTER] generate() PID=${Math.random().toString(36).slice(-4)}`);
  const config = ctl.getPluginConfig(configSchematics as any) as any;
  const globalConfig = ctl.getGlobalPluginConfig(globalConfigSchematics as any) as any;

// +++ STATELESS COUNTER: parse from chat history
let requestCounter = 1;
const allMessages = Array.from(history);
//console.log('History length:', allMessages.length);  // DEBUG

for (let i = allMessages.length - 1; i >= 0; i--) {
  const msg = allMessages[i];
  if (msg.getRole() === "assistant") {
    const content = msg.getText();
    if (content) {
      const match = content.match(/✅ Request #(\d+)/);
      if (match) {
        requestCounter = parseInt(match[1], 10) + 1;
        break;
      }
    }
  }
}
// +++ 3.12.2025

console.log('[PLUGIN] History length:', Array.from(history).length);
const lastMsg = Array.from(history).slice(-1)[0];
if (lastMsg) console.log('[PLUGIN] Last role:', lastMsg.getRole(), 'preview:', lastMsg.getText()?.substring(0, 50));
console.log('[PLUGIN] Parsed counter:', requestCounter);
// +++ END DEBUG



  const apiKey = globalConfig.get("apiKey");      // string
  const baseUrl = globalConfig.get("baseUrl");    // string
  let model = config.get("model");                // "auto", "x-ai/grok 4.1-", "qwen/qwen-turbo" etc

  model = model || FREE_MODELS[1];  // Grok 4.1 free - fallback hardcoded

  if (model === "auto" || !model || model === "placeholder/free-model") {
    model = FREE_MODELS[1];      // Grok 4.1 free
  }

  console.info("Using fallback free model:", model);
  
  model = model.trim();

  const openai = createOpenAI(globalConfig);
  const messages = toOpenAIMessages(history);
  const tools = toOpenAITools(ctl);

 const timeStr = getFormattedTime();

try {
  const stream = await openai.chat.completions.create({
    model,
    messages,
    tools,
    stream: true
  });

  wireAbort(ctl, stream);
  await consumeStream(stream, ctl);

  // post-generation status 
  const timeStr = getFormattedTime();
  ctl.fragmentGenerated(`\n✅ Request #${requestCounter}/${MAX_REQUESTS} at ${timeStr}\n`);

} catch (error: unknown) {
  let msg = "❌ Generation failed.";
  if (typeof error === "object" && error !== null) {
    if ("status" in error && (error as any).status === 429) {
      msg = `❌ 429 Rate Limit Exceeded. You've used ${requestCounter}/${MAX_REQUESTS} free requests. Try again later or add your own API key.`;
      console.log('[PLUGIN] API key Limit exceeded/ Error: ', (error as any).status);
    } else if ("message" in error && typeof (error as any).message === "string") {
      const message = (error as any).message;
      if (message.includes("API Key")) {
        msg = "❌ Invalid or missing API key.";
      } else {
        msg = `❌ API error: ${message}`;
      }
    }
  }

  ctl.fragmentGenerated(`${msg}\n`);

  return;
}

}
//end.