Implement support for generic OpenAI api (#213)

* Implement support for generic OpenAI api

- Implements support for routing requests to any OpenAI-compatible provider (DeepSeek, Qwen, vLLM, LM Studio, Ollama).
- Keeps support for pure OpenAI and uses the new better responses api
- Uses the /chat/completions api for the generic providers
- If uri_base is not set, uses default implementation.

* Fix json handling and indentation

* Fix linter error indent

* Fix tests to set env vars

* Fix updating settings

* Change to prefix checking for OAI models

* FIX check model if custom uri is set

* Change chat to sync calls

Some local models don't support streaming. Revert to sync calls for the generic OpenAI API.

* Fix tests

* Fix tests

* Fix for gpt5 message extraction

- Finds the message output by filtering for "type" == "message" instead of assuming it's at index 0
- Safely extracts the text using safe navigation operators (&.)
- Raises a clear error if no message content is found
- Parses the JSON as before

* Add more langfuse logging

- Add Langfuse to auto categorizer and merchant detector
- Fix monitoring on streaming chat responses
- Add Langfuse traces also for model errors now

* Update app/models/provider/openai.rb

Co-authored-by: coderabbitai[bot] <136622811+coderabbitai[bot]@users.noreply.github.com>
Signed-off-by: soky srm <sokysrm@gmail.com>

* handle nil function results explicitly

* Exposing some config vars.

* Linter and nitpick comments

* Drop back to `gpt-4.1` as default for now

* Linter

* Fix for strict tool schema in Gemini

- This fixes tool calling in Gemini OpenAI api
- Fix for getTransactions function, page size is not used.

---------

Signed-off-by: soky srm <sokysrm@gmail.com>
Co-authored-by: coderabbitai[bot] <136622811+coderabbitai[bot]@users.noreply.github.com>
Co-authored-by: Juan José Mata <juanjo.mata@gmail.com>
This commit is contained in:
soky srm
2025-10-22 16:02:50 +02:00
committed by GitHub
parent ea7ce13a7d
commit 8cd109a5b2
24 changed files with 875 additions and 195 deletions

View File

@@ -1,31 +1,19 @@
class Provider::Openai::AutoCategorizer
DEFAULT_MODEL = "gpt-4.1-mini"
# Builds a categorizer bound to an OpenAI-compatible client.
#
# client          - API client used to issue the categorization request.
# model           - model name; falls back to the provider default when blank.
# transactions    - transactions to categorize.
# user_categories - the user's category list the model must choose from.
# custom_provider - true when routing to a generic OpenAI-compatible API
#                   (/chat/completions) instead of the native /responses API.
# langfuse_trace  - optional Langfuse trace used to record spans; may be nil.
def initialize(client, model: "", transactions: [], user_categories: [], custom_provider: false, langfuse_trace: nil)
  @client = client
  @model = model
  @transactions = transactions
  @user_categories = user_categories
  @custom_provider = custom_provider
  @langfuse_trace = langfuse_trace
end
# Routes the categorization request to the API flavor the configured client
# supports: generic OpenAI-compatible providers use /chat/completions, while
# native OpenAI uses the /responses API.
def auto_categorize
  if custom_provider
    auto_categorize_openai_generic
  else
    auto_categorize_openai_native
  end
end
def instructions
@@ -50,7 +38,75 @@ class Provider::Openai::AutoCategorizer
end
private
attr_reader :client, :model, :transactions, :user_categories
# Categorizes transactions via OpenAI's native /responses API, enforcing a
# strict JSON-schema output and recording the call as a Langfuse span.
def auto_categorize_openai_native
  selected_model = model.presence || Provider::Openai::DEFAULT_MODEL

  span = langfuse_trace&.span(name: "auto_categorize_api_call", input: {
    model: selected_model,
    transactions: transactions,
    user_categories: user_categories
  })

  api_response = client.responses.create(parameters: {
    model: selected_model,
    input: [ { role: "developer", content: developer_message } ],
    text: {
      format: {
        type: "json_schema",
        name: "auto_categorize_personal_finance_transactions",
        strict: true,
        schema: json_schema
      }
    },
    instructions: instructions
  })

  Rails.logger.info("Tokens used to auto-categorize transactions: #{api_response.dig("usage", "total_tokens")}")

  result = build_response(extract_categorizations_native(api_response))
  span&.end(output: result.map(&:to_h), usage: api_response.dig("usage"))
  result
rescue => e
  # Close the span with the failure before re-raising so errors are traced too.
  span&.end(output: { error: e.message }, level: "ERROR")
  raise
end
# Categorizes transactions through a generic OpenAI-compatible provider using
# the /chat/completions endpoint (sync call; some local models lack streaming).
# The call is recorded as a Langfuse span when a trace is present.
def auto_categorize_openai_generic
  selected_model = model.presence || Provider::Openai::DEFAULT_MODEL

  span = langfuse_trace&.span(name: "auto_categorize_api_call", input: {
    model: selected_model,
    transactions: transactions,
    user_categories: user_categories
  })

  api_response = client.chat(parameters: {
    model: selected_model,
    messages: [
      { role: "system", content: instructions },
      { role: "user", content: developer_message }
    ],
    response_format: {
      type: "json_schema",
      json_schema: {
        name: "auto_categorize_personal_finance_transactions",
        strict: true,
        schema: json_schema
      }
    }
  })

  Rails.logger.info("Tokens used to auto-categorize transactions: #{api_response.dig("usage", "total_tokens")}")

  result = build_response(extract_categorizations_generic(api_response))
  span&.end(output: result.map(&:to_h), usage: api_response.dig("usage"))
  result
rescue => e
  # Record the failure on the span before propagating the error.
  span&.end(output: { error: e.message }, level: "ERROR")
  raise
end
# Readers for the constructor-injected collaborators and settings.
attr_reader :client, :model, :transactions, :user_categories, :custom_provider, :langfuse_trace
# Result value object shared with the LLM concept layer.
AutoCategorization = Provider::LlmConcept::AutoCategorization
@@ -69,9 +125,23 @@ class Provider::Openai::AutoCategorizer
category_name
end
def extract_categorizations(response)
response_json = JSON.parse(response.dig("output")[0].dig("content")[0].dig("text"))
response_json.dig("categorizations")
# Pulls the categorization list out of a native /responses payload.
# gpt-5 style responses may include reasoning entries, so locate the output
# whose "type" is "message" rather than assuming it sits at index 0.
def extract_categorizations_native(response)
  message = response["output"]&.find { |entry| entry["type"] == "message" }
  text = message&.dig("content", 0, "text")
  raise Provider::Openai::Error, "No message content found in response" if text.nil?

  JSON.parse(text)["categorizations"]
rescue JSON::ParserError => e
  raise Provider::Openai::Error, "Invalid JSON in native categorization: #{e.message}"
end
# Pulls the categorization list out of a /chat/completions payload.
#
# Raises Provider::Openai::Error when the response carries no message content
# (mirroring the native extractor — previously JSON.parse(nil) raised an
# uncaught TypeError) or when the content is not valid JSON.
def extract_categorizations_generic(response)
  raw = response.dig("choices", 0, "message", "content")
  raise Provider::Openai::Error, "No message content found in response" if raw.nil?

  JSON.parse(raw).dig("categorizations")
rescue JSON::ParserError => e
  raise Provider::Openai::Error, "Invalid JSON in generic categorization: #{e.message}"
end
def json_schema