Merge pull request #277 from marcklingen/fix-langfuse-filter

fix: langfuse filter pipeline cost tracking
This commit is contained in:
Timothy Jaeryang Baek 2024-09-27 20:05:12 +02:00 committed by GitHub
commit c1dd8987d4
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194

View File

@@ -1,23 +1,28 @@
""" """
title: Langfuse Filter Pipeline title: Langfuse Filter Pipeline
author: open-webui author: open-webui
date: 2024-05-30 date: 2024-09-27
version: 1.3 version: 1.4
license: MIT license: MIT
description: A filter pipeline that uses Langfuse. description: A filter pipeline that uses Langfuse.
requirements: langfuse requirements: langfuse
""" """
from typing import List, Optional from typing import List, Optional
from schemas import OpenAIChatMessage
import os import os
import uuid import uuid
from utils.pipelines.main import get_last_user_message, get_last_assistant_message from utils.pipelines.main import get_last_assistant_message
from pydantic import BaseModel from pydantic import BaseModel
from langfuse import Langfuse from langfuse import Langfuse
from langfuse.api.resources.commons.errors.unauthorized_error import UnauthorizedError from langfuse.api.resources.commons.errors.unauthorized_error import UnauthorizedError
def get_last_assistant_message_obj(messages: List[dict]) -> dict:
    """Return the most recent message with role "assistant", or {} if none exists.

    Scans the conversation from newest to oldest and yields the full message
    dict (not just its content), so callers can read extra fields like "info".
    """
    return next(
        (msg for msg in reversed(messages) if msg["role"] == "assistant"),
        {},
    )
class Pipeline: class Pipeline:
class Valves(BaseModel): class Valves(BaseModel):
@@ -109,21 +114,28 @@ class Pipeline:
async def outlet(self, body: dict, user: Optional[dict] = None) -> dict: async def outlet(self, body: dict, user: Optional[dict] = None) -> dict:
print(f"outlet:{__name__}") print(f"outlet:{__name__}")
print(f"Received body: {body}")
if body["chat_id"] not in self.chat_generations: if body["chat_id"] not in self.chat_generations:
return body return body
generation = self.chat_generations[body["chat_id"]] generation = self.chat_generations[body["chat_id"]]
assistant_message = get_last_assistant_message(body["messages"]) assistant_message = get_last_assistant_message(body["messages"])
# Extract usage information
info = assistant_message.get("info", {}) # Extract usage information for models that support it
usage = None usage = None
if "prompt_tokens" in info and "completion_tokens" in info: assistant_message_obj = get_last_assistant_message_obj(body["messages"])
usage = { if assistant_message_obj:
"input": info["prompt_tokens"], info = assistant_message_obj.get("info", {})
"output": info["completion_tokens"], if isinstance(info, dict):
"unit": "TOKENS", input_tokens = info.get("prompt_eval_count") or info.get("prompt_tokens")
} output_tokens = info.get("eval_count") or info.get("completion_tokens")
if input_tokens is not None and output_tokens is not None:
usage = {
"input": input_tokens,
"output": output_tokens,
"unit": "TOKENS",
}
# Update generation # Update generation
generation.end( generation.end(