mirror of
https://github.com/open-webui/pipelines
synced 2025-05-13 17:10:45 +00:00
Added caching and optimization for Markdown table translation
This commit is contained in:
parent
8d3bc097e3
commit
539cbe1a4a
@ -8,13 +8,15 @@ description: This pipeline integrates Google Translate for automatic translation
|
|||||||
without requiring an API key. It supports multilingual communication by translating based on specified source
|
without requiring an API key. It supports multilingual communication by translating based on specified source
|
||||||
and target languages.
|
and target languages.
|
||||||
"""
|
"""
|
||||||
|
import re
|
||||||
from typing import List, Optional
|
from typing import List, Optional
|
||||||
from schemas import OpenAIChatMessage
|
from schemas import OpenAIChatMessage
|
||||||
from pydantic import BaseModel
|
from pydantic import BaseModel
|
||||||
import requests
|
import requests
|
||||||
import os
|
import os
|
||||||
import time
|
import time
|
||||||
|
import asyncio
|
||||||
|
from functools import lru_cache
|
||||||
|
|
||||||
from utils.pipelines.main import get_last_user_message, get_last_assistant_message
|
from utils.pipelines.main import get_last_user_message, get_last_assistant_message
|
||||||
|
|
||||||
@ -25,36 +27,33 @@ class Pipeline:
|
|||||||
source_user: Optional[str] = "auto"
|
source_user: Optional[str] = "auto"
|
||||||
target_user: Optional[str] = "en"
|
target_user: Optional[str] = "en"
|
||||||
source_assistant: Optional[str] = "en"
|
source_assistant: Optional[str] = "en"
|
||||||
target_assistant: Optional[str] = "uk"
|
target_assistant: Optional[str] = "es"
|
||||||
|
|
||||||
def __init__(self):
|
def __init__(self):
|
||||||
# Initialize the pipeline type and name
|
|
||||||
self.type = "filter"
|
self.type = "filter"
|
||||||
self.name = "Google Translate Filter"
|
self.name = "Google Translate Filter"
|
||||||
|
|
||||||
# Initialize Valves with default values
|
|
||||||
self.valves = self.Valves(
|
self.valves = self.Valves(
|
||||||
**{
|
**{
|
||||||
"pipelines": ["*"],
|
"pipelines": ["*"],
|
||||||
}
|
}
|
||||||
)
|
)
|
||||||
|
|
||||||
|
# Initialize translation cache
|
||||||
|
self.translation_cache = {}
|
||||||
|
|
||||||
async def on_startup(self):
|
async def on_startup(self):
|
||||||
# Function called when the server is started
|
|
||||||
print(f"on_startup:{__name__}")
|
print(f"on_startup:{__name__}")
|
||||||
pass
|
pass
|
||||||
|
|
||||||
async def on_shutdown(self):
|
async def on_shutdown(self):
|
||||||
# Function called when the server is stopped
|
|
||||||
print(f"on_shutdown:{__name__}")
|
print(f"on_shutdown:{__name__}")
|
||||||
pass
|
pass
|
||||||
|
|
||||||
async def on_valves_updated(self):
|
async def on_valves_updated(self):
|
||||||
# Function called when the valves are updated
|
|
||||||
pass
|
pass
|
||||||
|
|
||||||
|
@lru_cache(maxsize=128) # LRU cache to store translation results
|
||||||
def translate(self, text: str, source: str, target: str) -> str:
|
def translate(self, text: str, source: str, target: str) -> str:
|
||||||
# Function to translate text using Google Translate
|
|
||||||
url = "https://translate.googleapis.com/translate_a/single"
|
url = "https://translate.googleapis.com/translate_a/single"
|
||||||
params = {
|
params = {
|
||||||
"client": "gtx",
|
"client": "gtx",
|
||||||
@ -65,26 +64,29 @@ class Pipeline:
|
|||||||
}
|
}
|
||||||
|
|
||||||
try:
|
try:
|
||||||
# Make a GET request to Google Translate API
|
|
||||||
r = requests.get(url, params=params)
|
r = requests.get(url, params=params)
|
||||||
r.raise_for_status() # Raise an exception for bad status codes
|
r.raise_for_status()
|
||||||
|
|
||||||
# Parse the JSON response
|
|
||||||
result = r.json()
|
result = r.json()
|
||||||
translated_text = ''.join([sentence[0] for sentence in result[0]]) # Combine all translated sentences into one string
|
translated_text = ''.join([sentence[0] for sentence in result[0]])
|
||||||
return translated_text
|
return translated_text
|
||||||
except requests.exceptions.RequestException as e:
|
except requests.exceptions.RequestException as e:
|
||||||
# Handle network errors, retrying after a short pause
|
|
||||||
print(f"Network error: {e}")
|
print(f"Network error: {e}")
|
||||||
time.sleep(1) # Pause before retrying
|
time.sleep(1)
|
||||||
return self.translate(text, source, target) # Retry translation
|
return self.translate(text, source, target)
|
||||||
except Exception as e:
|
except Exception as e:
|
||||||
# Handle other exceptions
|
|
||||||
print(f"Error translating text: {e}")
|
print(f"Error translating text: {e}")
|
||||||
return text # Return original text in case of error
|
return text
|
||||||
|
|
||||||
|
def split_text_around_table(self, text: str) -> List[str]:
|
||||||
|
table_regex = r'((?:^.*?\|.*?\n)+)(?=\n[^\|\s].*?\|)'
|
||||||
|
matches = re.split(table_regex, text, flags=re.MULTILINE)
|
||||||
|
|
||||||
|
if len(matches) > 1:
|
||||||
|
return [matches[0], matches[1]]
|
||||||
|
else:
|
||||||
|
return [text, ""]
|
||||||
|
|
||||||
async def inlet(self, body: dict, user: Optional[dict] = None) -> dict:
|
async def inlet(self, body: dict, user: Optional[dict] = None) -> dict:
|
||||||
# Function to process incoming messages from the user
|
|
||||||
print(f"inlet:{__name__}")
|
print(f"inlet:{__name__}")
|
||||||
|
|
||||||
messages = body["messages"]
|
messages = body["messages"]
|
||||||
@ -92,16 +94,23 @@ class Pipeline:
|
|||||||
|
|
||||||
print(f"User message: {user_message}")
|
print(f"User message: {user_message}")
|
||||||
|
|
||||||
# Translate user message
|
parts = self.split_text_around_table(user_message)
|
||||||
translated_user_message = self.translate(
|
text_before_table, table_text = parts
|
||||||
user_message,
|
|
||||||
self.valves.source_user,
|
# Check translation cache for text before table
|
||||||
self.valves.target_user,
|
translated_before_table = self.translation_cache.get(text_before_table)
|
||||||
)
|
if translated_before_table is None:
|
||||||
|
translated_before_table = self.translate(
|
||||||
|
text_before_table,
|
||||||
|
self.valves.source_user,
|
||||||
|
self.valves.target_user,
|
||||||
|
)
|
||||||
|
self.translation_cache[text_before_table] = translated_before_table
|
||||||
|
|
||||||
|
translated_user_message = translated_before_table + table_text
|
||||||
|
|
||||||
print(f"Translated user message: {translated_user_message}")
|
print(f"Translated user message: {translated_user_message}")
|
||||||
|
|
||||||
# Update the translated message in the messages list
|
|
||||||
for message in reversed(messages):
|
for message in reversed(messages):
|
||||||
if message["role"] == "user":
|
if message["role"] == "user":
|
||||||
message["content"] = translated_user_message
|
message["content"] = translated_user_message
|
||||||
@ -111,7 +120,6 @@ class Pipeline:
|
|||||||
return body
|
return body
|
||||||
|
|
||||||
async def outlet(self, body: dict, user: Optional[dict] = None) -> dict:
|
async def outlet(self, body: dict, user: Optional[dict] = None) -> dict:
|
||||||
# Function to process outgoing messages from the assistant
|
|
||||||
print(f"outlet:{__name__}")
|
print(f"outlet:{__name__}")
|
||||||
|
|
||||||
messages = body["messages"]
|
messages = body["messages"]
|
||||||
@ -119,16 +127,23 @@ class Pipeline:
|
|||||||
|
|
||||||
print(f"Assistant message: {assistant_message}")
|
print(f"Assistant message: {assistant_message}")
|
||||||
|
|
||||||
# Translate assistant message
|
parts = self.split_text_around_table(assistant_message)
|
||||||
translated_assistant_message = self.translate(
|
text_before_table, table_text = parts
|
||||||
assistant_message,
|
|
||||||
self.valves.source_assistant,
|
# Check translation cache for text before table
|
||||||
self.valves.target_assistant,
|
translated_before_table = self.translation_cache.get(text_before_table)
|
||||||
)
|
if translated_before_table is None:
|
||||||
|
translated_before_table = self.translate(
|
||||||
|
text_before_table,
|
||||||
|
self.valves.source_assistant,
|
||||||
|
self.valves.target_assistant,
|
||||||
|
)
|
||||||
|
self.translation_cache[text_before_table] = translated_before_table
|
||||||
|
|
||||||
|
translated_assistant_message = translated_before_table + table_text
|
||||||
|
|
||||||
print(f"Translated assistant message: {translated_assistant_message}")
|
print(f"Translated assistant message: {translated_assistant_message}")
|
||||||
|
|
||||||
# Update the translated message in the messages list
|
|
||||||
for message in reversed(messages):
|
for message in reversed(messages):
|
||||||
if message["role"] == "assistant":
|
if message["role"] == "assistant":
|
||||||
message["content"] = translated_assistant_message
|
message["content"] = translated_assistant_message
|
||||||
|
Loading…
Reference in New Issue
Block a user