Timothy J. Baek 2024-05-21 19:45:02 -07:00
parent ee4544d4f9
commit c37d3f726b
7 changed files with 89 additions and 74 deletions

main.py
View File

@@ -5,7 +5,7 @@ from fastapi.concurrency import run_in_threadpool
 from starlette.responses import StreamingResponse, Response
 from pydantic import BaseModel, ConfigDict
-from typing import List, Union, Generator
+from typing import List, Union, Generator, Iterator
 import time
@@ -132,77 +132,88 @@ async def generate_openai_chat_completion(form_data: OpenAIChatCompletionForm):
             res = get_response(
                 user_message,
                 messages=form_data.messages,
-                body=form_data.model_dump_json(),
+                body=form_data.model_dump(),
             )

             print(f"stream:true:{res}")

-            if isinstance(res, str):
-                message = stream_message_template(form_data.model, res)
-                print(f"stream_content:str:{message}")
-                yield f"data: {json.dumps(message)}\n\n"
+            if isinstance(res, Iterator):
+                for line in res:
+                    if line:
+                        # Decode the JSON data
+                        decoded_line = line.decode("utf-8")
+                        print(f"stream_content:Iterator:{decoded_line}")
+                        yield f"{decoded_line}\n\n"
+            else:
+                if isinstance(res, str):
+                    message = stream_message_template(form_data.model, res)
+                    print(f"stream_content:str:{message}")
+                    yield f"data: {json.dumps(message)}\n\n"

-            elif isinstance(res, Generator):
-                for message in res:
-                    print(f"stream_content:Generator:{message}")
-                    message = stream_message_template(form_data.model, message)
-                    yield f"data: {json.dumps(message)}\n\n"
+                elif isinstance(res, Generator):
+                    for message in res:
+                        print(f"stream_content:Generator:{message}")
+                        message = stream_message_template(form_data.model, message)
+                        yield f"data: {json.dumps(message)}\n\n"

-            finish_message = {
-                "id": f"{form_data.model}-{str(uuid.uuid4())}",
-                "object": "chat.completion.chunk",
-                "created": int(time.time()),
-                "model": form_data.model,
-                "choices": [
-                    {
-                        "index": 0,
-                        "delta": {},
-                        "logprobs": None,
-                        "finish_reason": "stop",
-                    }
-                ],
-            }
+                finish_message = {
+                    "id": f"{form_data.model}-{str(uuid.uuid4())}",
+                    "object": "chat.completion.chunk",
+                    "created": int(time.time()),
+                    "model": form_data.model,
+                    "choices": [
+                        {
+                            "index": 0,
+                            "delta": {},
+                            "logprobs": None,
+                            "finish_reason": "stop",
+                        }
+                    ],
+                }

-            yield f"data: {json.dumps(finish_message)}\n\n"
-            yield f"data: [DONE]"
+                yield f"data: {json.dumps(finish_message)}\n\n"
+                yield f"data: [DONE]"

         return StreamingResponse(stream_content(), media_type="text/event-stream")
     else:
         res = get_response(
             user_message,
             messages=form_data.messages,
-            body=form_data.model_dump_json(),
+            body=form_data.model_dump(),
         )
+        print(f"stream:false:{res}")

-        message = ""
-        if isinstance(res, str):
-            message = res
+        if isinstance(res, dict):
+            return res
+        else:
+            message = ""

-        elif isinstance(res, Generator):
-            for stream in res:
-                message = f"{message}{stream}"
+            if isinstance(res, str):
+                message = res

-        print(f"stream:false:{message}")
-        return {
-            "id": f"{form_data.model}-{str(uuid.uuid4())}",
-            "object": "chat.completion",
-            "created": int(time.time()),
-            "model": form_data.model,
-            "choices": [
-                {
-                    "index": 0,
-                    "message": {
-                        "role": "assistant",
-                        "content": message,
-                    },
-                    "logprobs": None,
-                    "finish_reason": "stop",
-                }
-            ],
-        }
+            elif isinstance(res, Generator):
+                for stream in res:
+                    message = f"{message}{stream}"
+
+            print(f"stream:false:{message}")
+            return {
+                "id": f"{form_data.model}-{str(uuid.uuid4())}",
+                "object": "chat.completion",
+                "created": int(time.time()),
+                "model": form_data.model,
+                "choices": [
+                    {
+                        "index": 0,
+                        "message": {
+                            "role": "assistant",
+                            "content": message,
+                        },
+                        "logprobs": None,
+                        "finish_reason": "stop",
+                    }
+                ],
+            }

     return await run_in_threadpool(job)
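
Note on the reworked handler above: it now dispatches on the pipeline's return type, forwarding raw byte lines untouched and wrapping plain strings itself. The self-contained sketch below mirrors that dispatch; fake_sse_lines and demo_stream are hypothetical stand-ins, not code from this commit (in main.py the Iterator branch is fed by something like requests.Response.iter_lines()). One subtlety: Python generators are themselves iterators, so a Generator return value also matches isinstance(res, Iterator) and takes the passthrough branch.

import json
from typing import Generator, Iterator, Union

def fake_sse_lines() -> Iterator[bytes]:
    # Stand-in for the byte lines of an upstream SSE response.
    yield b'data: {"choices": [{"delta": {"content": "Hi"}}]}'
    yield b"data: [DONE]"

def demo_stream(res: Union[str, Generator, Iterator]):
    if isinstance(res, Iterator):
        # Upstream byte lines are assumed to be SSE-formatted already,
        # so they are decoded and passed through verbatim.
        for line in res:
            if line:
                yield f"{line.decode('utf-8')}\n\n"
    else:
        # A plain string still has to be wrapped in an OpenAI-style chunk;
        # main.py does this with stream_message_template plus a final
        # finish_message, simplified here to a bare JSON payload.
        if isinstance(res, str):
            yield f"data: {json.dumps({'content': res})}\n\n"
        yield "data: [DONE]\n\n"

for frame in demo_stream(fake_sse_lines()):
    print(frame, end="")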

View File

@@ -80,7 +80,7 @@ class Pipeline:
     def get_response(
         self, user_message: str, messages: List[OpenAIChatMessage], body: dict
-    ) -> Union[str, Generator]:
+    ) -> Union[str, Generator, Iterator]:
         # This is where you can add your custom RAG pipeline.
         # Typically, you would retrieve relevant information from your knowledge base and synthesize it to generate a response.
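
The same one-line widening of the return annotation recurs in each example pipeline touched by this commit: a pipeline may now return an iterator of raw byte lines in addition to a string or a generator of strings. A hypothetical minimal pipeline (not one of the changed files) showing what the widened contract permits:

from typing import Generator, Iterator, List, Union

class EchoPipeline:
    # Hypothetical example; the real pipelines type messages as
    # List[OpenAIChatMessage] from schemas.
    def get_response(
        self, user_message: str, messages: List[dict], body: dict
    ) -> Union[str, Generator, Iterator]:
        if body.get("stream"):
            # An iterator of bytes: main.py decodes and forwards each line.
            return iter([b'data: {"demo": true}', b"data: [DONE]"])
        # A plain string: main.py wraps it into a chat.completion response.
        return f"echo: {user_message}"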

View File

@@ -71,7 +71,7 @@ class Pipeline:
     def get_response(
         self, user_message: str, messages: List[OpenAIChatMessage], body: dict
-    ) -> Union[str, Generator]:
+    ) -> Union[str, Generator, Iterator]:
         # This is where you can add your custom RAG pipeline.
         # Typically, you would retrieve relevant information from your knowledge base and synthesize it to generate a response.

View File

@@ -31,7 +31,7 @@ class Pipeline:
     def get_response(
         self, user_message: str, messages: List[OpenAIChatMessage], body: dict
-    ) -> Union[str, Generator]:
+    ) -> Union[str, Generator, Iterator]:
         # This is where you can add your custom RAG pipeline.
         # Typically, you would retrieve relevant information from your knowledge base and synthesize it to generate a response.

View File

@@ -26,7 +26,7 @@ class Pipeline:
     def get_response(
         self, user_message: str, messages: List[OpenAIChatMessage], body: dict
-    ) -> Union[str, Generator]:
+    ) -> Union[str, Generator, Iterator]:
         # This is where you can add your custom RAG pipeline.
         # Typically, you would retrieve relevant information from your knowledge base and synthesize it to generate a response.

View File

@@ -1,4 +1,4 @@
-from typing import List, Union, Generator
+from typing import List, Union, Generator, Iterator
 from schemas import OpenAIChatMessage
 import requests
@@ -19,31 +19,35 @@ class Pipeline:
     def get_response(
         self, user_message: str, messages: List[OpenAIChatMessage], body: dict
-    ) -> Union[str, Generator]:
+    ) -> Union[str, Generator, Iterator]:
         # This is where you can add your custom pipelines like RAG.'
         print(f"get_response:{__name__}")

         print(messages)
         print(user_message)

-        OPENAI_API_KEY = "your-api-key-here"
+        OPENAI_API_KEY = "your-openai-api-key-here"
         headers = {}
         headers["Authorization"] = f"Bearer {OPENAI_API_KEY}"
         headers["Content-Type"] = "application/json"

-        r = requests.request(
-            method="POST",
-            url="https://api.openai.com/v1",
-            data=body,
-            headers=headers,
-            stream=True,
-        )
-
-        r.raise_for_status()
-
-        # Check if response is SSE
-        if "text/event-stream" in r.headers.get("Content-Type", ""):
-            return r.iter_content(chunk_size=8192)
-        else:
-            response_data = r.json()
-            return f"{response_data['choices'][0]['text']}"
+        data = {**body, "model": "gpt-3.5-turbo"}
+
+        print(data)
+
+        try:
+            r = requests.post(
+                url="https://api.openai.com/v1/chat/completions",
+                json={**body, "model": "gpt-3.5-turbo"},
+                headers=headers,
+                stream=True,
+            )
+
+            r.raise_for_status()
+
+            if data["stream"]:
+                return r.iter_lines()
+            else:
+                return r.json()
+        except Exception as e:
+            return f"Error: {e}"
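
Two caveats on the rewritten request above: data["stream"] raises KeyError when a client omits the stream flag (data.get("stream") would tolerate that), and the broad except folds any failure into an error string that is then returned like a normal completion. A hedged sketch of the same flow in isolation, with the API key and model as placeholders:

import requests

def call_openai(body: dict, api_key: str = "your-openai-api-key-here"):
    # Sketch only, mirroring the pipeline above outside the class.
    headers = {
        "Authorization": f"Bearer {api_key}",
        "Content-Type": "application/json",
    }
    data = {**body, "model": "gpt-3.5-turbo"}
    try:
        r = requests.post(
            "https://api.openai.com/v1/chat/completions",
            json=data,
            headers=headers,
            stream=True,
        )
        r.raise_for_status()
        if data.get("stream"):
            # Raw SSE byte lines; main.py's Iterator branch forwards these.
            return r.iter_lines()
        # Parsed chat.completion dict; main.py returns it directly.
        return r.json()
    except Exception as e:
        return f"Error: {e}"

# Usage sketch, assuming the request succeeds: a streaming call yields raw SSE lines.
for line in call_openai({"stream": True, "messages": [{"role": "user", "content": "Hi"}]}):
    if line:
        print(line.decode("utf-8"))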

View File

@@ -18,7 +18,7 @@ class Pipeline:
     def get_response(
         self, user_message: str, messages: List[OpenAIChatMessage], body: dict
-    ) -> Union[str, Generator]:
+    ) -> Union[str, Generator, Iterator]:
         # This is where you can add your custom pipelines like RAG.'
         print(f"get_response:{__name__}")