renamed llm package
src/llm_connector/__init__.py (new file)
@@ -0,0 +1,3 @@
from .llm import get_response, LLMBackend, LLMMessage

__all__ = ['get_response', 'LLMBackend', 'LLMMessage']
src/llm_connector/llm.py (new file)
@@ -0,0 +1,127 @@
import json
import logging
from typing import AsyncGenerator, Dict, List, Literal, TypedDict

import httpx

logger = logging.getLogger(__name__)


class LLMBackend(TypedDict):
    base_url: str
    api_token: str
    model: str


class LLMMessage(TypedDict):
    role: Literal["system", "assistant", "user"]
    content: str


async def get_response(
    backend: LLMBackend,
    messages: List[LLMMessage],
    stream: bool = False,
) -> AsyncGenerator[Dict[str, str], None]:
    try:
        # Prepare the request parameters
        request_params = {
            "model": backend["model"],
            "messages": messages,
            "stream": stream,
        }

        # Prepare headers; only send Authorization when a token is configured
        headers = {"Content-Type": "application/json"}
        if backend["api_token"]:
            headers["Authorization"] = f"Bearer {backend['api_token']}"

        # Log at debug level instead of print(); headers are omitted so the
        # bearer token does not end up in logs
        logger.debug("LLM request params: %s", request_params)

        # Create the httpx client
        async with httpx.AsyncClient(timeout=30.0) as client:
            url = f"{backend['base_url']}/chat/completions"

            if stream:
                # Stream the response as server-sent events
                async with client.stream(
                    "POST",
                    url,
                    headers=headers,
                    json=request_params,
                ) as response:
                    response.raise_for_status()

                    async for line in response.aiter_lines():
                        line = line.strip()

                        # Skip empty lines and non-data lines
                        if not line or not line.startswith("data: "):
                            continue

                        # Remove the "data: " prefix
                        data = line[6:]

                        # Check for the end-of-stream sentinel
                        if data == "[DONE]":
                            break

                        try:
                            # Parse the JSON chunk
                            chunk_data = json.loads(data)

                            if "choices" in chunk_data and chunk_data["choices"]:
                                delta = chunk_data["choices"][0].get("delta", {})

                                # Handle reasoning content (for models that support it)
                                if delta.get("reasoning_content"):
                                    yield {"reasoning": delta["reasoning_content"]}

                                # Handle regular content
                                if delta.get("content"):
                                    yield {"content": delta["content"]}

                        except json.JSONDecodeError:
                            # Skip malformed JSON chunks
                            continue
            else:
                # Non-streaming response
                response = await client.post(
                    url,
                    headers=headers,
                    json=request_params,
                )
                response.raise_for_status()

                response_data = response.json()
                content = ""

                if "choices" in response_data and response_data["choices"]:
                    message = response_data["choices"][0].get("message", {})
                    content = message.get("content", "")

                # Yield as a dictionary to match the streaming format
                if content:
                    yield {"content": content}

    except httpx.HTTPStatusError as e:
        # e.response.text is not available for streamed responses that were
        # never read, so log the status code and the exception itself
        logger.error(
            "HTTP error getting LLM response: %s - %s", e.response.status_code, e
        )
        yield {"content": ""}

    except httpx.RequestError as e:
        logger.error("Request error getting LLM response: %s", e)
        yield {"content": ""}

    except Exception as e:
        logger.error("Error getting LLM response: %s", e)
        yield {"content": ""}


async def _empty_async_generator() -> AsyncGenerator[str, None]:
    """Helper that produces an empty async generator."""
    if False:
        yield ""
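For reference, a minimal sketch (not part of the commit) of how a caller might drive the renamed package, assuming an OpenAI-compatible /chat/completions endpoint; the base_url, model, and token values below are placeholders:

import asyncio

from llm_connector import get_response, LLMBackend, LLMMessage


async def main() -> None:
    # Placeholder backend values; any OpenAI-compatible server should work
    backend: LLMBackend = {
        "base_url": "http://localhost:8000/v1",
        "api_token": "",  # empty token skips the Authorization header
        "model": "example-model",
    }
    messages = [LLMMessage(role="user", content="Hello!")]

    # get_response is an async generator; each chunk is a dict keyed by
    # 'reasoning' or 'content'
    async for chunk in get_response(backend, messages, stream=True):
        print(chunk.get("content", ""), end="", flush=True)


asyncio.run(main())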
@@ -11,7 +11,7 @@ from dotenv import load_dotenv
 
 from nicegui import ui
 
-from lib import get_response, LLMBackend, LLMMessage
+from llm_connector import get_response, LLMBackend, LLMMessage
 
 load_dotenv()
 