hexabot/nlu/main.py

# from typing import Union
import asyncio
import os
from typing import Annotated, Union
from fastapi.responses import JSONResponse
import boilerplate as tfbp
from fastapi import Depends, FastAPI, HTTPException, status
from pydantic import BaseModel
import logging

# Set up logging configuration
logging.basicConfig(level=logging.DEBUG, format='%(asctime)s - %(levelname)s - %(message)s')

AUTH_TOKEN = os.getenv("AUTH_TOKEN", "TOKEN_MUST_BE_DEFINED")

AVAILABLE_LANGUAGES = os.getenv("AVAILABLE_LANGUAGES", "en,fr").split(',')
TFLC_REPO_ID = os.getenv("TFLC_REPO_ID")
JISF_REPO_ID = os.getenv("JISF_REPO_ID")


def load_language_classifier():
    # Init language classifier model
    Model = tfbp.get_model("tflc")
    kwargs = {}
    model = Model("", method="predict", repo_id=TFLC_REPO_ID, **kwargs)
    model.load_model()
    logging.info(f'Successfully loaded the language classifier model')
    return model


def load_intent_classifiers():
    Model = tfbp.get_model("jisf")
    models = {}
    for language in AVAILABLE_LANGUAGES:
        kwargs = {}
        models[language] = Model(save_dir=language, method="predict", repo_id=JISF_REPO_ID, **kwargs)
        models[language].load_model()
        logging.info(f'Successfully loaded the intent classifier {language} model')
    return models


def load_models():
    app.language_classifier = load_language_classifier()  # type: ignore
    app.intent_classifiers = load_intent_classifiers()  # type: ignore

app = FastAPI()


def authenticate(
    token: str
):
    if token != AUTH_TOKEN:
        raise HTTPException(
            status_code=status.HTTP_401_UNAUTHORIZED,
            detail="Unauthorized access",
        )
    return True


class ParseInput(BaseModel):
    q: str
    project: Union[str, None] = None


@app.on_event("startup")
async def startup_event():
    asyncio.create_task(asyncio.to_thread(load_models))


@app.get("/health", status_code=200,)
async def check_health():
    return "Startup checked"


@app.post("/parse")
def parse(input: ParseInput, is_authenticated: Annotated[str, Depends(authenticate)]):
    if not hasattr(app, 'language_classifier') or not hasattr(app, 'intent_classifiers'):
        headers = {"Retry-After": "120"}  # Suggest retrying after 2 minutes
        return JSONResponse(status_code=status.HTTP_503_SERVICE_UNAVAILABLE, content={"message": "Models are loading, please retry later."}, headers=headers)
    
    language = app.language_classifier.get_prediction(input.q)  # type: ignore
    lang = language.get("value")
    prediction = app.intent_classifiers[lang].get_prediction(
        input.q)  # type: ignore
    prediction.get("entities").append(language)
    return prediction
feat: initial commit 2024-09-10 09:50:11 +00:00			`# from typing import Union`
			`import asyncio`
			`import os`
			`from typing import Annotated, Union`
			`from fastapi.responses import JSONResponse`
			`import boilerplate as tfbp`
			`from fastapi import Depends, FastAPI, HTTPException, status`
			`from pydantic import BaseModel`
			`import logging`

			`# Set up logging configuration`
			`logging.basicConfig(level=logging.DEBUG, format='%(asctime)s - %(levelname)s - %(message)s')`

			`AUTH_TOKEN = os.getenv("AUTH_TOKEN", "TOKEN_MUST_BE_DEFINED")`

			`AVAILABLE_LANGUAGES = os.getenv("AVAILABLE_LANGUAGES", "en,fr").split(',')`
			`TFLC_REPO_ID = os.getenv("TFLC_REPO_ID")`
			`JISF_REPO_ID = os.getenv("JISF_REPO_ID")`


			`def load_language_classifier():`
			`# Init language classifier model`
			`Model = tfbp.get_model("tflc")`
			`kwargs = {}`
			`model = Model("", method="predict", repo_id=TFLC_REPO_ID, **kwargs)`
			`model.load_model()`
			`logging.info(f'Successfully loaded the language classifier model')`
			`return model`


			`def load_intent_classifiers():`
			`Model = tfbp.get_model("jisf")`
			`models = {}`
			`for language in AVAILABLE_LANGUAGES:`
			`kwargs = {}`
			`models[language] = Model(save_dir=language, method="predict", repo_id=JISF_REPO_ID, **kwargs)`
			`models[language].load_model()`
			`logging.info(f'Successfully loaded the intent classifier {language} model')`
			`return models`


			`def load_models():`
			`app.language_classifier = load_language_classifier() # type: ignore`
			`app.intent_classifiers = load_intent_classifiers() # type: ignore`

			`app = FastAPI()`


			`def authenticate(`
			`token: str`
			`):`
			`if token != AUTH_TOKEN:`
			`raise HTTPException(`
			`status_code=status.HTTP_401_UNAUTHORIZED,`
			`detail="Unauthorized access",`
			`)`
			`return True`


			`class ParseInput(BaseModel):`
			`q: str`
			`project: Union[str, None] = None`


			`@app.on_event("startup")`
			`async def startup_event():`
			`asyncio.create_task(asyncio.to_thread(load_models))`


			`@app.get("/health", status_code=200,)`
			`async def check_health():`
			`return "Startup checked"`


			`@app.post("/parse")`
			`def parse(input: ParseInput, is_authenticated: Annotated[str, Depends(authenticate)]):`
			`if not hasattr(app, 'language_classifier') or not hasattr(app, 'intent_classifiers'):`
			`headers = {"Retry-After": "120"} # Suggest retrying after 2 minutes`
			`return JSONResponse(status_code=status.HTTP_503_SERVICE_UNAVAILABLE, content={"message": "Models are loading, please retry later."}, headers=headers)`

			`language = app.language_classifier.get_prediction(input.q) # type: ignore`
			`lang = language.get("value")`
			`prediction = app.intent_classifiers[lang].get_prediction(`
			`input.q) # type: ignore`
			`prediction.get("entities").append(language)`
			`return prediction`