This repository has been archived on 2024-10-27. You can view files and clone it, but cannot push or open issues or pull requests.
local-llm-server/llm_server/llm/llm_backend.py

46 lines
1.7 KiB
Python
Raw Normal View History

from typing import Tuple, Union
2023-08-30 18:53:26 -06:00
2023-09-13 11:22:33 -06:00
import flask
2023-09-14 18:31:13 -06:00
from llm_server import opts
from llm_server.llm import get_token_count
2023-09-27 14:36:49 -06:00
from llm_server.routes.cache import redis
2023-09-14 18:31:13 -06:00
2023-08-30 18:53:26 -06:00
class LLMBackend:
    """
    Base class for LLM backends.

    `handle_response`, `validate_params` and `get_parameters` raise
    `NotImplementedError` here and must be provided by subclasses.
    `validate_request` and `validate_prompt` come with default implementations.
    """

    # Declared for subclasses; no value is assigned in this base class.
    _default_params: dict

    # Number of tokens held back from `opts.context_size` when checking the prompt length.
    # NOTE(review): presumably headroom for special/generated tokens -- confirm.
    _context_size_margin: int = 10

    def handle_response(self, success, request: flask.Request, response_json_body: dict, response_status_code: int, client_ip, token, prompt, elapsed_time, parameters, headers):
        """
        Handle the response received from the backend.
        Must be implemented by the subclass.
        :raises NotImplementedError: always, in this base class.
        """
        raise NotImplementedError

    def validate_params(self, params_dict: dict) -> Tuple[bool, str | None]:
        """
        Validate the given parameters for this backend.
        Must be implemented by the subclass.
        :param params_dict: the parameters to validate.
        :return: presumably `(is_valid, error_message)`, mirroring `validate_prompt` -- confirm against subclasses.
        :raises NotImplementedError: always, in this base class.
        """
        raise NotImplementedError

    def get_parameters(self, parameters) -> Tuple[dict | None, str | None]:
        """
        Validate and return the parameters for this backend.
        Lets you set defaults for specific backends.
        Must be implemented by the subclass.
        :param parameters: the parameters supplied for the request.
        :return: presumably `(parameters, error_message)` -- confirm against subclasses.
        :raises NotImplementedError: always, in this base class.
        """
        raise NotImplementedError

    def validate_request(self, parameters: dict, prompt: str, request: flask.Request) -> Tuple[bool, str | None]:
        """
        If a backend needs to do other checks not related to the prompt or parameters.
        Default is no extra checks performed.
        :param parameters: unused by the default implementation.
        :param prompt: unused by the default implementation.
        :param request: unused by the default implementation.
        :return: always `(True, None)` in this base class.
        """
        return True, None

    def validate_prompt(self, prompt: str) -> Tuple[bool, str | None]:
        """
        Check that the prompt's token count fits within the configured context size,
        minus `_context_size_margin` tokens.
        :param prompt: the prompt text whose tokens are counted.
        :return: `(True, None)` when the prompt fits, otherwise `(False, error_message)`.
        """
        prompt_len = get_token_count(prompt)
        max_prompt_len = opts.context_size - self._context_size_margin
        if prompt_len <= max_prompt_len:
            return True, None
        model_name = redis.get('running_model', str, 'NO MODEL ERROR')
        # Report the limit that was actually enforced; printing the raw context size
        # produced false statements such as "2045 > 2048" for prompts inside the margin.
        return False, f'Token indices sequence length is longer than the specified maximum sequence length for this model ({prompt_len} > {max_prompt_len}, model: {model_name}). Please lower your context size'