local-llm-server/llm_server/llm/generator.py

16 lines
559 B
Python
Raw Normal View History

2023-08-23 20:12:38 -06:00
from llm_server import opts
from llm_server.cluster.cluster_config import cluster_config
2023-08-23 20:12:38 -06:00
def generator(request_json_body, cluster_backend, timeout: int = None):
    """Dispatch a generation request to the handler for the backend's mode.

    The mode is read from the ``'mode'`` entry of the backend record that
    ``cluster_config.get_backend(cluster_backend)`` returns.

    Args:
        request_json_body: Request payload, forwarded unchanged to the
            backend-specific ``generate`` function.
        cluster_backend: Backend identifier, used both to look up the mode
            and as an argument to the backend-specific ``generate``.
        timeout: Optional timeout forwarded to the backend-specific
            ``generate``; ``None`` (the default) is passed through as-is.

    Returns:
        Whatever the selected backend's ``generate`` function returns.

    Raises:
        NotImplementedError: If the backend's mode is ``'ooba'``.
        ValueError: If the backend's mode is not a recognized value.
    """
    mode = cluster_config.get_backend(cluster_backend)['mode']

    if mode == 'vllm':
        # Imported lazily so the vLLM module is only loaded when it is used.
        from .vllm.generate import generate
        return generate(request_json_body, cluster_backend, timeout=timeout)

    if mode == 'ooba':
        # The oobabooga generate path is currently disabled in this dispatcher.
        raise NotImplementedError(
            f"Backend mode {mode!r} is not implemented (backend: {cluster_backend!r})"
        )

    # ValueError is a subclass of Exception, so existing broad handlers still
    # catch it, but the message now identifies the offending configuration.
    raise ValueError(
        f"Unknown backend mode {mode!r} for backend {cluster_backend!r}"
    )