2023-08-21 21:28:52 -06:00
|
|
|
import time
|
|
|
|
|
2023-08-23 16:40:20 -06:00
|
|
|
from flask import jsonify, request
|
2023-08-21 21:28:52 -06:00
|
|
|
|
|
|
|
from . import bp
|
2023-09-24 15:54:35 -06:00
|
|
|
from ..auth import requires_auth
|
2023-09-28 18:40:24 -06:00
|
|
|
from llm_server.custom_redis import flask_cache
|
2023-09-12 10:30:45 -06:00
|
|
|
from ... import opts
|
2023-08-22 19:58:31 -06:00
|
|
|
from ...llm.info import get_running_model
|
2023-08-21 21:28:52 -06:00
|
|
|
|
|
|
|
|
|
|
|
# @bp.route('/info', methods=['GET'])
|
|
|
|
# # @cache.cached(timeout=3600, query_string=True)
|
|
|
|
# def get_info():
|
|
|
|
# # requests.get()
|
|
|
|
# return 'yes'
|
|
|
|
|
|
|
|
|
|
|
|
@bp.route('/model', methods=['GET'])
def get_model():
    """Report the name of the model the backend is currently running.

    Caching is handled manually rather than through a caching decorator
    because a "backend is down" response must not be cached. Successful
    responses are stored for 60 seconds under a key derived from the
    request URL.

    Returns:
        A ``(response, status)`` tuple. On success the JSON body carries
        ``result`` (``opts.manual_model_name`` when it is set, otherwise
        the name reported by ``get_running_model``) and ``timestamp``
        with status 200. On failure the JSON body carries ``code``,
        ``msg`` and ``type`` (the class name of the returned error) with
        status 500.
    """
    key = 'model_cache::' + request.url
    hit = flask_cache.get(key)
    if hit:
        return hit

    model_name, error = get_running_model()
    if model_name:
        payload = jsonify({
            'result': opts.manual_model_name or model_name,
            'timestamp': int(time.time())
        })
        response = payload, 200
        # Only the success path is cached, so a failure is re-checked on
        # the very next request.
        flask_cache.set(key, response, timeout=60)
        return response

    # The body reports 502, but the HTTP status is 500 so Cloudflare
    # doesn't intercept us (it also won't cache 500 errors).
    return jsonify({
        'code': 502,
        'msg': 'failed to reach backend',
        'type': error.__class__.__name__
    }), 500
|
2023-09-24 15:54:35 -06:00
|
|
|
|
|
|
|
|
|
|
|
@bp.route('/backend', methods=['GET'])
@requires_auth
def get_backend():
    """Return the configured backend URL and mode as JSON.

    The route is wrapped in ``requires_auth``. The values are read
    straight from ``opts.backend_url`` and ``opts.mode`` and sent back
    with status 200.
    """
    backend_info = {'backend': opts.backend_url, 'mode': opts.mode}
    return jsonify(backend_info), 200
|