local-llm-server/llm_server/routes/v1/proxy.py

26 lines
696 B
Python
Raw Normal View History

from flask import jsonify
2023-08-21 21:28:52 -06:00
from llm_server.custom_redis import flask_cache
2023-08-21 21:28:52 -06:00
from . import bp
2023-08-23 23:11:12 -06:00
from .generate_stats import generate_stats
from ..auth import requires_auth
2024-01-10 15:01:26 -07:00
from ...cluster.cluster_config import get_backends, cluster_config
from ...helpers import jsonify_pretty
2023-08-21 21:28:52 -06:00
@bp.route('/stats', methods=['GET'])
@flask_cache.cached(timeout=5, query_string=True)
def get_stats():
    """Handle GET /stats.

    Builds the statistics payload with ``generate_stats()`` and hands it to
    ``jsonify_pretty`` to produce the response. The view is wrapped in
    ``flask_cache.cached`` with ``timeout=5`` and ``query_string=True``.
    """
    # NOTE(review): presumably the cache key varies with the query string and
    # entries expire after 5 seconds -- confirm against flask_cache's backend.
    stats_payload = generate_stats()
    return jsonify_pretty(stats_payload)
@bp.route('/backends', methods=['GET'])
@requires_auth
def get_backend():
    """Handle GET /backends (guarded by ``requires_auth``).

    Looks up every backend reported by ``get_backends()`` -- the online ones
    first, then the offline ones -- through ``cluster_config.get_backend`` and
    returns them as a JSON object keyed by each entry's ``'hash'`` value,
    together with HTTP status 200.
    """
    online_backends, offline_backends = get_backends()
    # Lazy lookup keeps the fetch-then-index order of a plain loop; if two
    # entries share a hash, the later one wins.
    backend_entries = (
        cluster_config.get_backend(backend)
        for backend in online_backends + offline_backends
    )
    backends_by_hash = {entry['hash']: entry for entry in backend_entries}
    return jsonify(backends_by_hash), 200