local-llm-server/llm_server/routes/v1/proxy.py

22 lines
604 B
Python

import time
from datetime import datetime
from flask import jsonify
from llm_server import opts
from . import bp
from .. import stats
from llm_server.routes.v1.generate import concurrent_semaphore
from ..cache import cache
@bp.route('/stats', methods=['GET'])
@cache.cached(timeout=60, query_string=True)
def get_stats():
    """Return a JSON snapshot of the server's usage counters.

    The payload carries four integer-valued fields:

    * ``proompters_now`` -- ``opts.concurrent_generates`` minus the
      semaphore's current internal counter.
    * ``total_proompts`` -- the current ``stats.proompts.value``.
    * ``uptime`` -- whole seconds elapsed since ``stats.start_time``.
    * ``timestamp`` -- the current Unix time, truncated to an int.

    The view is wrapped in ``cache.cached(timeout=60, query_string=True)``,
    so a served response (including ``timestamp``) may be a cached one
    rather than freshly computed.

    Returns:
        A ``(response, status)`` tuple: the JSON response and ``200``.
    """
    # NOTE(review): ``_value`` is a private attribute of the semaphore;
    # presumably it holds the number of free slots -- confirm against the
    # semaphore type defined in ``generate``.
    active_generations = opts.concurrent_generates - concurrent_semaphore._value
    lifetime_total = stats.proompts.value

    # ``datetime.now()`` is naive here, so ``stats.start_time`` is assumed
    # to be naive as well -- TODO confirm.
    elapsed = datetime.now() - stats.start_time
    uptime_seconds = int(elapsed.total_seconds())

    unix_now = int(time.time())

    payload = {
        'proompters_now': active_generations,
        'total_proompts': lifetime_total,
        'uptime': uptime_seconds,
        'timestamp': unix_now,
    }
    return jsonify(payload), 200