22 lines
604 B
Python
22 lines
604 B
Python
import time
|
|
from datetime import datetime
|
|
|
|
from flask import jsonify
|
|
|
|
from llm_server import opts
|
|
from . import bp
|
|
from .. import stats
|
|
from llm_server.routes.v1.generate import concurrent_semaphore
|
|
from ..cache import cache
|
|
|
|
|
|
@bp.route('/stats', methods=['GET'])
@cache.cached(timeout=60, query_string=True)
def get_stats():
    """Return a JSON snapshot of server usage counters with HTTP 200.

    The response body contains four integer-valued fields:

    * ``proompters_now`` -- ``opts.concurrent_generates`` minus the
      semaphore's current counter (presumably the number of generations
      in flight right now; confirm against the generate route).
    * ``total_proompts`` -- the current ``stats.proompts.value``.
    * ``uptime`` -- whole seconds elapsed since ``stats.start_time``.
    * ``timestamp`` -- the current Unix time in whole seconds.

    The view is wrapped in ``cache.cached(timeout=60, query_string=True)``,
    so a served response may be a stored one rather than freshly computed
    (NOTE(review): exact caching semantics depend on the ``cache`` object
    imported from ``..cache`` -- confirm).
    """
    # NOTE(review): `_value` is a private attribute of the semaphore object;
    # it is read here because no public accessor is visible in this module.
    active_generations = opts.concurrent_generates - concurrent_semaphore._value
    prompt_total = stats.proompts.value

    # Uptime is derived from a naive local-time "now"; this assumes
    # stats.start_time is also a naive datetime -- TODO confirm.
    elapsed = datetime.now() - stats.start_time
    uptime_seconds = int(elapsed.total_seconds())

    unix_now = int(time.time())

    payload = {
        'proompters_now': active_generations,
        'total_proompts': prompt_total,
        'uptime': uptime_seconds,
        'timestamp': unix_now,
    }
    return jsonify(payload), 200
|