diff --git a/llm_server/routes/v1/proxy.py b/llm_server/routes/v1/proxy.py index 445aeb7..d2346b5 100644 --- a/llm_server/routes/v1/proxy.py +++ b/llm_server/routes/v1/proxy.py @@ -6,6 +6,7 @@ from flask import jsonify, request from llm_server import opts from . import bp from .. import stats +from ..cache import cache from ..queue import priority_queue from ..stats import SemaphoreCheckerThread, calculate_avg_gen_time from ...llm.info import get_running_model