fix wrong datatype
This commit is contained in:
parent
b3f0c4b28f
commit
3ec9b2347f
|
@ -102,8 +102,12 @@ def openai_chat_completions(model_name=None):
|
||||||
pubsub = redis.pubsub()
|
pubsub = redis.pubsub()
|
||||||
pubsub.subscribe(event_id)
|
pubsub.subscribe(event_id)
|
||||||
for item in pubsub.listen():
|
for item in pubsub.listen():
|
||||||
if item['type'] == 'message' and item['data'].decode('utf-8') == 'begin':
|
if item['type'] == 'message':
|
||||||
break
|
msg = item['data'].decode('utf-8')
|
||||||
|
if msg == 'begin':
|
||||||
|
break
|
||||||
|
elif msg == 'offline':
|
||||||
|
return return_invalid_model_err(handler.request_json_body['model'])
|
||||||
time.sleep(0.1)
|
time.sleep(0.1)
|
||||||
|
|
||||||
# Double check the model is still online
|
# Double check the model is still online
|
||||||
|
|
|
@ -127,8 +127,12 @@ def openai_completions(model_name=None):
|
||||||
pubsub = redis.pubsub()
|
pubsub = redis.pubsub()
|
||||||
pubsub.subscribe(event_id)
|
pubsub.subscribe(event_id)
|
||||||
for item in pubsub.listen():
|
for item in pubsub.listen():
|
||||||
if item['type'] == 'message' and item['data'].decode('utf-8') == 'begin':
|
if item['type'] == 'message':
|
||||||
break
|
msg = item['data'].decode('utf-8')
|
||||||
|
if msg == 'begin':
|
||||||
|
break
|
||||||
|
elif msg == 'offline':
|
||||||
|
return return_invalid_model_err(handler.request_json_body['model'])
|
||||||
time.sleep(0.1)
|
time.sleep(0.1)
|
||||||
|
|
||||||
# Double check the model is still online
|
# Double check the model is still online
|
||||||
|
|
|
@ -143,8 +143,12 @@ def do_stream(ws, model_name):
|
||||||
pubsub = redis.pubsub()
|
pubsub = redis.pubsub()
|
||||||
pubsub.subscribe(event_id)
|
pubsub.subscribe(event_id)
|
||||||
for item in pubsub.listen():
|
for item in pubsub.listen():
|
||||||
if item['type'] == 'message' and item['data'].decode('utf-8') == 'begin':
|
if item['type'] == 'message':
|
||||||
break
|
msg = item['data'].decode('utf-8')
|
||||||
|
if msg == 'begin':
|
||||||
|
break
|
||||||
|
elif msg == 'offline':
|
||||||
|
return messages.BACKEND_OFFLINE, 404 # TODO: format this error
|
||||||
time.sleep(0.1)
|
time.sleep(0.1)
|
||||||
|
|
||||||
# Double check the model is still online
|
# Double check the model is still online
|
||||||
|
|
|
@ -2,7 +2,6 @@ import threading
|
||||||
import time
|
import time
|
||||||
import traceback
|
import traceback
|
||||||
|
|
||||||
from llm_server import messages
|
|
||||||
from llm_server.cluster.cluster_config import cluster_config
|
from llm_server.cluster.cluster_config import cluster_config
|
||||||
from llm_server.custom_redis import redis
|
from llm_server.custom_redis import redis
|
||||||
from llm_server.llm.generator import generator
|
from llm_server.llm.generator import generator
|
||||||
|
@ -14,10 +13,11 @@ def worker(backend_url):
|
||||||
while True:
|
while True:
|
||||||
(request_json_body, client_ip, token, parameters), event_id, selected_model = queue.get()
|
(request_json_body, client_ip, token, parameters), event_id, selected_model = queue.get()
|
||||||
backend_info = cluster_config.get_backend(backend_url)
|
backend_info = cluster_config.get_backend(backend_url)
|
||||||
|
pubsub = redis.pubsub()
|
||||||
|
pubsub.subscribe(event_id)
|
||||||
|
|
||||||
if not backend_info['online']:
|
if not backend_info['online']:
|
||||||
event = DataEvent(event_id)
|
redis.publish(event_id, 'offline')
|
||||||
event.set((False, None, messages.BACKEND_OFFLINE))
|
|
||||||
return
|
return
|
||||||
|
|
||||||
if not selected_model:
|
if not selected_model:
|
||||||
|
@ -34,8 +34,6 @@ def worker(backend_url):
|
||||||
# is finished. Since a lot of ratelimiting and stats are
|
# is finished. Since a lot of ratelimiting and stats are
|
||||||
# based off the number of active workers, we must keep
|
# based off the number of active workers, we must keep
|
||||||
# the generation based off the workers.
|
# the generation based off the workers.
|
||||||
pubsub = redis.pubsub()
|
|
||||||
pubsub.subscribe(event_id)
|
|
||||||
redis.publish(event_id, 'begin')
|
redis.publish(event_id, 'begin')
|
||||||
for item in pubsub.listen():
|
for item in pubsub.listen():
|
||||||
if item['type'] == 'message' and item['data'].decode('utf-8') == 'finished':
|
if item['type'] == 'message' and item['data'].decode('utf-8') == 'finished':
|
||||||
|
|
Reference in New Issue