This repository has been archived on 2024-10-27. You can view files and clone it, but cannot push or open issues or pull requests.
2023-08-21 23:25:53 -06:00
|
|
|
# Unit metadata and start-up ordering for the local LLM proxy service.
[Unit]
# Human-readable name shown in systemctl/journal output.
Description=Local LLM Proxy
# Weak dependency: pull in basic.target, but do not fail if it cannot start.
Wants=basic.target
# Ordering only: start after basic system initialisation and after the
# network stack has been set up.
After=basic.target network.target
|
|
|
|
|
|
|
|
# How the proxy process is launched and supervised.
[Service]
# Run the process as the "server" user and group.
User=server
Group=server
# Start gunicorn from the project checkout.
# NOTE(review): presumably required so that "server:app" is importable - confirm.
WorkingDirectory=/srv/server/local-llm-server

# Need a lot of workers since we have long-running requests.
# Takes about 3.5G memory.
# gunicorn from the project's virtualenv: 20 gevent workers, listening on
# port 5000 on all interfaces, with a 60-second worker timeout.
ExecStart=/srv/server/local-llm-server/venv/bin/gunicorn \
    --workers 20 \
    --bind 0.0.0.0:5000 \
    server:app \
    --timeout 60 \
    --worker-class gevent

# Always bring the service back up when it exits, waiting 2 seconds
# between attempts.
Restart=always
RestartSec=2
|
|
|
|
|
|
|
|
# Installation hints used by "systemctl enable".
[Install]
# Enabling the unit hooks it into multi-user.target, so it is started as
# part of the normal multi-user boot.
WantedBy=multi-user.target
|