local-llm-server/other/local-llm-server.service

[Unit]
Description=Local LLM Proxy Server

# Hard dependency: the proxy is only useful while the daemon unit is running.
Requires=local-llm-daemon.service
Wants=basic.target

# Ordering only (one entry per line; After= accumulates across assignments).
After=basic.target
After=network.target
After=local-llm-daemon.service

[Service]
# Run as the "server" user from the project directory.
User=server
WorkingDirectory=/srv/server/local-llm-server

# Sometimes the old processes aren't terminated when the service is restarted,
# so force-kill any leftover gunicorn processes before starting new ones.
# The leading "-" makes systemd ignore a non-zero exit status: pkill exits
# with status 1 when nothing matched, which would otherwise fail every start
# on which there are no stale processes to clean up.
ExecStartPre=-/usr/bin/pkill -9 -f "/srv/server/local-llm-server/venv/bin/python3 /srv/server/local-llm-server/venv/bin/gunicorn"

# TODO: make sure gunicorn logs to stdout and logging also goes to stdout

# Need a lot of workers since we have long-running requests. This takes about 3.5G memory.
# Access and error logs are written to the standard streams ('-') rather than to files.
ExecStart=/srv/server/local-llm-server/venv/bin/gunicorn --workers 20 --bind 0.0.0.0:5000 server:app --timeout 60 --worker-class gevent --access-logfile '-' --error-logfile '-'

# Always bring the server back up, waiting 2 seconds between attempts.
Restart=always
RestartSec=2
# Identifier attached to this service's log lines.
SyslogIdentifier=local-llm-server

[Install]
# When enabled, the service is pulled in by multi-user.target.
WantedBy=multi-user.target
add systemctl service 2023-08-21 23:25:53 -06:00			`[Unit]`
update service 2023-12-21 13:22:47 -07:00			`Description=Local LLM Proxy Server`
add systemctl service 2023-08-21 23:25:53 -06:00			`Wants=basic.target`
update service 2023-12-21 13:22:47 -07:00			`After=basic.target network.target local-llm-daemon.service`
			`Requires=local-llm-daemon.service`
add systemctl service 2023-08-21 23:25:53 -06:00
			`[Service]`
			`User=server`
			`WorkingDirectory=/srv/server/local-llm-server`
adjust gunicorn logging and fix service 2024-01-10 15:35:29 -07:00
			`# Sometimes the old processes aren't terminated when the service is restarted.`
			`ExecStartPre=/usr/bin/pkill -9 -f "/srv/server/local-llm-server/venv/bin/python3 /srv/server/local-llm-server/venv/bin/gunicorn"`

refactor a lot of things, major cleanup, use postgresql 2024-05-07 17:03:41 -06:00			`# TODO: make sure gunicorn logs to stdout and logging also goes to stdout`

adjust gunicorn logging and fix service 2024-01-10 15:35:29 -07:00			`# Need a lot of workers since we have long-running requests. This takes about 3.5G memory.`
			`ExecStart=/srv/server/local-llm-server/venv/bin/gunicorn --workers 20 --bind 0.0.0.0:5000 server:app --timeout 60 --worker-class gevent --access-logfile '-' --error-logfile '-'`

add systemctl service 2023-08-21 23:25:53 -06:00			`Restart=always`
			`RestartSec=2`
update service 2023-12-21 13:22:47 -07:00			`SyslogIdentifier=local-llm-server`
add systemctl service 2023-08-21 23:25:53 -06:00
			`[Install]`
			`WantedBy=multi-user.target`
ready for public release 2024-03-18 12:42:44 -06:00