# 2022-10-18 07:19:03 -06:00
# Install the server by running the `install` target of the makefile in server/.
# $(MAKE) is used instead of a literal `make` so flags such as -j and -n are
# forwarded to the sub-make.
.PHONY: install-server
install-server:
	cd server && $(MAKE) install
# 2022-10-18 07:19:03 -06:00
# 2023-06-08 06:51:52 -06:00
# Build and install the custom kernels in server/custom_kernels, but only when
# the environment variable BUILD_EXTENSIONS is exactly "True"; otherwise print
# a notice and succeed without building anything.
# `$$` passes a literal `$` to the shell so the shell (not make) expands the
# variable at run time.
.PHONY: install-custom-kernels
install-custom-kernels:
	if [ "$$BUILD_EXTENSIONS" = "True" ]; then \
		cd server/custom_kernels && python setup.py install; \
	else \
		echo "Custom kernels are disabled, you need to set the BUILD_EXTENSIONS environment variable to 'True' in order to build them. (Please read the docs, kernels might not work on all hardware)"; \
	fi
# 2023-05-15 15:36:30 -06:00
# Install what the integration tests need: the requirements listed in
# integration-tests/requirements.txt, then the package in clients/python.
# Each recipe line runs in its own shell, so every `cd` is chained with `&&`.
.PHONY: install-integration-tests
install-integration-tests:
	cd integration-tests && pip install -r requirements.txt
	cd clients/python && pip install .
# 2023-05-15 15:36:30 -06:00
# 2022-10-18 07:19:03 -06:00
# Build and install the crate located in router/ with `cargo install`.
.PHONY: install-router
install-router:
	cd router && cargo install --path .
# Build and install the crate located in launcher/ with `cargo install`.
.PHONY: install-launcher
install-launcher:
	cd launcher && cargo install --path .
# 2023-03-30 07:26:27 -06:00
# Build and install the crate located in benchmark/ with `cargo install`.
.PHONY: install-benchmark
install-benchmark:
	cd benchmark && cargo install --path .
# 2023-06-08 06:51:52 -06:00
# Aggregate target: installs the server, router, launcher and custom kernels.
# It has no recipe of its own; all work happens in the prerequisites.
.PHONY: install
install: install-server install-router install-launcher install-custom-kernels
# 2022-10-22 12:00:15 -06:00
# Run the `run-dev` target of the makefile in server/.
# $(MAKE) forwards the parent make's flags to the sub-make.
.PHONY: server-dev
server-dev:
	cd server && $(MAKE) run-dev
# Run the crate in router/ from source with `cargo run`.
# Everything after `--` is handed to the program itself, here `--port 8080`.
.PHONY: router-dev
router-dev:
	cd router && cargo run -- --port 8080
# 2022-10-18 07:19:03 -06:00
# 2023-05-15 15:36:30 -06:00
# Run `cargo test` from the directory containing this makefile, after the
# router and launcher have been installed.
.PHONY: rust-tests
rust-tests: install-router install-launcher
	cargo test
# 2023-05-15 15:36:30 -06:00
# Run the pytest suite under integration-tests/, deselecting tests marked
# "private". Test dependencies are installed first via the prerequisite.
# The target is declared phony because its name is also the path passed to
# pytest, so it must never be mistaken for an up-to-date file or directory.
.PHONY: integration-tests
integration-tests: install-integration-tests
	pytest -s -vv -m "not private" integration-tests
# Run the pytest suite under integration-tests/ with `--snapshot-update`.
# Unlike `integration-tests`, no `-m "not private"` filter is applied here.
.PHONY: update-integration-tests
update-integration-tests: install-integration-tests
	pytest -s -vv --snapshot-update integration-tests
# 2023-04-27 11:16:35 -06:00
# Run the pytest suite in server/tests, deselecting tests marked "private".
# HF_HUB_ENABLE_HF_TRANSFER=1 is set in the environment of this pytest process
# only; there must be no spaces around `=`, or the shell would treat the
# variable name as a command.
.PHONY: python-server-tests
python-server-tests:
	HF_HUB_ENABLE_HF_TRANSFER=1 pytest -s -vv -m "not private" server/tests
# 2023-04-27 11:16:35 -06:00
# Run the pytest suite in clients/python/tests.
.PHONY: python-client-tests
python-client-tests:
	pytest clients/python/tests
# Aggregate target: runs both the server and the client Python test suites.
# It has no recipe of its own.
.PHONY: python-tests
python-tests: python-server-tests python-client-tests
# 2023-02-03 04:43:37 -07:00
# 2022-10-18 07:19:03 -06:00
# Start text-generation-launcher for model id bigscience/bloom-560m with
# --num-shard 2 on port 8080.
.PHONY: run-bloom-560m
run-bloom-560m:
	text-generation-launcher --model-id bigscience/bloom-560m --num-shard 2 --port 8080
# 2022-10-18 07:19:03 -06:00
# 2022-10-27 06:25:29 -06:00
# Same launch as `run-bloom-560m` (bigscience/bloom-560m, --num-shard 2,
# port 8080) with the additional --quantize flag.
.PHONY: run-bloom-560m-quantize
run-bloom-560m-quantize:
	text-generation-launcher --model-id bigscience/bloom-560m --num-shard 2 --quantize --port 8080
# 2022-10-27 06:25:29 -06:00
# Run `text-generation-server download-weights` for bigscience/bloom.
# HF_HUB_ENABLE_HF_TRANSFER=1 is set for this one command only; there must be
# no spaces around `=`, or the shell would treat the variable name as a command.
.PHONY: download-bloom
download-bloom:
	HF_HUB_ENABLE_HF_TRANSFER=1 text-generation-server download-weights bigscience/bloom
# 2022-10-27 06:25:29 -06:00
# 2022-10-18 07:19:03 -06:00
# Start text-generation-launcher for model id bigscience/bloom with
# --num-shard 8 on port 8080.
.PHONY: run-bloom
run-bloom:
	text-generation-launcher --model-id bigscience/bloom --num-shard 8 --port 8080
# 2022-10-27 06:25:29 -06:00
# Same launch as `run-bloom` (bigscience/bloom, --num-shard 8, port 8080)
# with the additional --quantize flag.
.PHONY: run-bloom-quantize
run-bloom-quantize:
	text-generation-launcher --model-id bigscience/bloom --num-shard 8 --quantize --port 8080