xinference / entrypoint.sh
zhengr's picture
Update entrypoint.sh
7dba9f7 verified
raw
history blame
220 Bytes
#!/bin/bash
# Entrypoint: start the Xinference server, then launch the default model on it.
#
# xinference-local keeps running in the foreground until it is stopped, so it
# is started as a background job here; run in the foreground, the launch
# command below would never be reached while the server is alive.
set -uo pipefail

echo "Starting server"
xinference-local -H 0.0.0.0 &
server_pid=$!

# Forward termination signals to the server so stopping this script (e.g. as
# the main process of a container) also stops the server.
trap 'kill -TERM "$server_pid" 2>/dev/null' TERM INT

# Wait until the server accepts client requests. `xinference list` needs a
# reachable server, so it is used as a readiness probe. Give up if the server
# process dies before it becomes reachable.
until xinference list >/dev/null 2>&1; do
  if ! kill -0 "$server_pid" 2>/dev/null; then
    echo "xinference-local exited before becoming ready" >&2
    exit 1
  fi
  sleep 1
done

# Launch the model. On failure, report it but keep the server running so it
# can still be inspected and models can be launched manually.
if ! xinference launch --model-engine llama.cpp --model-name llama-3-instruct --size-in-billions 8 --model-format ggufv2 --quantization Q4_K_M; then
  echo "Model launch failed; server is still running" >&2
fi

# Keep the script alive for as long as the server runs and exit with its
# status. A trapped signal interrupts the first wait, so wait again to reap
# the server after it has been told to terminate.
wait "$server_pid"
server_status=$?
if kill -0 "$server_pid" 2>/dev/null; then
  wait "$server_pid"
  server_status=$?
fi
exit "$server_status"