#!/bin/bash
# entrypoint.sh
#
# Starts the Aphrodite Engine API server by running the
# aphrodite.endpoints.api_server_kobold module, listening on 0.0.0.0:2242.
#
# Environment variables read by this script:
#   MODEL_NAME    (required) value passed to --model
#   NUM_GPUS      (optional) value passed to --tensor-parallel-size
#   QUANTIZATION  (optional) value passed to --quantization
#   DATATYPE      (optional) value passed to --dtype
#
# An optional variable that is unset or empty causes its flag to be omitted,
# so the server falls back to whatever default it defines for that option.

# -x traces every command, -e aborts on the first failing command.
# NOTE: -u is deliberately not enabled; the sourced activation script is not
# under this file's control and may reference unset variables.
set -xe

# Fail early with a readable message instead of letting "--model" consume the
# following flag as its value.
: "${MODEL_NAME:?MODEL_NAME must be set to the model to serve}"

cd /app/aphrodite-engine
source activate aphrodite-engine

echo 'Starting Aphrodite Engine API server...'

# Build the argument list as an array so each value stays a single word even
# if it contains spaces or glob characters.
server_args=(
  --host 0.0.0.0
  --port 2242
  --model "$MODEL_NAME"
)

if [[ -n "${NUM_GPUS:-}" ]]; then
  server_args+=(--tensor-parallel-size "$NUM_GPUS")
fi

if [[ -n "${QUANTIZATION:-}" ]]; then
  server_args+=(--quantization "$QUANTIZATION")
fi

if [[ -n "${DATATYPE:-}" ]]; then
  server_args+=(--dtype "$DATATYPE")
fi

# exec replaces this shell with the Python process, so signals delivered to
# the entrypoint (e.g. SIGTERM on shutdown) reach the server directly and its
# exit status becomes the script's exit status.
exec python -u -m aphrodite.endpoints.api_server_kobold "${server_args[@]}"