entrypoint.sh 447 B

12345678910111213141516171819
  #!/bin/bash
  #
  # Entrypoint: starts the Aphrodite Engine Kobold endpoint API server
  # (python module aphrodite.endpoints.kobold.api_server) on 0.0.0.0:7860.
  #
  # Environment:
  #   MODEL_NAME    (required) value passed to --model
  #   NUM_GPUS      (required) value passed to --tensor-parallel-size
  #   DATATYPE      (required) value passed to --dtype
  #   QUANTIZATION  (optional) when non-empty, passed to --quantization
  #
  # -x traces every command; -e aborts on the first failing command.
  # NOTE: -u is intentionally not enabled, because the sourced `activate`
  # script is not part of this file and may read unset variables.
  set -xe

  # Fail fast with a readable message instead of launching the server with a
  # malformed command line (e.g. "--model --tensor-parallel-size ...").
  : "${MODEL_NAME:?MODEL_NAME must be set}"
  : "${NUM_GPUS:?NUM_GPUS must be set}"
  : "${DATATYPE:?DATATYPE must be set}"

  cd /app/aphrodite-engine

  # `activate` is looked up via PATH by `source`; presumably this is the
  # conda activation script for the "aphrodite-engine" env -- confirm
  # against the image build.
  source activate aphrodite-engine

  echo 'Starting Aphrodite Engine API server...'

  # Build the argv as an array so each value stays exactly one argument,
  # even if it contains spaces or glob characters.
  cmd=(
    python -u -m aphrodite.endpoints.kobold.api_server
    --host 0.0.0.0
    --port 7860
    --model "$MODEL_NAME"
    --tensor-parallel-size "$NUM_GPUS"
    --dtype "$DATATYPE"
  )

  # Quantization is optional: only add the flag when a value was provided.
  if [[ -n "${QUANTIZATION:-}" ]]; then
    cmd+=(--quantization "$QUANTIZATION")
  fi

  # Replace this shell with the server process so it receives signals directly.
  exec "${cmd[@]}"