12345678910111213141516171819 |
#!/bin/bash
#
# Launches the Aphrodite Engine Kobold endpoint API server
# (python module aphrodite.endpoints.kobold.api_server) on 0.0.0.0:7860.
#
# Required environment variables:
#   MODEL_NAME    value passed to --model
#   NUM_GPUS      value passed to --tensor-parallel-size
#   DATATYPE      value passed to --dtype
# Optional environment variables:
#   QUANTIZATION  when non-empty, passed to --quantization
#
# -x traces every command; -e aborts on the first failing command (so a
# failed cd or activate stops the launch). -u is intentionally not enabled:
# the sourced `activate` script is not part of this file and may reference
# unset variables.
set -xe

# Fail fast with a clear message instead of launching with a missing flag
# value (an empty value would otherwise make the next flag get consumed as
# the previous flag's argument).
: "${MODEL_NAME:?MODEL_NAME must be set}"
: "${NUM_GPUS:?NUM_GPUS must be set}"
: "${DATATYPE:?DATATYPE must be set}"

cd /app/aphrodite-engine
source activate aphrodite-engine

echo 'Starting Aphrodite Engine API server...'

# Build the command as an array so each value stays a single argument even
# if it contains whitespace or glob characters. python -u keeps stdout and
# stderr unbuffered so log lines appear immediately.
cmd=(
  python -u -m aphrodite.endpoints.kobold.api_server
  --host 0.0.0.0
  --port 7860
  --model "$MODEL_NAME"
  --tensor-parallel-size "$NUM_GPUS"
  --dtype "$DATATYPE"
)

# Quantization is optional: only add the flag when a value was provided.
if [[ -n "${QUANTIZATION:-}" ]]; then
  cmd+=(--quantization "$QUANTIZATION")
fi

# Replace this shell with the server process so it receives signals directly.
exec "${cmd[@]}"
|