#!/bin/bash
#
# Launch the Aphrodite Engine API server
# (python3 -m aphrodite.endpoints.openai.api_server) on 0.0.0.0:7860.
#
# The command line is assembled from environment variables.
#
# Required:
#   MODEL_NAME              -> --model
#   NUM_GPUS                -> --tensor-parallel-size
#   CONTEXT_LENGTH          -> --max-model-len
#   GPU_MEMORY_UTILIZATION  -> --gmu
#   DATATYPE                -> --dtype (only needed when QUANTIZATION is empty)
#
# Optional (the flag is added only when the variable is non-empty):
#   QUANTIZATION   -> --quantization, and forces --dtype half
#   API_KEY        -> --api-keys
#   ENFORCE_EAGER  -> --enforce-eager (any non-empty value enables it)
#   KVCACHE        -> --kv-cache-dtype
#
# Every value is passed to the server as exactly one argument; the shell never
# word-splits or glob-expands it.
#
# Exits non-zero before launching if a required variable is unset or empty, or
# if the working directory cannot be entered.
set -euo pipefail

cd /app/aphrodite-engine

echo 'Starting Aphrodite Engine API server...'

# Resolve the effective dtype once. Earlier revisions passed "--dtype $DATATYPE"
# and then appended a second "--dtype half" when quantizing, relying on the
# last occurrence of the flag taking precedence.
if [[ -n "${QUANTIZATION:-}" ]]; then
  dtype=half
else
  dtype=${DATATYPE:?DATATYPE must be set when QUANTIZATION is empty}
fi

# Build argv as an array (not a string) so values containing spaces or glob
# characters reach the server intact. ${VAR:?} aborts with a clear message
# instead of producing a malformed command line such as "--model --dtype ...".
cmd=(
  python3 -m aphrodite.endpoints.openai.api_server
  --host 0.0.0.0
  --port 7860
  --model "${MODEL_NAME:?MODEL_NAME must be set}"
  --tensor-parallel-size "${NUM_GPUS:?NUM_GPUS must be set}"
  --dtype "$dtype"
  --max-model-len "${CONTEXT_LENGTH:?CONTEXT_LENGTH must be set}"
  --gmu "${GPU_MEMORY_UTILIZATION:?GPU_MEMORY_UTILIZATION must be set}"
)

if [[ -n "${QUANTIZATION:-}" ]]; then
  cmd+=(--quantization "$QUANTIZATION")
fi

if [[ -n "${API_KEY:-}" ]]; then
  cmd+=(--api-keys "$API_KEY")
fi

if [[ -n "${ENFORCE_EAGER:-}" ]]; then
  cmd+=(--enforce-eager)
fi

if [[ -n "${KVCACHE:-}" ]]; then
  cmd+=(--kv-cache-dtype "$KVCACHE")
fi

# Log the final command to stderr. This replaces `set -x`, which would have
# written the API key to the logs in clear text; the argument following
# --api-keys is masked here.
{
  printf '+'
  mask_next=0
  for word in "${cmd[@]}"; do
    if ((mask_next)); then
      printf ' %s' '<redacted>'
      mask_next=0
      continue
    fi
    printf ' %q' "$word"
    if [[ "$word" == --api-keys ]]; then
      mask_next=1
    fi
  done
  printf '\n'
} >&2

# Replace this shell with the server process so it receives signals directly.
exec "${cmd[@]}"