#!/bin/bash set -xe cd /app/aphrodite-engine source activate aphrodite-engine echo 'Starting Aphrodite Engine API server...' python -u -m aphrodite.endpoints.api_server_kobold \ --host 0.0.0.0 \ --port 2242 \ --model $MODEL_NAME \ --tensor-parallel-size $NUM_GPUS \ --quantization $QUANTIZATION \ --dtype $DATATYPE