# One requirement specifier per line. pip treats " #" through end-of-line as a
# comment, so each package must sit on its own line to actually be installed.
sentencepiece  # Required for LLaMA tokenizer.
numpy
transformers-neuronx >= 0.9.0
torch-neuronx >= 2.1.0
neuronx-cc
fastapi
uvicorn[standard]
pydantic >= 2.0  # Required for OpenAI server.
prometheus_client >= 0.18.0
requests
psutil
py-cpuinfo