123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230 |
- #!/usr/bin/env bash
- # Ruff formatter.
- #
- # Usage:
- # # Do work and commit your work.
- # # Format files that differ from origin/main.
- # bash formatting.sh
- #
- #
- # Cause the script to exit if a single command fails
- set -eo pipefail
- # this stops git rev-parse from failing if we run this from the .git directory
- builtin cd "$(dirname "${BASH_SOURCE:-$0}")"
- ROOT="$(git rev-parse --show-toplevel)"
- builtin cd "$ROOT" || exit 1
- RUFF_VERSION=$(ruff --version | awk '{print $2}')
- MYPY_VERSION=$(mypy --version | awk '{print $2}')
- CODESPELL_VERSION=$(codespell --version)
- ISORT_VERSION=$(isort --vn)
- CLANGFORMAT_VERSION=$(clang-format --version | awk '{print $3}')
- # # params: tool name, tool version, required version
- tool_version_check() {
- if [[ $2 != $3 ]]; then
- echo "Wrong $1 version installed: $3 is required, not $2."
- exit 1
- fi
- }
- tool_version_check "ruff" $RUFF_VERSION "$(grep "ruff==" requirements-lint.txt | cut -d'=' -f3)"
- tool_version_check "isort" "$ISORT_VERSION" "$(grep isort requirements-lint.txt | cut -d'=' -f3)"
- tool_version_check "codespell" "$CODESPELL_VERSION" "$(grep codespell requirements-lint.txt | cut -d'=' -f3)"
- tool_version_check "clang-format" "$CLANGFORMAT_VERSION" "$(grep clang-format requirements-lint.txt | cut -d'=' -f3)"
- # If git diff returns a file that is in the skip list, the file may be checked anyway:
- # https://github.com/codespell-project/codespell/issues/1915
- # Avoiding the "./" prefix and using "/**" globs for directories appears to solve the problem
- CODESPELL_EXCLUDES=(
- '--skip' './tests/benchmarks/sonnet.txt,build/**'
- )
- # check spelling of specified files
- spell_check() {
- codespell "$@"
- }
- spell_check_all(){
- codespell --toml pyproject.toml "${CODESPELL_EXCLUDES[@]}"
- }
- # Spelling check of files that differ from main branch.
- spell_check_changed() {
- # The `if` guard ensures that the list of filenames is not empty, which
- # could cause ruff to receive 0 positional arguments, making it hang
- # waiting for STDIN.
- #
- # `diff-filter=ACM` and $MERGEBASE is to ensure we only lint files that
- # exist on both branches.
- MERGEBASE="$(git merge-base origin/main HEAD)"
- if ! git diff --diff-filter=ACM --quiet --exit-code "$MERGEBASE" -- '*.py' '*.pyi' &>/dev/null; then
- git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.py' '*.pyi' | xargs \
- codespell "${CODESPELL_EXCLUDES[@]}"
- fi
- }
- # Run Codespell
- ## This flag runs spell check of individual files. --files *must* be the first command line
- ## arg to use this option.
- if [[ "$1" == '--files' ]]; then
- spell_check "${@:2}"
- # If `--all` is passed, then any further arguments are ignored and the
- # entire python directory is linted.
- elif [[ "$1" == '--all' ]]; then
- spell_check_all
- else
- # Check spelling only of the files that changed in last commit.
- spell_check_changed
- fi
- echo 'Aphrodite codespell: Done'
- # Lint specified files
- lint() {
- ruff "$@"
- }
- # Lint files that differ from main branch. Ignores dirs that are not slated
- # for autolint yet.
- lint_changed() {
- # The `if` guard ensures that the list of filenames is not empty, which
- # could cause ruff to receive 0 positional arguments, making it hang
- # waiting for STDIN.
- #
- # `diff-filter=ACM` and $MERGEBASE is to ensure we only lint files that
- # exist on both branches.
- MERGEBASE="$(git merge-base origin/main HEAD)"
- if ! git diff --diff-filter=ACM --quiet --exit-code "$MERGEBASE" -- '*.py' '*.pyi' &>/dev/null; then
- git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.py' '*.pyi' | xargs \
- ruff
- fi
- }
- # Run Ruff
- ### This flag lints individual files. --files *must* be the first command line
- ### arg to use this option.
- if [[ "$1" == '--files' ]]; then
- lint "${@:2}"
- # If `--all` is passed, then any further arguments are ignored and the
- # entire python directory is linted.
- elif [[ "$1" == '--all' ]]; then
- lint aphrodite tests
- else
- # Format only the files that changed in last commit.
- lint_changed
- fi
- echo 'Aphrodite ruff: Done'
- # check spelling of specified files
- isort_check() {
- isort "$@"
- }
- isort_check_all(){
- isort .
- }
- # Spelling check of files that differ from main branch.
- isort_check_changed() {
- # The `if` guard ensures that the list of filenames is not empty, which
- # could cause ruff to receive 0 positional arguments, making it hang
- # waiting for STDIN.
- #
- # `diff-filter=ACM` and $MERGEBASE is to ensure we only lint files that
- # exist on both branches.
- MERGEBASE="$(git merge-base origin/main HEAD)"
- if ! git diff --diff-filter=ACM --quiet --exit-code "$MERGEBASE" -- '*.py' '*.pyi' &>/dev/null; then
- git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.py' '*.pyi' | xargs \
- isort
- fi
- }
- # Run Isort
- # This flag runs spell check of individual files. --files *must* be the first command line
- # arg to use this option.
- if [[ "$1" == '--files' ]]; then
- isort_check "${@:2}"
- # If `--all` is passed, then any further arguments are ignored and the
- # entire python directory is linted.
- elif [[ "$1" == '--all' ]]; then
- isort_check_all
- else
- # Check spelling only of the files that changed in last commit.
- isort_check_changed
- fi
- echo 'Aphrodite isort: Done'
- # Clang-format section
- # Exclude some files for formatting because they are vendored
- # NOTE: Keep up to date with .github/workflows/clang-format.yml
- CLANG_FORMAT_EXCLUDES=(
- 'kernels/moe/softmax.cu'
- 'kernels/punica/bgmv/bgmv_bf16_bf16_bf16.cu'
- 'kernels/punica/bgmv/bgmv_config.h'
- 'kernels/punica/bgmv/bgmv_impl.cuh'
- 'kernels/punica/bgmv/vec_dtypes.cuh'
- 'kernels/punica/punica_ops.cu'
- 'kernels/punica/type_convert.h'
- 'kernels/quantization/gguf/ggml-common.h'
- 'kernels/quantization/gguf/dequantize.cuh'
- 'kernels/quantization/gguf/vecdotq.cuh'
- 'kernels/quantization/gguf/mmq.cuh'
- 'kernels/quantization/gguf/mmvq.cuh'
- )
- # Format specified files with clang-format
- clang_format() {
- clang-format -i "$@"
- }
- # Format files that differ from main branch with clang-format.
- clang_format_changed() {
- # The `if` guard ensures that the list of filenames is not empty, which
- # could cause clang-format to receive 0 positional arguments, making it hang
- # waiting for STDIN.
- #
- # `diff-filter=ACM` and $MERGEBASE is to ensure we only format files that
- # exist on both branches.
- MERGEBASE="$(git merge-base origin/main HEAD)"
- # Get the list of changed files, excluding the specified ones
- changed_files=$(git diff --name-only --diff-filter=ACM "$MERGEBASE" -- '*.h' '*.cpp' '*.cu' '*.cuh' | grep -vFf <(printf "%s\n" "${CLANG_FORMAT_EXCLUDES[@]}"))
- if [ -n "$changed_files" ]; then
- echo "$changed_files" | xargs -P 5 clang-format -i
- fi
- }
- # Format all files with clang-format
- clang_format_all() {
- find kernels/ \( -name '*.h' -o -name '*.cpp' -o -name '*.cu' -o -name '*.cuh' \) -print \
- | grep -vFf <(printf "%s\n" "${CLANG_FORMAT_EXCLUDES[@]}") \
- | xargs clang-format -i
- }
- # Run clang-format
- if [[ "$1" == '--files' ]]; then
- clang_format "${@:2}"
- elif [[ "$1" == '--all' ]]; then
- clang_format_all
- else
- clang_format_changed
- fi
- echo 'Aphrodite clang-format: Done'
- if ! git diff --quiet &>/dev/null; then
- echo 'Reformatted files. Please review and stage the changes.'
- echo 'Changes not staged for commit:'
- echo
- git --no-pager diff --name-only
- exit 1
- fi
|