  /*
   * SPDX-FileCopyrightText: Copyright (c) 2022-2024 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
   * SPDX-License-Identifier: Apache-2.0
   *
   * Licensed under the Apache License, Version 2.0 (the "License");
   * you may not use this file except in compliance with the License.
   * You may obtain a copy of the License at
   *
   * http://www.apache.org/licenses/LICENSE-2.0
   *
   * Unless required by applicable law or agreed to in writing, software
   * distributed under the License is distributed on an "AS IS" BASIS,
   * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
   * See the License for the specific language governing permissions and
   * limitations under the License.
   */
  #pragma once

  #include <cstdint>
  #include <optional>
  // XQA kernels (optimized kernels for generation phase).
  //
  // Returns a flag that, going by the name, says whether use of the XQA
  // kernels is forced.
  // NOTE(review): what controls the flag is not visible in this header
  // (presumably an environment variable, like the other getters declared
  // here) -- confirm against the definition.
  bool forceXQAKernels();
  // Whether XQA JIT is enabled.
  //
  // Returns the value of TRTLLM_ENABLE_XQA_JIT env var. If such env var doesn't
  // exist, std::nullopt is returned.
  std::optional<bool> getEnvEnableXQAJIT();
  // Tune the number of blocks per sequence for accuracy/performance purpose.
  //
  // NOTE(review): the setting each getter reads, and its default, are not
  // visible in this header (the getEnv prefix suggests environment variables)
  // -- confirm against the definitions, and confirm each getter is defined.
  bool getEnvMmhaMultiblockDebug();
  int getEnvMmhaBlocksPerSequence();
  int getEnvMmhaKernelBlockSize();
  // Whether PDL is enabled.
  //
  // NOTE(review): PDL presumably stands for CUDA Programmatic Dependent
  // Launch, and the getEnv prefix suggests the flag comes from an environment
  // variable; neither is visible in this header -- confirm against the
  // definition.
  bool getEnvEnablePDL();