cuda_utils.cc 1.6 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455
  1. /*
  2. * Copyright (c) 2019-2023, NVIDIA CORPORATION. All rights reserved.
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "cuda_utils.h"
  17. namespace fastertransformer {
  18. /* ***************************** common utils ****************************** */
  19. cudaError_t getSetDevice(int i_device, int* o_device)
  20. {
  21. int current_dev_id = 0;
  22. cudaError_t err = cudaSuccess;
  23. if (o_device != NULL) {
  24. err = cudaGetDevice(&current_dev_id);
  25. if (err != cudaSuccess) {
  26. return err;
  27. }
  28. if (current_dev_id == i_device) {
  29. *o_device = i_device;
  30. }
  31. else {
  32. err = cudaSetDevice(i_device);
  33. if (err != cudaSuccess) {
  34. return err;
  35. }
  36. *o_device = current_dev_id;
  37. }
  38. }
  39. else {
  40. err = cudaSetDevice(i_device);
  41. if (err != cudaSuccess) {
  42. return err;
  43. }
  44. }
  45. return cudaSuccess;
  46. }
  47. /* ************************** end of common utils ************************** */
  48. } // namespace fastertransformer