Browse Source

Measure end time within the CUDA memory profiler

AlpinDale 7 months ago
parent
commit
072b30fb42
1 changed file with 1 addition and 1 deletion
  1. 1 1
      aphrodite/task_handler/model_runner.py

+ 1 - 1
aphrodite/task_handler/model_runner.py

@@ -167,10 +167,10 @@ class ModelRunner:
                 scheduler_config=self.scheduler_config,
                 cache_config=self.cache_config,
             )
+            end_time = time.time()
 
         self.model_memory_usage = m.consumed_memory
         tp = get_tensor_model_parallel_world_size()
-        end_time = time.time()
         total_time = end_time - start_time
         logger.info(
             f"Model weights loaded in {total_time:.2f} seconds.\nMemory usage: "