7 月之前 · ee174ea4fd
--- a/aphrodite/common/config.py
+++ b/aphrodite/common/config.py
@@ -1171,6 +1171,8 @@ class LoRAConfig:
 
															                 "Due to limitations of the custom LoRA CUDA kernel, "
														
 
															                 "max_num_batched_tokens must be <= 65528 when "
														
 
															                 "LoRA is enabled.")
														
 
															+        if scheduler_config.chunked_prefill_enabled:
														
 
															+            raise ValueError("LoRA is not supported with chunked prefill yet.")
														
 
															 @dataclass