7 months ago · ee174ea4fd
--- a/aphrodite/common/config.py
+++ b/aphrodite/common/config.py
@@ -1171,6 +1171,8 @@ class LoRAConfig:
 
				                 "Due to limitations of the custom LoRA CUDA kernel, "
			
 
				                 "max_num_batched_tokens must be <= 65528 when "
			
 
				                 "LoRA is enabled.")
			
 
				+        if scheduler_config.chunked_prefill_enabled:
			
 
				+            raise ValueError("LoRA is not supported with chunked prefill yet.")
			
 
				 
			
 
				 
			
 
				 @dataclass