|
@@ -85,8 +85,6 @@ def prepare_engine_payload(
|
|
|
"must be less than or equal to "
|
|
|
f"max_model_len ({max_model_len})")
|
|
|
|
|
|
- sampling_params = SamplingParams(max_tokens=kai_payload.max_length)
|
|
|
-
|
|
|
# KAI spec: top_k == 0 means disabled, aphrodite: top_k == -1 means disabled
|
|
|
# https://github.com/KoboldAI/KoboldAI-Client/wiki/Settings
|
|
|
kai_payload.top_k = kai_payload.top_k if kai_payload.top_k != 0.0 else -1
|