We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent b8b7f35, commit f41e457 (Copy full SHA for f41e457)
1 file changed
fastdeploy/envs.py
@@ -290,7 +290,7 @@ def _validate_split_kv_size(value: int) -> int:
290
# Whether to enable FP8 quantization with pow2scale.
291
"FD_FP8_QUANT_WITH_POW2SCALE": lambda: bool(int(os.getenv("FD_FP8_QUANT_WITH_POW2SCALE", "0"))),
292
# Whether to enable top_p=1.0 optimization.
293
- "FD_ENABLE_TOP_P_ONE_OPT": lambda: bool(int(os.getenv("FD_ENABLE_TOP_P_ONE_OPT", "1"))),
+ "FD_ENABLE_TOP_P_ONE_OPT": lambda: bool(int(os.getenv("FD_ENABLE_TOP_P_ONE_OPT", "0"))),
294
}
295
296
0 commit comments