We read every piece of feedback and take your input very seriously.
To see all available qualifiers, see our documentation.
1 parent b7cbefc, commit b217489. Copy full SHA for b217489.
python/infinilm/base_config.py
@@ -71,8 +71,8 @@ def __init__(self):
71
self.endpoint = self.args.endpoint
72
self.ignore_eos = self.args.ignore_eos
73
74
- if self.enable_paged_attn and self.attn_backend == "default":
75
- self.attn_backend = "paged-attn"
+ if self.enable_paged_attn and self.attn == "default":
+ self.attn = "paged-attn"
76
77
def _add_common_args(self):
78
# --- base configuration ---
python/infinilm/server/inference_server.py
@@ -575,6 +575,7 @@ def main():
575
port=cfg.port,
576
enable_graph=cfg.enable_graph,
577
attn_backend=cfg.attn,
578
+ ignore_eos=cfg.ignore_eos,
579
)
580
server.start()
581
0 commit comments