@@ -91,7 +91,7 @@ class OptimizationLevel(IntEnum):
9191# if model_config is not None:
9292# IS_QUANTIZED = lambda c: c.model_config.is_quantized()
9393# IS_DENSE = lambda c: not c.model_config.is_model_moe()
94- # See https://github.com/aphrodite-project/aphrodite/issues/25689.
94+ # See https://github.com/vllm-project/vllm/issues/25689.
9595
9696
9797def enable_norm_fusion (cfg : "AphroditeConfig" ) -> bool :
@@ -129,10 +129,10 @@ def enable_allreduce_rms_fusion(cfg: "AphroditeConfig") -> bool:
129129 and has_flashinfer ()
130130 and (current_platform .is_device_capability_family (100 ) or current_platform .is_device_capability (90 ))
131131 # tp-dp combination broken:
132- # https://github.com/aphrodite-project/aphrodite/issues/34458
132+ # https://github.com/vllm-project/vllm/issues/34458
133133 and cfg .parallel_config .data_parallel_size == 1
134134 # tp-pp combination broken:
135- # https://github.com/aphrodite-project/aphrodite/issues/35426
135+ # https://github.com/vllm-project/vllm/issues/35426
136136 and cfg .parallel_config .pipeline_parallel_size == 1
137137 )
138138
@@ -881,7 +881,7 @@ def has_blocked_weights():
881881 # Enable quant_fp8 CUDA ops (TODO disable in follow up)
882882 # On H100 the CUDA kernel is faster than
883883 # native implementation
884- # https://github.com/aphrodite-project/aphrodite/issues/25094
884+ # https://github.com/vllm-project/vllm/issues/25094
885885 if has_blocked_weights ():
886886 custom_ops = self .compilation_config .custom_ops
887887 if "-quant_fp8" not in custom_ops :
@@ -1103,7 +1103,7 @@ def has_blocked_weights():
11031103 # incorrect residual shape.
11041104 # Use custom rms norm to unblock. In the future,
11051105 # the pass will operate on higher-level IR to avoid the issue.
1106- # TODO: https://github.com/aphrodite-project/aphrodite/issues/27894
1106+ # TODO: https://github.com/vllm-project/vllm/issues/27894
11071107 if self .compilation_config .mode != CompilationMode .APHRODITE_COMPILE :
11081108 logger .warning (
11091109 "Sequence parallelism is enabled, but running in wrong aphrodite compile mode: %s." ,
@@ -1246,7 +1246,7 @@ def has_blocked_weights():
12461246 # Enable quant_fp8 CUDA ops (TODO disable in follow up)
12471247 # On H100 the CUDA kernel is faster than
12481248 # native implementation
1249- # https://github.com/aphrodite-project/aphrodite/issues/25094
1249+ # https://github.com/vllm-project/vllm/issues/25094
12501250 if has_blocked_weights ():
12511251 custom_ops = self .compilation_config .custom_ops
12521252 if "-quant_fp8" not in custom_ops :
@@ -1657,18 +1657,18 @@ def _validate_v2_model_runner(self) -> None:
16571657 unsupported .append ("dual batch overlap" )
16581658
16591659 if self .model_config is not None and self .model_config .enable_return_routed_experts :
1660- # Will be added by https://github.com/aphrodite-project/aphrodite/pull/38163
1660+ # Will be added by https://github.com/vllm-project/vllm/pull/38163
16611661 unsupported .append ("routed experts capture" )
16621662
16631663 if self .model_config is not None and self .model_config .logits_processors :
16641664 unsupported .append ("custom logits processors" )
16651665
16661666 if self .cache_config .kv_sharing_fast_prefill :
1667- # Will be added by https://github.com/aphrodite-project/aphrodite/pull/35045
1667+ # Will be added by https://github.com/vllm-project/vllm/pull/35045
16681668 unsupported .append ("KV sharing fast prefill" )
16691669
16701670 if self .ec_transfer_config is not None :
1671- # Will be added by https://github.com/aphrodite-project/aphrodite/pull/38390
1671+ # Will be added by https://github.com/vllm-project/vllm/pull/38390
16721672 unsupported .append ("EC transfer" )
16731673
16741674 if unsupported :
0 commit comments