We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent d4acf51 commit 1b82fb0 Copy full SHA for 1b82fb0
vllm/compilation/pass_manager.py
@@ -18,14 +18,14 @@
18
from .fusion import RMSNormQuantFusionPass
19
from .fusion_attn import AttnFusionPass
20
from .qk_norm_rope_fusion import QKNormRoPEFusionPass
21
+ from .sequence_parallelism import SequenceParallelismPass
22
23
if current_platform.is_cuda():
24
from .collective_fusion import AllReduceFusionPass, AsyncTPPass
25
26
from .fix_functionalization import FixFunctionalizationPass
27
from .inductor_pass import CustomGraphPass, InductorPass, get_pass_context
28
from .noop_elimination import NoOpEliminationPass
-from .sequence_parallelism import SequenceParallelismPass
29
30
logger = init_logger(__name__)
31
0 commit comments