cbensimon HF Staff committed on
Commit
a5c23d1
·
1 Parent(s): da26724

fuse_qkv_projections

Browse files
Files changed (1) hide show
  1. optimization.py +1 -0
optimization.py CHANGED
@@ -39,5 +39,6 @@ def optimize_pipeline_(pipeline: Callable[P, Any], *args: P.args, **kwargs: P.kw
39
 
40
  return spaces.aoti_compile(exported, INDUCTOR_CONFIGS)
41
 
 
42
  pipeline.transformer.set_attn_processor(FlashFusedFluxAttnProcessor3_0())
43
  spaces.aoti_apply(compile_transformer(), pipeline.transformer)
 
39
 
40
  return spaces.aoti_compile(exported, INDUCTOR_CONFIGS)
41
 
42
+ pipeline.transformer.fuse_qkv_projections()
43
  pipeline.transformer.set_attn_processor(FlashFusedFluxAttnProcessor3_0())
44
  spaces.aoti_apply(compile_transformer(), pipeline.transformer)