Commit 3d7253e

Deleted unnecessary files

1 parent f536ac6

13 files changed: +320 -963 lines

examples/apps/flux-quantization-fp32.py

Lines changed: 0 additions & 168 deletions
This file was deleted.

examples/apps/flux-quantization.py

Lines changed: 0 additions & 203 deletions
This file was deleted.

examples/apps/register_sdpa.py

Lines changed: 5 additions & 3 deletions

@@ -19,9 +19,11 @@
 
 # Remove decompositions for aten.scaled_dot_product_attention, aten._scaled_dot_product_efficient_attention, aten._scaled_dot_product_flash_attention
 # This is because we want to have SDPA as a standalone operator in the graph and invoke the custom converter for it.
-# TORCH_TRT_DECOMPOSITIONS.pop(torch.ops.aten.scaled_dot_product_attention.default)
-# TORCH_TRT_DECOMPOSITIONS.pop(torch.ops.aten._scaled_dot_product_efficient_attention.default)
-# TORCH_TRT_DECOMPOSITIONS.pop(torch.ops.aten._scaled_dot_product_flash_attention.default)
+TORCH_TRT_DECOMPOSITIONS.pop(torch.ops.aten.scaled_dot_product_attention.default)
+TORCH_TRT_DECOMPOSITIONS.pop(
+    torch.ops.aten._scaled_dot_product_efficient_attention.default
+)
+TORCH_TRT_DECOMPOSITIONS.pop(torch.ops.aten._scaled_dot_product_flash_attention.default)
 
 REPLACEABLE_ATEN_OPS = {
     torch.ops.aten._scaled_dot_product_efficient_attention.default,
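
For context on what the newly uncommented lines do, here is a minimal, self-contained sketch of the pattern. It is not taken from the repository: TORCH_TRT_DECOMPOSITIONS is assumed to be a dict-like table mapping ATen op overloads to decomposition functions, and core_aten_decompositions() is used below only as a stand-in source for such a table. Removing the SDPA entries keeps scaled_dot_product_attention as a single node in the lowered graph, so the custom converter registered by this script can match it instead of its decomposed sub-ops.

import torch
from torch._decomp import core_aten_decompositions  # stand-in for the real table

# Assumption: TORCH_TRT_DECOMPOSITIONS maps torch._ops.OpOverload -> decomposition fn.
TORCH_TRT_DECOMPOSITIONS = dict(core_aten_decompositions())

for op in (
    torch.ops.aten.scaled_dot_product_attention.default,
    torch.ops.aten._scaled_dot_product_efficient_attention.default,
    torch.ops.aten._scaled_dot_product_flash_attention.default,
):
    # pop(op, None) tolerates ops with no registered decomposition; the committed
    # code uses bare pop(), which raises KeyError if the entry is missing.
    TORCH_TRT_DECOMPOSITIONS.pop(op, None)

One small observation on the committed code: pop() without a default assumes each entry is present in the table and raises KeyError otherwise, so pop(op, None) is the defensive variant if that assumption may not hold.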
