|
12 | 12 | from ..lang import Grid, IndexMapping
|
13 | 13 | from ..lang.global_symbols import *
|
14 | 14 | from ..ops import wave_ops
|
15 |
| -from ..ops.wave_ops import Iterate, CustomOp, get_custom, IterArg |
| 15 | +from ..ops.wave_ops import Iterate, CustomOp, get_custom |
16 | 16 | from .._support.indexing import IndexingContext, IndexExpr
|
17 | 17 | from .symbolic_constraints import SymbolicAlias
|
18 | 18 | from .._support.tracing import (
|
|
50 | 50 | from .decompose_scan_ops import decompose_scan_ops
|
51 | 51 | from .decompose_dot_mma import decompose_dot_mma
|
52 | 52 | from .expansion.expansion import expand_graph, add_get_results
|
| 53 | +from .gather_to_shared import gather_to_shared |
53 | 54 | from .global_to_shared_gathers import global_to_shared_gathers
|
54 | 55 | from .hoisting import hoist_loop_invariant_ops
|
55 | 56 | from .minimize_global_loads import minimize_global_loads
|
|
86 | 87 | import inspect
|
87 | 88 | import sympy
|
88 | 89 | import warnings
|
89 |
| -from pathlib import Path |
90 |
| -import sys |
91 |
| -import subprocess |
92 |
| -import os |
93 |
| -import shutil |
94 |
| -import glob |
95 | 90 |
|
96 | 91 | __all__ = ["wave", "wave_trace_only"]
|
97 | 92 |
|
@@ -529,14 +524,15 @@ def _trace_and_get_kernel_signature(
|
529 | 524 | graph_passes = self.build_initial_pass_pipeline(
|
530 | 525 | trace, options, print_ir_before, print_ir_after
|
531 | 526 | )
|
532 |
| - |
| 527 | + breakpoint() |
533 | 528 | # Optimizations.
|
534 | 529 | graph_passes += [
|
535 | 530 | partial(decompose_vmma_ops, trace, self.constraints),
|
536 | 531 | partial(decompose_dot_mma, trace, self.constraints),
|
537 | 532 | partial(hoist_loop_invariant_ops, trace, self.constraints),
|
538 | 533 | partial(global_to_shared_gathers, trace, self.constraints),
|
539 | 534 | partial(minimize_global_loads, trace, self.constraints),
|
| 535 | + partial(gather_to_shared, trace, self.constraints), |
540 | 536 | partial(apply_shared_memory_indexing_corrections, trace, self.constraints),
|
541 | 537 | ]
|
542 | 538 |
|
|
0 commit comments