diff --git a/compiler/transforms/guarded_linalg_to_memref_stream.py b/compiler/transforms/guarded_linalg_to_memref_stream.py
deleted file mode 100644
index 257bfc18..00000000
--- a/compiler/transforms/guarded_linalg_to_memref_stream.py
+++ /dev/null
@@ -1,60 +0,0 @@
-from xdsl.context import MLContext
-from xdsl.dialects import linalg, memref_stream
-from xdsl.dialects.builtin import ModuleOp, StringAttr
-from xdsl.ir import Operation
-from xdsl.passes import ModulePass
-from xdsl.pattern_rewriter import (
-    GreedyRewritePatternApplier,
-    PatternRewriter,
-    PatternRewriteWalker,
-    RewritePattern,
-    op_type_rewrite_pattern,
-)
-from xdsl.transforms.convert_linalg_to_memref_stream import (
-    ConvertGenericOpPattern,
-    ConvertYieldOpPattern,
-)
-
-
-class GuardedGenericOpPattern(RewritePattern):
-    @op_type_rewrite_pattern
-    def match_and_rewrite(self, op: linalg.Generic, rewriter: PatternRewriter) -> None:
-        """
-        This pattern is a guarded version of the pattern in upstream xDSL.
-        This is required because we can't (or don't want to) lower all
-        generic calls through the stream dialects.
-        It only matches on linalg.generics that have a library call with
-        a `_stream` suffix. This pass removes that suffix.
-        """
-
-        if not op.library_call:
-            return
-
-        if op.library_call.data.endswith("_stream"):
-            op.library_call = StringAttr(op.library_call.data[: -len("_stream")])
-            ConvertGenericOpPattern().match_and_rewrite(op, rewriter)
-
-
-class GuardedYieldOpPattern(RewritePattern):
-    @op_type_rewrite_pattern
-    def match_and_rewrite(self, op: linalg.YieldOp, rewriter: PatternRewriter):
-        # find the parent operation
-        parent_op = op.parent
-        while parent_op and not isinstance(parent_op, Operation):
-            parent_op = parent_op.parent
-
-        # only rewrite if the parent is a memref_stream generic
-        if isinstance(parent_op, memref_stream.GenericOp):
-            ConvertYieldOpPattern().match_and_rewrite(op, rewriter)
-
-
-class GuardedLinalgToMemrefStreamPass(ModulePass):
-    name = "guarded-linalg-to-memref-stream"
-
-    def apply(self, ctx: MLContext, op: ModuleOp) -> None:
-        PatternRewriteWalker(
-            GreedyRewritePatternApplier(
-                [GuardedGenericOpPattern(), GuardedYieldOpPattern()]
-            ),
-            apply_recursively=False,
-        ).rewrite_module(op)
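
Note: the guard above keys entirely off the `library_call` attribute: only generics opting in via a `_stream` suffix are lowered through the stream dialects, and the suffix is dropped in the process. A minimal standalone sketch of that convention (plain strings instead of `StringAttr`; the helper name is hypothetical):

    def wants_stream_lowering(library_call: str | None) -> tuple[bool, str | None]:
        # only library calls opting in via the `_stream` suffix are lowered
        # through the stream dialects; the suffix itself is dropped
        if library_call is not None and library_call.endswith("_stream"):
            return True, library_call[: -len("_stream")]
        return False, library_call

    assert wants_stream_lowering("snax_alu_stream") == (True, "snax_alu")
    assert wants_stream_lowering("snax_alu") == (False, "snax_alu")
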
diff --git a/compiler/transforms/schedule_memref_linalg.py b/compiler/transforms/schedule_memref_linalg.py
deleted file mode 100644
index 2c5738c1..00000000
--- a/compiler/transforms/schedule_memref_linalg.py
+++ /dev/null
@@ -1,318 +0,0 @@
-from xdsl.context import MLContext
-from xdsl.dialects import builtin, memref_stream, stream
-from xdsl.ir import Block, Region
-from xdsl.ir.affine import AffineConstantExpr, AffineDimExpr, AffineExpr, AffineMap
-from xdsl.passes import ModulePass
-from xdsl.pattern_rewriter import (
-    PatternRewriter,
-    PatternRewriteWalker,
-    RewritePattern,
-    op_type_rewrite_pattern,
-)
-from xdsl.rewriter import InsertPoint
-
-from compiler.dialects.kernel import QMacOp
-from compiler.util.canonicalize_affine import canonicalize_map
-
-
-def disable_dims(map: AffineMap, dim: int) -> AffineMap:
-    """
-    Returns an affine map with the leftmost `dim` dimensions set to 0.
-
-    For example:
-        (d0, d1, d2) -> d0 + d1 + d2
-    For `dim` = 1, will return:
-        (d1, d2) -> d1 + d2
-    For `dim` = 2, will return:
-        (d2) -> d2
-    """
-    return canonicalize_map(
-        map.replace_dims_and_symbols(
-            [AffineConstantExpr(0) for _ in range(dim)]
-            + [AffineDimExpr(i) for i in range(map.num_dims - dim)],
-            [],
-            map.num_dims - dim,
-            0,
-        )
-    )
-
-
-def rotate_dims(map: AffineMap, dim: int) -> AffineMap:
-    """
-    Returns an affine map with the leftmost `dim` dimensions rotated.
-
-    For example:
-        (d0, d1, d2) -> 1 * d0 + 2 * d1 + 3 * d2
-    For `dim` = 3, will return:
-        (d0, d1, d2) -> 3 * d0 + 1 * d1 + 2 * d2
-    For `dim` = 2, will return:
-        (d0, d1, d2) -> 2 * d0 + 1 * d1 + 3 * d2
-    """
-    new_dims = [AffineDimExpr(i) for i in range(dim)]
-    # rotate the dims by popping the first and appending it
-    new_dims.append(new_dims.pop(0))
-    # keep the remaining dims unchanged
-    new_dims = new_dims + [AffineDimExpr(i) for i in range(dim, map.num_dims)]
-    return canonicalize_map(
-        map.replace_dims_and_symbols(new_dims, [], len(new_dims), 0)
-    )
-
-
-def rotate_bounds(bounds: list[int | None], dim: int) -> list[int | None]:
-    """
-    Returns the bounds after rotating dims, as in `rotate_dims`.
-    """
-    bounds = bounds.copy()
-    bounds.insert(0, bounds.pop(dim - 1))
-    return bounds
-
-
-def tile_dim(map: AffineMap, dim: int, template_bound: int) -> AffineMap:
-    """
-    Returns a new affine map with the `dim` dimension split up into two.
-    This translates to creating two for loops with adjusted bounds from
-    one for loop.
-
-    For example:
-        (d0, d1, d2) -> d0 + d1 + d2
-    For `dim` = 1, `template_bound` = 2:
-        (d0, d1, d2, d3) -> d0 + 2 * d1 + d2 + d3
-    """
-    # 1 extra dimension
-    # create the result map (d0, d1, ... dn)
-    new_results: list[AffineExpr] = [AffineDimExpr(i) for i in range(map.num_dims + 1)]
-    # pop the result at dim
-    dim_sum = new_results.pop(dim)
-    # add it back: the popped dim becomes the outer loop, scaled by the template bound
-    new_results[dim] = new_results[dim] + dim_sum * template_bound
-    transform_map = AffineMap(map.num_dims + 1, 0, tuple(new_results))
-
-    result = canonicalize_map(map.compose(transform_map))
-
-    return result
-
-
-def tile_bounds(
-    bounds: list[int | None], dim: int, template_bound: int
-) -> list[int | None]:
-    """
-    Returns the bounds after applying `tile_dim` in a similar fashion.
-
-    For example:
-        [2, 8, 2]
-    For `dim` = 1, `template_bound` = 2:
-        [2, 4, 2, 2]
-    """
-    bounds = bounds.copy()
-    bound = bounds[dim]
-    bounds[dim] = template_bound
-    bounds.insert(dim, bound // template_bound if bound else None)
-    return bounds
-
-
-class ScheduleMemrefLinalgRewriter(RewritePattern):
-    """
-    Takes a memref_stream.generic op as input and wraps it in a
-    memref_stream streaming region op. To determine the access patterns,
-    the operation is scheduled to an accelerator template.
- """ - - @op_type_rewrite_pattern - def match_and_rewrite(self, op: memref_stream.GenericOp, rewriter: PatternRewriter): - if any(isinstance(operand.type, stream.StreamType) for operand in op.operands): - # Already streamified - return - - if not ( - isinstance(op.library_call, builtin.StringAttr) - and op.library_call.data in ("snax_alu", "snax_gemm", "snax_gemmx") - ): - raise NotImplementedError( - "only snax_alu and snax_gemm are supported right now" - ) - - # only handle snax_alu and snax_gemm for now - if op.library_call.data == "snax_alu": - template = [AffineMap.from_callable(lambda x, y: (4 * x + y,))] * 3 - template_bounds = (None, 4) - elif op.library_call.data == "snax_gemm": - M, N, K, m, n, k = (AffineDimExpr(i) for i in range(6)) - template = [ - AffineMap(6, 0, (M * 8 + m, K * 8 + k)), - AffineMap(6, 0, (K * 8 + k, N * 8 + n)), - AffineMap(6, 0, (M * 8 + m, N * 8 + n)), - ] - template_bounds = (None, None, None, 8, 8, 8) - elif op.library_call.data == "snax_gemmx": - # TODO: move templates to accelerator definitions - if isinstance(op.body.block.first_op, QMacOp): - # gemm - M, N, K, m, n, k = (AffineDimExpr(i) for i in range(6)) - template = [ - AffineMap(6, 0, (M * 8 + m, K * 8 + k)), - AffineMap(6, 0, (K * 8 + k, N * 8 + n)), - AffineMap(6, 0, (M * 8 + m, N * 8 + n)), - ] - template_bounds = (None, None, None, 8, 8, 8) - else: - # rescale function of gemmx - M, K, m, k = (AffineDimExpr(i) for i in range(4)) - template = [ - AffineMap(4, 0, (M * 8 + m, K * 8 + k)), - AffineMap(4, 0, (M * 8 + m, K * 8 + k)), - ] - template_bounds = (None, None, 8, 8) - - # only take patterns of memref operands - schedule = [ - imap.data - for imap, op in zip(op.indexing_maps.data, op.operands) - if isinstance(op.type, builtin.MemRefType) - ] - - schedule_bounds: list[int | None] = [ - bound.value.data for bound in op.bounds.data - ] - - for i in range(template[0].num_dims): - # i = 0: look at the last dimension - # i = 1: look at the second to last dimension - template_dim = template[0].num_dims - i - 1 - schedule_dim = schedule[0].num_dims - i - 1 - match = False - - for it in range(schedule_dim + 1): - # keep rotating the remaining dimensions until we have a match - - template_check = tuple( - disable_dims(map, template_dim) for map in template - ) - schedule_check = tuple( - disable_dims(map, schedule_dim) for map in schedule - ) - - if template_check == schedule_check: - match = True - break - - # else rotate the for loops - schedule = tuple(rotate_dims(map, schedule_dim + 1) for map in schedule) - schedule_bounds = rotate_bounds(schedule_bounds, schedule_dim + 1) - - if not match: - raise RuntimeError("failed to match template and schedule") - - # now, check bounds and design potential transfomration map - if not (template_bound := template_bounds[template_dim]): - # nothing to worry about, continue to next dim - continue - - schedule_bound = op.bounds.data[schedule_dim].value.data - - if schedule_bound < template_bound: - # need to apply padding - raise NotImplementedError("padding not supported") - elif schedule_bound >= template_bound: - # need to split up the schedule - assert schedule_bound % template_bound == 0 - schedule = [ - tile_dim(schedule_map, schedule_dim, template_bound) - for schedule_map in schedule - ] - schedule_bounds = tile_bounds( - schedule_bounds, schedule_dim, template_bound - ) - - # if we get here we have now successfully determined a schedule for the operator - # this can be implemented with a memref streaming region - # the rest of this function just 
-
-        # If we get here, we have successfully determined a schedule for the
-        # operator. This can be implemented with a memref streaming region;
-        # the rest of this function creates the wrapping streaming region op.
-        # The original generic op stays the same. Its indexing maps are now
-        # largely meaningless and should not be inspected by following passes.
-
-        input_streams = [
-            stream.ReadableStreamType(input.type.element_type)
-            for input in op.inputs
-            if isinstance(input.type, builtin.MemRefType)
-        ]
-
-        output_streams = [
-            stream.WritableStreamType(output.type.element_type)
-            for output in op.outputs
-            if isinstance(output.type, builtin.MemRefType)
-        ]
-
-        bounds_attr = builtin.ArrayAttr(
-            [
-                builtin.IntegerAttr(val if val else -1, builtin.IndexType())
-                for val in schedule_bounds
-            ]
-        )
-        stride_patterns: list[memref_stream.StridePattern] = [
-            memref_stream.StridePattern(bounds_attr, builtin.AffineMapAttr(map))
-            for map in schedule
-        ]
-
-        streaming_region_op = memref_stream.StreamingRegionOp(
-            inputs=[
-                input
-                for input in op.inputs
-                if isinstance(input.type, builtin.MemRefType)
-            ],
-            outputs=[
-                output
-                for output in op.outputs
-                if isinstance(output.type, builtin.MemRefType)
-            ],
-            patterns=builtin.ArrayAttr(stride_patterns),
-            body=Region(Block(arg_types=input_streams + output_streams)),
-        )
-
-        streaming_args = list(streaming_region_op.body.block.args)
-        new_inputs = [
-            streaming_args.pop(0)
-            if isinstance(input.type, builtin.MemRefType)
-            else input
-            for input in op.inputs
-        ]
-        new_outputs = [
-            streaming_args.pop(0)
-            if isinstance(output.type, builtin.MemRefType)
-            else output
-            for output in op.outputs
-        ]
-
-        new_generic_op = memref_stream.GenericOp(
-            inputs=new_inputs,
-            outputs=new_outputs,
-            inits=op.inits,
-            body=rewriter.move_region_contents_to_new_regions(op.body),
-            indexing_maps=op.indexing_maps,
-            iterator_types=op.iterator_types,
-            bounds=op.bounds,
-            init_indices=op.init_indices,
-            doc=op.doc,
-            library_call=op.library_call,
-        )
-
-        rewriter.replace_matched_op(streaming_region_op)
-        rewriter.insert_op(
-            new_generic_op, InsertPoint.at_end(streaming_region_op.body.block)
-        )
-
-
-class ScheduleMemrefLinalg(ModulePass):
-    """
-    A pass to schedule a memref stream according to an accelerator
-    definition. The result is wrapped in a memref streaming region op
-    that contains the resulting schedule. The linalg operation itself
-    remains unchanged, as it is schedule agnostic.
-    """
-
-    name = "schedule-memref-linalg"
-
-    def apply(self, ctx: MLContext, op: builtin.ModuleOp):
-        PatternRewriteWalker(
-            ScheduleMemrefLinalgRewriter(), apply_recursively=False
-        ).rewrite_module(op)
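
The docstring examples in the affine-map helpers above can be replayed against xDSL directly. A sketch, assuming a checkout from before this diff so that the deleted module is still importable (otherwise the helper definitions can be copied out verbatim); expected outputs follow the docstrings, modulo xDSL renumbering the dims when printing:

    from xdsl.ir.affine import AffineMap

    from compiler.transforms.schedule_memref_linalg import (
        disable_dims,
        rotate_dims,
        tile_bounds,
        tile_dim,
    )

    m = AffineMap.from_callable(lambda d0, d1, d2: (d0 + 2 * d1 + 3 * d2,))
    # zero the leftmost dim: expected (d0, d1) -> (2 * d0 + 3 * d1)
    print(disable_dims(m, 1))
    # rotate all three dims: expected (d0, d1, d2) -> (3 * d0 + d1 + 2 * d2)
    print(rotate_dims(m, 3))

    m = AffineMap.from_callable(lambda d0, d1, d2: (d0 + d1 + d2,))
    # split d1 with a template bound of 2: one extra loop appears,
    # expected (d0, d1, d2, d3) -> (d0 + 2 * d1 + d2 + d3)
    print(tile_dim(m, 1, 2))
    # the matching bounds [2, 8, 2] tile to [2, 4, 2, 2]
    print(tile_bounds([2, 8, 2], 1, 2))
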
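The scheduling loop in match_and_rewrite compares template and schedule through disable_dims, rotating the schedule until the trailing dimensions agree. A worked sketch for the snax_gemm case (imports again assume the pre-deletion tree; the final equality is exactly the check the loop performs at i = 0):

    from xdsl.ir.affine import AffineDimExpr, AffineMap

    from compiler.transforms.schedule_memref_linalg import disable_dims

    # the snax_gemm template from the pass above
    M, N, K, m, n, k = (AffineDimExpr(i) for i in range(6))
    template = [
        AffineMap(6, 0, (M * 8 + m, K * 8 + k)),
        AffineMap(6, 0, (K * 8 + k, N * 8 + n)),
        AffineMap(6, 0, (M * 8 + m, N * 8 + n)),
    ]

    # a plain matmul schedule, as produced from linalg indexing maps
    d0, d1, d2 = (AffineDimExpr(i) for i in range(3))
    schedule = [
        AffineMap(3, 0, (d0, d2)),
        AffineMap(3, 0, (d2, d1)),
        AffineMap(3, 0, (d0, d1)),
    ]

    # at i = 0 the loop zeroes all but the last dim on both sides; both
    # tuples reduce to ((0, d0), (d0, 0), (0, 0)), so the innermost dims
    # match without any rotation
    assert tuple(disable_dims(t, 5) for t in template) == tuple(
        disable_dims(s, 2) for s in schedule
    )
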
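Taken together, the two deleted passes formed a small pipeline: the guarded conversion turned opted-in linalg.generic ops into memref_stream.generic ops, and the scheduler then wrapped those in a streaming region matched against the accelerator template. A hedged usage sketch (the driver function is illustrative; only the pass classes and their `name` fields come from the deleted files):

    from xdsl.context import MLContext
    from xdsl.dialects.builtin import ModuleOp

    from compiler.transforms.guarded_linalg_to_memref_stream import (
        GuardedLinalgToMemrefStreamPass,
    )
    from compiler.transforms.schedule_memref_linalg import ScheduleMemrefLinalg

    def lower_to_streams(ctx: MLContext, module: ModuleOp) -> None:
        # 1. linalg.generic (library_call "*_stream") -> memref_stream.generic
        GuardedLinalgToMemrefStreamPass().apply(ctx, module)
        # 2. schedule against the accelerator template and wrap the generic
        #    in a memref_stream streaming region op
        ScheduleMemrefLinalg().apply(ctx, module)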