makslevental
diff --git a/‎mlir_utils/dialects/ext/arith.py‎
Lines changed: 3 additions & 1 deletion b/‎mlir_utils/dialects/ext/arith.py‎
Lines changed: 3 additions & 1 deletion
diff --git a/‎mlir_utils/dialects/ext/memref.py‎
Lines changed: 297 additions & 0 deletions b/‎mlir_utils/dialects/ext/memref.py‎
Lines changed: 297 additions & 0 deletions
@@ -203,12 +203,14 @@ def __call__(cls, *args, **kwargs):
             fold = kwargs.get("fold")
             if fold is not None and not isinstance(fold, bool):
                 raise ValueError(f"{fold=} is expected to be a bool.")
+            loc = kwargs.get("loc")
+            ip = kwargs.get("ip")
             # If we're wrapping a numpy array (effectively a tensor literal),
             # then we want to make sure no one else has access to that memory.
             # Otherwise, the array will get funneled down to DenseElementsAttr.get,
             # which by default (through the Python buffer protocol) does not copy;
             # see mlir/lib/Bindings/Python/IRAttributes.cpp#L556
-            val = constant(deepcopy(arg), dtype)
+            val = constant(deepcopy(arg), dtype, loc=loc, ip=ip)
         else:
             raise NotImplementedError(f"{cls.__name__} doesn't support wrapping {arg}.")
 
 
@@ -0,0 +1,297 @@
+import re
+from functools import cached_property
+from typing import Tuple, Sequence, Optional, Union
+
+from mlir.ir import Type, Value, MemRefType, ShapedType, MLIRError
+
+from mlir_utils.dialects import memref
+from mlir_utils.dialects.ext.arith import Scalar, constant
+from mlir_utils.dialects.ext.tensor import (
+    _indices_to_indexer,
+    compute_result_shape_reassoc_list,
+)
+import mlir_utils.types as T
+from mlir_utils.util import (
+    register_value_caster,
+    get_user_code_loc,
+    maybe_cast,
+    get_result_or_results,
+)
+
+S = ShapedType.get_dynamic_size()
+
+
+def _alloc(
+    op_ctor,
+    sizes: Sequence[Union[int]],
+    element_type: Type,
+    *,
+    loc=None,
+    ip=None,
+):
+    if loc is None:
+        loc = get_user_code_loc()
+    dynamic_sizes = []
+    result_type = T.memref(*sizes, element_type)
+    return maybe_cast(
+        get_result_or_results(op_ctor(result_type, dynamic_sizes, [], loc=loc, ip=ip))
+    )
+
+
+def alloc(sizes: Sequence[Union[int, Value]], element_type: Type, *, loc=None, ip=None):
+    if loc is None:
+        loc = get_user_code_loc()
+    return maybe_cast(
+        get_result_or_results(
+            _alloc(memref.AllocOp, sizes, element_type, loc=loc, ip=ip)
+        )
+    )
+
+
+def alloca(
+    sizes: Sequence[Union[int, Value]], element_type: Type, *, loc=None, ip=None
+):
+    if loc is None:
+        loc = get_user_code_loc()
+    return maybe_cast(
+        get_result_or_results(
+            _alloc(memref.AllocaOp, sizes, element_type, loc=loc, ip=ip)
+        )
+    )
+
+
+def load(mem: Value, indices: Sequence[Value | int], *, loc=None, ip=None):
+    if loc is None:
+        loc = get_user_code_loc()
+    indices = list(indices)
+    for idx, i in enumerate(indices):
+        if isinstance(i, int):
+            indices[idx] = constant(i, index=True)
+    return maybe_cast(
+        get_result_or_results(memref.LoadOp.__base__(mem, indices, loc=loc, ip=ip))
+    )
+
+
+def store(
+    value: Value, mem: Value, indices: Sequence[Value | int], *, loc=None, ip=None
+):
+    if loc is None:
+        loc = get_user_code_loc()
+    indices = list(indices)
+    for idx, i in enumerate(indices):
+        if isinstance(i, int):
+            indices[idx] = constant(i, index=True)
+    return maybe_cast(
+        get_result_or_results(memref.StoreOp(value, mem, indices, loc=loc, ip=ip))
+    )
+
+
+def subview(
+    source: "MemRef",
+    static_offsets: Optional[Sequence[int]] = None,
+    static_sizes: Optional[Sequence[int]] = None,
+    static_strides: Optional[Sequence[int]] = None,
+    *,
+    loc=None,
+    ip=None,
+):
+    if loc is None:
+        loc = get_user_code_loc()
+    assert static_sizes, f"this convenience method only handles static sizes"
+    offsets = sizes = strides = []
+    result = T.memref(*static_sizes, source.dtype)
+    val = memref.subview(
+        result,
+        source,
+        offsets,
+        sizes,
+        strides,
+        static_offsets,
+        static_sizes,
+        static_strides,
+        loc=loc,
+        ip=ip,
+    )
+    # dumbest hack ever - the default builder doesn't connect to inferReturnTypes
+    # but the diag message does
+    try:
+        val.owner.verify()
+        return val
+    except MLIRError as e:
+        diag = str(e.error_diagnostics[0])
+        correct_type = re.findall(r"'memref<(.*)>'", diag)
+        assert len(correct_type) == 1
+        correct_type = Type.parse(f"memref<{correct_type[0]}>")
+        val.owner.erase()
+        return memref.subview(
+            correct_type,
+            source,
+            offsets,
+            sizes,
+            strides,
+            static_offsets,
+            static_sizes,
+            static_strides,
+            loc=loc,
+            ip=ip,
+        )
+
+
+@register_value_caster(MemRefType.static_typeid)
+class MemRef(Value):
+    def __str__(self):
+        return f"{self.__class__.__name__}({self.get_name()}, {self.type})"
+
+    def __repr__(self):
+        return str(self)
+
+    @staticmethod
+    def isinstance(other: Value):
+        return isinstance(other, Value) and MemRefType.isinstance(other.type)
+
+    @cached_property
+    def _shaped_type(self) -> ShapedType:
+        return ShapedType(self.type)
+
+    def has_static_shape(self) -> bool:
+        return self._shaped_type.has_static_shape
+
+    def has_rank(self) -> bool:
+        return self._shaped_type.has_rank
+
+    @cached_property
+    def shape(self) -> Tuple[int, ...]:
+        return tuple(self._shaped_type.shape)
+
+    @cached_property
+    def dtype(self) -> Type:
+        return self._shaped_type.element_type
+
+    def __getitem__(self, idx: tuple) -> "MemRef":
+        loc = get_user_code_loc()
+
+        if not self.has_rank():
+            raise ValueError("only ranked memref slicing/indexing supported")
+
+        if idx == Ellipsis or idx == slice(None):
+            return self
+        if isinstance(idx, tuple) and all(i == slice(None) for i in idx):
+            return self
+        if idx is None:
+            return expand_shape(self, (0,), loc=loc)
+
+        idx = list((idx,) if isinstance(idx, int) else idx)
+        for i, d in enumerate(idx):
+            if isinstance(d, int):
+                idx[i] = constant(d, index=True, loc=loc)
+
+        if all(isinstance(d, Scalar) for d in idx) and len(idx) == len(self.shape):
+            return load(self, idx, loc=loc)
+        else:
+            return _subview(self, tuple(idx), loc=loc)
+
+    def __setitem__(self, idx, source):
+        loc = get_user_code_loc()
+
+        if not self.has_rank():
+            raise ValueError("only ranked memref slicing/indexing supported")
+
+        idx = list((idx,) if isinstance(idx, int) else idx)
+        for i, d in enumerate(idx):
+            if isinstance(d, int):
+                idx[i] = constant(d, index=True, loc=loc)
+
+        if all(isinstance(d, Scalar) for d in idx) and len(idx) == len(self.shape):
+            assert isinstance(
+                source, Scalar
+            ), "coordinate insert requires scalar element"
+            store(source, self, idx, loc=loc)
+        else:
+            _copy_to_subview(self, source, tuple(idx), loc=loc)
+
+
+def expand_shape(
+    inp,
+    newaxis_dims,
+    *,
+    loc=None,
+    ip=None,
+) -> MemRef:
+    """Expand the shape of a memref.
+
+    Insert a new axis that will appear at the `axis` position in the expanded
+    memref shape.
+
+    Args:
+      inp: Input memref-like.
+      axis: Position in the expanded axes where the new axis (or axes) is placed.
+
+    Returns:
+       View of `a` with the number of dimensions increased.
+
+    """
+    if loc is None:
+        loc = get_user_code_loc()
+
+    if len(newaxis_dims) == 0:
+        return inp
+
+    result_shape, reassoc_list = compute_result_shape_reassoc_list(
+        inp.shape, newaxis_dims
+    )
+
+    return MemRef(
+        memref.expand_shape(
+            T.memref(*result_shape, inp.dtype), inp, reassoc_list, loc=loc, ip=ip
+        )
+    )
+
+
+def _subview(
+    mem: MemRef,
+    idx,
+    *,
+    loc=None,
+    ip=None,
+) -> MemRef:
+    if loc is None:
+        loc = get_user_code_loc()
+
+    indexer = _indices_to_indexer(idx, mem.shape)
+    out = mem
+
+    if indexer.is_constant():
+        out = subview(
+            out,
+            static_offsets=indexer.static_offsets(),
+            static_sizes=indexer.static_sizes(),
+            static_strides=indexer.static_strides(),
+            loc=loc,
+            ip=ip,
+        )
+    else:
+        raise ValueError(f"non-constant indices not supported {indexer}")
+
+    # This adds newaxis/None dimensions.
+    return expand_shape(out, indexer.newaxis_dims, loc=loc, ip=ip)
+
+
+def _copy_to_subview(
+    dest: MemRef,
+    source: MemRef,
+    idx,
+    *,
+    loc=None,
+    ip=None,
+):
+    if loc is None:
+        loc = get_user_code_loc()
+    if isinstance(source, Scalar):
+        source = expand_shape(source, (0,), loc=loc, ip=ip)
+
+    dest_subview = _subview(dest, idx, loc=loc, ip=ip)
+    assert (
+        dest_subview.shape == source.shape
+    ), f"Expected matching shape for dest subview {dest_subview.shape} and source {source.shape=}"
+
+    return memref.copy(source, dest_subview, loc=loc, ip=ip)