better MaterializeMergeSchedule.cpp with %lane indexed batch computes

support for tensors of index values
2026-05-22 21:52:28 +02:00
parent 495186503c
commit c77ffa9c56
20 changed files with 398 additions and 300 deletions
@@ -31,13 +31,6 @@ static bool isExplicitHostOperand(Operation* op, unsigned operandIndex) {
  return false;
 }

-static int64_t getValueSizeInBytes(Value value) {
-  auto type = dyn_cast<ShapedType>(value.getType());
-  if (!type || !type.hasStaticShape())
-    return -1;
-  return type.getNumElements() * type.getElementTypeBitWidth() / 8;
-}
-
 template <typename CoreOpTy>
 static void materializeHostConstantsInCore(CoreOpTy coreOp,
                                           IRRewriter& rewriter,
@@ -82,7 +75,9 @@ static void materializeHostConstantsInCore(CoreOpTy coreOp,
        continue;
      }

-      int64_t totalBytes = getValueSizeInBytes(originalValue);
+      int64_t totalBytes = -1;
+      if (auto type = dyn_cast<ShapedType>(originalValue.getType()); type && type.hasStaticShape())
+        totalBytes = static_cast<int64_t>(getShapedTypeSizeInBytes(type));
      if (totalBytes < 0 || !llvm::isInt<32>(totalBytes) || !llvm::isInt<32>(resolvedAddress->byteOffset)) {
        op->emitOpError("host constant materialization requires 32-bit copy sizes and offsets");
        hasFailure = true;