// bits[0:N] = sub-vector element offset
// bits[N:M] = vector index
// clang-format on
- int64_t N =
+ int64_t n =
llvm::Log2_64(kDefaultVectorSizeBits / memrefTy.getElementTypeBitWidth());
- int64_t M = llvm::Log2_64(memrefTy.getDimSize(tgtDim));
+ int64_t m = llvm::Log2_64(memrefTy.getDimSize(tgtDim));
// Capture bits[0:(M-N)] of src by first creating a (M-N) mask.
- int64_t mask = (1LL << (M - N)) - 1;
+ int64_t mask = (1LL << (m - n)) - 1;
if (permuteEveryN > 1)
mask = mask << llvm::Log2_64(permuteEveryN);
Value srcBits = b.create<arith::ConstantIndexOp>(loc, mask);
// Use the src bits to permute the target bits b[N:M] containing the
// vector offset.
if (permuteEveryN > 1) {
- int64_t shlBits = N - llvm::Log2_64(permuteEveryN);
+ int64_t shlBits = n - llvm::Log2_64(permuteEveryN);
if (shlBits > 0) {
Value finalShiftVal = b.create<arith::ConstantIndexOp>(loc, shlBits);
srcBits = b.createOrFold<arith::ShLIOp>(loc, srcBits, finalShiftVal);
srcBits = b.createOrFold<arith::ShRUIOp>(loc, srcBits, finalShiftVal);
}
} else {
- Value finalShiftVal = b.create<arith::ConstantIndexOp>(loc, N);
+ Value finalShiftVal = b.create<arith::ConstantIndexOp>(loc, n);
srcBits = b.createOrFold<arith::ShLIOp>(loc, srcBits, finalShiftVal);
}