Lines Matching defs:numThreads
336 /// Returns true if the maximum tile offset `tileSize * numThreads-1` is less
339 OpFoldResult numThreads,
342 std::optional<int64_t> numThreadsConst = getConstantIntValue(numThreads);
369 ArrayRef<OpFoldResult> numThreads, SmallVector<Range> loopRanges,
379 numThreads, [](OpFoldResult ofr) { return !isConstantIntValue(ofr, 0); });
384 bool overflow = loopIdx >= numThreads.size();
385 bool isZero = !overflow && isConstantIntValue(numThreads[loopIdx], 0);
596 ArrayRef<OpFoldResult> numThreads, ArrayRef<OpFoldResult> tileSizes,
632 if (!tileSizes.empty() && tileSizes.size() != numThreads.size())
637 if (redDims.front() >= numThreads.size())
643 op.generateInitialTensorForPartialReduction(b, loc, numThreads,
658 numThreads, [](OpFoldResult ofr) { return !isConstantIntValue(ofr, 0); });
670 calculateTileOffsetsAndSizes(b, loc, forallOp, numThreads, iterationDomain,
689 SmallVector<OpFoldResult> strides(numThreads.size(), b.getIndexAttr(1));
690 SmallVector<OpFoldResult> outOffsets(numThreads.size(),
760 for (int64_t i = 0, e = numThreads.size(); i < e; ++i) {