40
40
#include " llvm/ADT/TypeSwitch.h"
41
41
#include " llvm/Support/Debug.h"
42
42
#include " llvm/Support/ErrorHandling.h"
43
+ #include " llvm/Support/InterleavedRange.h"
43
44
#include < type_traits>
44
45
45
46
using namespace mlir ;
@@ -450,20 +451,14 @@ static DiagnosedSilenceableFailure rewriteOneForallCommonImpl(
450
451
// Otherwise, we have a new insertion without a size -> use size 1.
451
452
tmpMappingSizes.push_back (1 );
452
453
}
453
- LLVM_DEBUG (
454
- llvm::interleaveComma (
455
- tmpMappingSizes,
456
- DBGS () << " ----tmpMappingSizes extracted from scf.forall op: " );
457
- llvm::dbgs () << " \n " );
454
+ LDBG (" ----tmpMappingSizes extracted from scf.forall op: "
455
+ << llvm::interleaved (tmpMappingSizes));
458
456
459
457
// Step 2. sort the values by the corresponding DeviceMappingAttrInterface.
460
458
SmallVector<int64_t > forallMappingSizes = getValuesSortedByKey (
461
459
forallMappingAttrs.getArrayRef (), tmpMappingSizes, comparator);
462
- LLVM_DEBUG (llvm::interleaveComma (forallMappingSizes,
463
- DBGS () << " ----forallMappingSizes: " );
464
- llvm::dbgs () << " \n " ; llvm::interleaveComma (
465
- forallMappingAttrs, DBGS () << " ----forallMappingAttrs: " );
466
- llvm::dbgs () << " \n " );
460
+ LDBG (" ----forallMappingSizes: " << llvm::interleaved (forallMappingSizes));
461
+ LDBG (" ----forallMappingAttrs: " << llvm::interleaved (forallMappingAttrs));
467
462
468
463
// Step 3. Generate the mappingIdOps using the provided generator.
469
464
Location loc = forallOp.getLoc ();
@@ -501,17 +496,10 @@ static DiagnosedSilenceableFailure rewriteOneForallCommonImpl(
501
496
SmallVector<int64_t > availableMappingSizes =
502
497
builderResult.availableMappingSizes ;
503
498
SmallVector<Value> activeIdOps = builderResult.activeIdOps ;
504
- // clang-format off
505
- LLVM_DEBUG (
506
- llvm::interleaveComma (
507
- activeMappingSizes, DBGS () << " ----activeMappingSizes: " );
508
- llvm::dbgs () << " \n " ;
509
- llvm::interleaveComma (
510
- availableMappingSizes, DBGS () << " ----availableMappingSizes: " );
511
- llvm::dbgs () << " \n " ;
512
- llvm::interleaveComma (activeIdOps, DBGS () << " ----activeIdOps: " );
513
- llvm::dbgs () << " \n " );
514
- // clang-format on
499
+ LDBG (" ----activeMappingSizes: " << llvm::interleaved (activeMappingSizes));
500
+ LDBG (" ----availableMappingSizes: "
501
+ << llvm::interleaved (availableMappingSizes));
502
+ LDBG (" ----activeIdOps: " << llvm::interleaved (activeIdOps));
515
503
for (auto [activeId, activeMappingSize, availableMappingSize] :
516
504
llvm::zip_equal (activeIdOps, activeMappingSizes,
517
505
availableMappingSizes)) {
@@ -566,11 +554,9 @@ static DiagnosedSilenceableFailure rewriteOneForallCommonImpl(
566
554
// Step 8. Erase old op.
567
555
rewriter.eraseOp (forallOp);
568
556
569
- LLVM_DEBUG (llvm::interleaveComma (forallMappingSizes,
570
- DBGS () << " ----result forallMappingSizes: " );
571
- llvm::dbgs () << " \n " ; llvm::interleaveComma (
572
- mappingIdOps, DBGS () << " ----result mappingIdOps: " );
573
- llvm::dbgs () << " \n " );
557
+ LDBG (" ----result forallMappingSizes: "
558
+ << llvm::interleaved (forallMappingSizes));
559
+ LDBG (" ----result mappingIdOps: " << llvm::interleaved (mappingIdOps));
574
560
575
561
result = ForallRewriteResult{forallMappingSizes, mappingIdOps};
576
562
return DiagnosedSilenceableFailure::success ();
@@ -740,7 +726,7 @@ static DiagnosedSilenceableFailure checkMappingSpec(
740
726
auto diag = definiteFailureHelper (
741
727
transformOp, forallOp,
742
728
Twine (" 3-D mapping: size of threadIdx.x must be a multiple of " ) +
743
- std::to_string (factor));
729
+ Twine (factor));
744
730
return diag;
745
731
}
746
732
if (computeProduct (numParallelIterations) * factor >
@@ -749,9 +735,9 @@ static DiagnosedSilenceableFailure checkMappingSpec(
749
735
transformOp, forallOp,
750
736
Twine (" the number of required parallel resources (blocks or "
751
737
" threads) " ) +
752
- std::to_string (computeProduct (numParallelIterations) * factor) +
753
- std::string ( " overflows the number of available resources " ) +
754
- std::to_string (computeProduct (blockOrGridSizes)));
738
+ Twine (computeProduct (numParallelIterations) * factor) +
739
+ " overflows the number of available resources " +
740
+ Twine (computeProduct (blockOrGridSizes)));
755
741
return diag;
756
742
}
757
743
return DiagnosedSilenceableFailure::success ();
0 commit comments