Use ForLoopSpecializationPass to help with vectorization of kernels.
PiperOrigin-RevId: 317843378 Change-Id: I4ead02c24f957269888af5491934567cd3e311fb
This commit is contained in:
parent
8eea0658d4
commit
af94e801cf
@ -505,6 +505,11 @@ Status LowerLHLOToGPU(mlir::ModuleOp module, LowerLHLOToGPUOptions options) {
|
||||
// Some basic cleanup.
|
||||
pm.addNestedPass<::mlir::FuncOp>(::mlir::createCanonicalizerPass());
|
||||
pm.addNestedPass<::mlir::FuncOp>(::mlir::createCSEPass());
|
||||
// Make loops with min bounds into a conditional plus static bounds.
|
||||
// Only do this if we unrolled in the first place.
|
||||
if (!options.unroll_factors.empty()) {
|
||||
pm.addNestedPass<::mlir::FuncOp>(mlir::createForLoopSpecializationPass());
|
||||
}
|
||||
// Approximate if requested.
|
||||
if (options.use_approximations) {
|
||||
pm.addNestedPass<::mlir::FuncOp>(
|
||||
|
||||
Loading…
x
Reference in New Issue
Block a user