Home
last modified time | relevance | path

Searched refs:kernelPm (Results 1 – 4 of 4) sorted by relevance

/external/tensorflow/tensorflow/compiler/xla/service/mlir_gpu/
Dkernel_lowering.cc185 auto& kernelPm = pm.nest<::mlir::gpu::GPUModuleOp>(); in LowerKernelBodiesToNVVM() local
186 kernelPm.addPass(::mlir::createLowerToCFGPass()); in LowerKernelBodiesToNVVM()
187 kernelPm.addPass(absl::make_unique<LowerToNVVMPass>()); in LowerKernelBodiesToNVVM()
189 kernelPm.addNestedPass<::mlir::FuncOp>(::mlir::createCanonicalizerPass()); in LowerKernelBodiesToNVVM()
190 kernelPm.addNestedPass<::mlir::FuncOp>(::mlir::createCSEPass()); in LowerKernelBodiesToNVVM()
255 auto& kernelPm = pm.nest<::mlir::gpu::GPUModuleOp>(); in LowerKernelBodiesToROCDL() local
256 kernelPm.addPass(::mlir::createLowerToCFGPass()); in LowerKernelBodiesToROCDL()
257 kernelPm.addPass(absl::make_unique<LowerToROCDLPass>()); in LowerKernelBodiesToROCDL()
260 kernelPm.addNestedPass<::mlir::FuncOp>(::mlir::createCanonicalizerPass()); in LowerKernelBodiesToROCDL()
261 kernelPm.addNestedPass<::mlir::FuncOp>(::mlir::createCSEPass()); in LowerKernelBodiesToROCDL()
[all …]
/external/llvm-project/mlir/tools/mlir-cuda-runner/
Dmlir-cuda-runner.cpp114 auto &kernelPm = pm.nest<gpu::GPUModuleOp>(); in runMLIRPasses() local
115 kernelPm.addPass(createStripDebugInfoPass()); in runMLIRPasses()
116 kernelPm.addPass(createLowerGpuOpsToNVVMOpsPass()); in runMLIRPasses()
117 kernelPm.addPass(createConvertGPUKernelToBlobPass( in runMLIRPasses()
/external/llvm-project/mlir/tools/mlir-rocm-runner/
Dmlir-rocm-runner.cpp311 auto &kernelPm = pm.nest<gpu::GPUModuleOp>(); in runMLIRPasses() local
312 kernelPm.addPass(createStripDebugInfoPass()); in runMLIRPasses()
313 kernelPm.addPass(createLowerGpuOpsToROCDLOpsPass()); in runMLIRPasses()
314 kernelPm.addPass(createConvertGPUKernelToBlobPass( in runMLIRPasses()
/external/tensorflow/tensorflow/compiler/mlir/tools/kernel_gen/
Dkernel_creator.cc361 auto& kernelPm = pm.nest<::mlir::gpu::GPUModuleOp>(); in LowerKernelBodiesToLowLevelIr() local
362 kernelPm.addPass(::mlir::createLowerToCFGPass()); in LowerKernelBodiesToLowLevelIr()
364 kernelPm.addPass(mlir::kernel_gen::transforms::CreateGpuKernelToRocdlPass()); in LowerKernelBodiesToLowLevelIr()
366 kernelPm.addPass(mlir::kernel_gen::transforms::CreateGpuKernelToNvvmPass()); in LowerKernelBodiesToLowLevelIr()