mlir/test/Dialect/SparseTensor/sparse_relu.mlir - llvm-project - Git at Google

 // RUN: mlir-opt %s --sparsification-and-bufferization | FileCheck %s

 #map = affine_map<(d0, d1, d2) -> (d0, d1, d2)>

 #sparse = #sparse_tensor.encoding<{
     map = (d0, d1, d2) -> (d0 : dense, d1 : dense, d2 : compressed)
 }>

 //
 // Make sure a simple ReLU passes the sparsifier
 //
 // CHECK-LABEL: func.func @relu
 // CHECK:       scf.for
 // CHECK:         scf.for
 // CHECK:           scf.for
 // CHECK:             arith.cmpf ugt
 // CHECK:             arith.select
 //
 func.func @relu(%arg0: tensor<10x20x30xf64, #sparse>) -> tensor<10x20x30xf64, #sparse> {
   %cst = arith.constant 0.000000e+00 : f64
   %0 = tensor.empty() : tensor<10x20x30xf64>
   %1 = linalg.generic {
       indexing_maps = [#map, #map],
       iterator_types = ["parallel", "parallel", "parallel"]}
       ins(%arg0 : tensor<10x20x30xf64, #sparse>)
       outs(%0 : tensor<10x20x30xf64>) {
   ^bb0(%in: f64, %out: f64):
       %2 = arith.cmpf ugt, %in, %cst : f64
       %3 = arith.select %2, %in, %cst : f64
       linalg.yield %3 : f64
   } -> tensor<10x20x30xf64>
   %cast = tensor.cast %1 : tensor<10x20x30xf64> to tensor<10x20x30xf64, #sparse>
   return %cast : tensor<10x20x30xf64, #sparse>
 }
	// RUN: mlir-opt %s --sparsification-and-bufferization \| FileCheck %s

	#map = affine_map<(d0, d1, d2) -> (d0, d1, d2)>

	#sparse = #sparse_tensor.encoding<{
	map = (d0, d1, d2) -> (d0 : dense, d1 : dense, d2 : compressed)
	}>

	//
	// Make sure a simple ReLU passes the sparsifier
	//
	// CHECK-LABEL: func.func @relu
	// CHECK: scf.for
	// CHECK: scf.for
	// CHECK: scf.for
	// CHECK: arith.cmpf ugt
	// CHECK: arith.select
	//
	func.func @relu(%arg0: tensor<10x20x30xf64, #sparse>) -> tensor<10x20x30xf64, #sparse> {
	%cst = arith.constant 0.000000e+00 : f64
	%0 = tensor.empty() : tensor<10x20x30xf64>
	%1 = linalg.generic {
	indexing_maps = [#map, #map],
	iterator_types = ["parallel", "parallel", "parallel"]}
	ins(%arg0 : tensor<10x20x30xf64, #sparse>)
	outs(%0 : tensor<10x20x30xf64>) {
	^bb0(%in: f64, %out: f64):
	%2 = arith.cmpf ugt, %in, %cst : f64
	%3 = arith.select %2, %in, %cst : f64
	linalg.yield %3 : f64
	} -> tensor<10x20x30xf64>
	%cast = tensor.cast %1 : tensor<10x20x30xf64> to tensor<10x20x30xf64, #sparse>
	return %cast : tensor<10x20x30xf64, #sparse>
	}