tests/e2e/matmul/large_linalg_matmul.mlir - 3p/openxla/iree - Git at Google

 // Test large aligned linalg matmul to make sure we go through the optimized
 // path for GPUs.
 func.func @large_aligned() {
   %lhs = util.unfoldable_constant dense<1.0> : tensor<2048x1024xf32>
   %rhs = util.unfoldable_constant dense<0.4> : tensor<1024x512xf32>
   %c0 = arith.constant 0.0 : f32
   %init = linalg.init_tensor[2048, 512] : tensor<2048x512xf32>
   %CC = linalg.fill ins(%c0 : f32) outs(%init : tensor<2048x512xf32>) -> tensor<2048x512xf32>
   %D = linalg.matmul ins(%lhs, %rhs: tensor<2048x1024xf32>, tensor<1024x512xf32>)
                     outs(%CC: tensor<2048x512xf32>) -> tensor<2048x512xf32>
   check.expect_almost_eq_const(%D, dense<409.596> : tensor<2048x512xf32>) : tensor<2048x512xf32>
   return
 }
	// Test large aligned linalg matmul to make sure we go through the optimized
	// path for GPUs.
	func.func @large_aligned() {
	%lhs = util.unfoldable_constant dense<1.0> : tensor<2048x1024xf32>
	%rhs = util.unfoldable_constant dense<0.4> : tensor<1024x512xf32>
	%c0 = arith.constant 0.0 : f32
	%init = linalg.init_tensor[2048, 512] : tensor<2048x512xf32>
	%CC = linalg.fill ins(%c0 : f32) outs(%init : tensor<2048x512xf32>) -> tensor<2048x512xf32>
	%D = linalg.matmul ins(%lhs, %rhs: tensor<2048x1024xf32>, tensor<1024x512xf32>)
	outs(%CC: tensor<2048x512xf32>) -> tensor<2048x512xf32>
	check.expect_almost_eq_const(%D, dense<409.596> : tensor<2048x512xf32>) : tensor<2048x512xf32>
	return
	}