// RUN: hlo_to_llvm_ir --ptx --sm=60 %s | FileCheck %s

// Codegen test for a row reduction: the tool output produced by the command
// above must contain four two-element f32 vector global loads
// (ld.global.nc.v2.f32), matched in order by the directives below.
HloModule ReduceTileFit

// CHECK: ld.global.nc.v2.f32
// CHECK: ld.global.nc.v2.f32
// CHECK: ld.global.nc.v2.f32
// CHECK: ld.global.nc.v2.f32
// Reduction combiner: takes two scalar f32 parameters and returns the larger
// of the two.
%max_ {
  %x = f32[] parameter(0)
  %y = f32[] parameter(1)
  ROOT %maximum.7 = f32[] maximum(f32[] %x, f32[] %y)
}
// Entry computation: reduces the f32[5,122880] input along dimension 1 using
// %max_ as the combiner, producing one f32 value per row (f32[5]).
// The init value is the constant 0, so each output is max(0, row maximum).
ENTRY %main {
  %param_0 = f32[5,122880] parameter(0)
  %constant.3 = f32[] constant(0)
  ROOT %reduce.8 = f32[5] reduce(f32[5,122880] %param_0, f32[] %constant.3), dimensions={1}, to_apply=%max_
}