| // RUN: hlo_to_llvm_ir --ptx --sm=50 %s | FileCheck %s |
| |
| HloModule ReduceTileFit |
| |
| // Expectation for --sm=50: the reduction input is read with eight scalar |
| // f32 loads and never with the two-wide vector form. A negative directive |
| // only covers the output up to the next positive match, so it is repeated |
| // before every positive match and once more after the last one. |
| // CHECK-NOT: ld.global.nc.v2.f32 |
| // CHECK: ld.global.nc.f32 |
| // CHECK-NOT: ld.global.nc.v2.f32 |
| // CHECK: ld.global.nc.f32 |
| // CHECK-NOT: ld.global.nc.v2.f32 |
| // CHECK: ld.global.nc.f32 |
| // CHECK-NOT: ld.global.nc.v2.f32 |
| // CHECK: ld.global.nc.f32 |
| // CHECK-NOT: ld.global.nc.v2.f32 |
| // CHECK: ld.global.nc.f32 |
| // CHECK-NOT: ld.global.nc.v2.f32 |
| // CHECK: ld.global.nc.f32 |
| // CHECK-NOT: ld.global.nc.v2.f32 |
| // CHECK: ld.global.nc.f32 |
| // CHECK-NOT: ld.global.nc.v2.f32 |
| // CHECK: ld.global.nc.f32 |
| // CHECK-NOT: ld.global.nc.v2.f32 |
| |
| // Reducer computation: returns the maximum of its two scalar f32 operands. |
| %max_ { |
| %lhs = f32[] parameter(0) |
| %rhs = f32[] parameter(1) |
| ROOT %larger = f32[] maximum(%lhs, %rhs) |
| } |
| |
| // Entry computation: reduces a f32[5,122880] operand along dimension 1 with |
| // %max_, producing f32[5]. |
| // NOTE(review): the init value is 0 rather than the identity of max; this |
| // presumably does not matter because only the emitted loads are inspected. |
| // Confirm. |
| ENTRY %main { |
| %input = f32[5,122880] parameter(0) |
| %init = f32[] constant(0) |
| ROOT %reduce.8 = f32[5] reduce(%input, %init), dimensions={1}, to_apply=%max_ |
| } |