Clarify the column-reduction tiling comment in ir_emission_utils.cc: only tile_size_y needs to be large.
diff --git a/tensorflow/compiler/xla/service/gpu/ir_emission_utils.cc b/tensorflow/compiler/xla/service/gpu/ir_emission_utils.cc
index b5c197f..78f8e22 100644
--- a/tensorflow/compiler/xla/service/gpu/ir_emission_utils.cc
+++ b/tensorflow/compiler/xla/service/gpu/ir_emission_utils.cc
@@ -220,7 +220,7 @@
}
// For column reduction, the tile block is tize_size_y x tile_size_x, and we
- // are reducing along tile_size_y. tile_size_y needs to be
+ // are reducing along tile_size_y. Only tile_size_y needs to be
// large enough to make the tiling implementation efficient.
return dims_in_elem[1] >= kWarpSize;
}