| /* Copyright 2015 The TensorFlow Authors. All Rights Reserved. |
| |
| Licensed under the Apache License, Version 2.0 (the "License"); |
| you may not use this file except in compliance with the License. |
| You may obtain a copy of the License at |
| |
| http://www.apache.org/licenses/LICENSE-2.0 |
| |
| Unless required by applicable law or agreed to in writing, software |
| distributed under the License is distributed on an "AS IS" BASIS, |
| WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| See the License for the specific language governing permissions and |
| limitations under the License. |
| ==============================================================================*/ |
| |
| #include "tensorflow/core/kernels/xent_op.h" |
| #include "tensorflow/core/common_runtime/kernel_benchmark_testlib.h" |
| #include "tensorflow/core/framework/tensor.h" |
| #include "tensorflow/core/platform/test.h" |
| #include "tensorflow/core/platform/test_benchmark.h" |
| |
| namespace tensorflow { |
| |
| static Graph* Xent(int batch_size, int num_classes) { |
| Graph* g = new Graph(OpRegistry::Global()); |
| Tensor logits(DT_FLOAT, TensorShape({batch_size, num_classes})); |
| logits.flat<float>().setRandom(); |
| Tensor labels(DT_FLOAT, TensorShape({batch_size, num_classes})); |
| labels.flat<float>().setRandom(); |
| test::graph::Binary(g, "SoftmaxCrossEntropyWithLogits", |
| test::graph::Constant(g, logits), |
| test::graph::Constant(g, labels)); |
| return g; |
| } |
| |
// Defines and registers one benchmark function named
// BM_Xent_<BATCH>_<CLASS>_<DEVICE>.
//
//   BATCH  - batch size forwarded to Xent(); also part of the function name.
//   CLASS  - number of classes forwarded to Xent(); also part of the name.
//   DEVICE - device identifier; stringified and handed to test::Benchmark.
//
// Each generated function reports iters * BATCH * CLASS processed items
// (computed in 64 bits) and then runs the Xent graph for `iters` iterations.
#define BM_XentDev(BATCH, CLASS, DEVICE)                                  \
  static void BM_Xent_##BATCH##_##CLASS##_##DEVICE(int iters) {           \
    const int64 total_items = static_cast<int64>(iters) * BATCH * CLASS;  \
    testing::ItemsProcessed(total_items);                                 \
    test::Benchmark bench(#DEVICE, Xent(BATCH, CLASS));                   \
    bench.Run(iters);                                                     \
  }                                                                       \
  BENCHMARK(BM_Xent_##BATCH##_##CLASS##_##DEVICE);
| |
| /// The representative tests for ptb_word on GPU |
| BM_XentDev(16, 10000, gpu); |
| BM_XentDev(16, 30000, gpu); |
| BM_XentDev(16, 100000, gpu); |
| |
| BM_XentDev(32, 10000, gpu); |
| BM_XentDev(32, 30000, gpu); |
| BM_XentDev(32, 100000, gpu); |
| |
| BM_XentDev(64, 10000, gpu); |
| BM_XentDev(64, 30000, gpu); |
| BM_XentDev(64, 100000, gpu); |
| |
| /// Only the smaller tests for CPU. Otherwise, it's too slow |
| BM_XentDev(16, 10000, cpu); |
| BM_XentDev(32, 10000, cpu); |
| BM_XentDev(64, 10000, cpu); |
| |
| } // end namespace tensorflow |