test/cpp/aot_inductor/test.cpp - platform/external/pytorch - Git at Google

 #include <gtest/gtest.h>
 #include <string>
 #include <vector>

 #include <c10/cuda/CUDAStream.h>
 #include <torch/csrc/inductor/aot_inductor_interface.h>
 #include <torch/torch.h>

 namespace torch {
 namespace aot_inductor {

 struct Net : torch::nn::Module {
   Net() : linear(register_module("linear", torch::nn::Linear(64, 10))) {}

   torch::Tensor forward(torch::Tensor x, torch::Tensor y) {
     return linear(torch::sin(x) + torch::cos(y));
   }
   torch::nn::Linear linear;
 };

 TEST(AotInductorTest, BasicTest) {
   torch::NoGradGuard no_grad;
   Net net;
   net.to(torch::kCUDA);

   torch::Tensor x =
       at::randn({32, 64}, at::dtype(at::kFloat).device(at::kCUDA));
   torch::Tensor y =
       at::randn({32, 64}, at::dtype(at::kFloat).device(at::kCUDA));
   torch::Tensor results_ref = net.forward(x, y);

   // TODO: we need to provide an API to concatenate args and weights
   std::vector<torch::Tensor> inputs;
   for (const auto& pair : net.named_parameters()) {
     inputs.push_back(pair.value());
   }
   inputs.push_back(x);
   inputs.push_back(y);

   AOTInductorModelContainerHandle container_handle;
   AOT_INDUCTOR_ERROR_CHECK(
       AOTInductorModelContainerCreate(&container_handle, 1 /*num_models*/))
   AOTInductorParamShape output_shape;
   AOT_INDUCTOR_ERROR_CHECK(AOTInductorModelContainerGetMaxOutputShape(
       container_handle, 0 /*output_idx*/, &output_shape));

   c10::IntArrayRef array_size(output_shape.shape_data, output_shape.ndim);
   torch::Tensor output_tensor =
       at::zeros(array_size, at::dtype(at::kFloat).device(at::kCUDA));
   std::vector<torch::Tensor> outputs;
   outputs.push_back(output_tensor);

   const auto& cuda_stream = at::cuda::getCurrentCUDAStream(0 /*device_index*/);
   const auto stream_id = cuda_stream.stream();
   AOTInductorStreamHandle stream_handle =
       reinterpret_cast<AOTInductorStreamHandle>(stream_id);
   AOTInductorTensorHandle inputs_handle =
       reinterpret_cast<AOTInductorTensorHandle>(inputs.data());
   AOTInductorTensorHandle outputs_handle =
       reinterpret_cast<AOTInductorTensorHandle>(outputs.data());
   AOT_INDUCTOR_ERROR_CHECK(AOTInductorModelContainerRun(
       container_handle,
       inputs_handle,
       inputs.size(),
       outputs_handle,
       outputs.size(),
       stream_handle));

   ASSERT_TRUE(torch::allclose(results_ref, outputs[0]));
   AOT_INDUCTOR_ERROR_CHECK(AOTInductorModelContainerDelete(container_handle));
 }

 } // namespace aot_inductor
 } // namespace torch
	#include <gtest/gtest.h>
	#include <string>
	#include <vector>

	#include <c10/cuda/CUDAStream.h>
	#include <torch/csrc/inductor/aot_inductor_interface.h>
	#include <torch/torch.h>

	namespace torch {
	namespace aot_inductor {

	struct Net : torch::nn::Module {
	Net() : linear(register_module("linear", torch::nn::Linear(64, 10))) {}

	torch::Tensor forward(torch::Tensor x, torch::Tensor y) {
	return linear(torch::sin(x) + torch::cos(y));
	}
	torch::nn::Linear linear;
	};

	TEST(AotInductorTest, BasicTest) {
	torch::NoGradGuard no_grad;
	Net net;
	net.to(torch::kCUDA);

	torch::Tensor x =
	at::randn({32, 64}, at::dtype(at::kFloat).device(at::kCUDA));
	torch::Tensor y =
	at::randn({32, 64}, at::dtype(at::kFloat).device(at::kCUDA));
	torch::Tensor results_ref = net.forward(x, y);

	// TODO: we need to provide an API to concatenate args and weights
	std::vector<torch::Tensor> inputs;
	for (const auto& pair : net.named_parameters()) {
	inputs.push_back(pair.value());
	}
	inputs.push_back(x);
	inputs.push_back(y);

	AOTInductorModelContainerHandle container_handle;
	AOT_INDUCTOR_ERROR_CHECK(
	AOTInductorModelContainerCreate(&container_handle, 1 /num_models/))
	AOTInductorParamShape output_shape;
	AOT_INDUCTOR_ERROR_CHECK(AOTInductorModelContainerGetMaxOutputShape(
	container_handle, 0 /output_idx/, &output_shape));

	c10::IntArrayRef array_size(output_shape.shape_data, output_shape.ndim);
	torch::Tensor output_tensor =
	at::zeros(array_size, at::dtype(at::kFloat).device(at::kCUDA));
	std::vector<torch::Tensor> outputs;
	outputs.push_back(output_tensor);

	const auto& cuda_stream = at::cuda::getCurrentCUDAStream(0 /device_index/);
	const auto stream_id = cuda_stream.stream();
	AOTInductorStreamHandle stream_handle =
	reinterpret_cast<AOTInductorStreamHandle>(stream_id);
	AOTInductorTensorHandle inputs_handle =
	reinterpret_cast<AOTInductorTensorHandle>(inputs.data());
	AOTInductorTensorHandle outputs_handle =
	reinterpret_cast<AOTInductorTensorHandle>(outputs.data());
	AOT_INDUCTOR_ERROR_CHECK(AOTInductorModelContainerRun(
	container_handle,
	inputs_handle,
	inputs.size(),
	outputs_handle,
	outputs.size(),
	stream_handle));

	ASSERT_TRUE(torch::allclose(results_ref, outputs[0]));
	AOT_INDUCTOR_ERROR_CHECK(AOTInductorModelContainerDelete(container_handle));
	}

	} // namespace aot_inductor
	} // namespace torch