#include <catch.hpp>

#include <torch/nn/module.h>
#include <torch/nn/modules/batchnorm.h>
#include <torch/nn/modules/conv.h>
#include <torch/nn/modules/dropout.h>
#include <torch/nn/modules/embedding.h>
#include <torch/nn/modules/functional.h>
#include <torch/nn/modules/linear.h>
#include <torch/tensor.h>

#include <test/cpp/api/util.h>

using namespace torch;
using namespace torch::nn;

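// TestModel registers three Linear submodules under the names "l1", "l2" and
// "l3"; the "param" section below checks that they surface with dotted paths
// (e.g. "test.l1.weight") when TestModel is nested inside another module.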
class TestModel : public Module {
 public:
  TestModel() {
    l1 = register_module("l1", Linear(10, 3).build());
    l2 = register_module("l2", Linear(3, 5).build());
    l3 = register_module("l3", Linear(5, 100).build());
  }

  std::vector<Variable> forward(std::vector<Variable> input) {
    return input;
  }

  std::shared_ptr<Linear> l1, l2, l3;
};

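// NestedModel nests a TestModel under the name "test" and registers a raw
// parameter of shape (3, 2, 21), so its parameter map should contain both
// "param" and dotted submodule paths such as "test.l2.weight".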
class NestedModel : public Module {
 public:
  NestedModel() {
    l1 = register_module("l1", Linear(5, 20).build());
    t = register_module("test", std::make_shared<TestModel>());
    param_ =
        register_parameter("param", at::CPU(at::kFloat).tensor({3, 2, 21}));
  }

  std::vector<Variable> forward(std::vector<Variable> input) {
    return input;
  }

  Variable param_;
  std::shared_ptr<Linear> l1;
  std::shared_ptr<TestModel> t;
};

| TEST_CASE("containers") { |
| SECTION("conv") { |
| SECTION("1d") { |
| auto model = Conv1d(3, 2, 3).stride(2).build(); |
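      // Input is (N=2, C_in=3, L=5); with kernel size 3 and stride 2 the
      // output length is (5 - 3) / 2 + 1 = 2, so every output dimension
      // (batch, C_out, L_out) equals 2.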
      auto x = Var(at::CPU(at::kFloat).randn({2, 3, 5}), true);
      auto y = model->forward({x})[0];
      Variable s = y.sum();

      s.backward();
      REQUIRE(y.ndimension() == 3);
      REQUIRE(s.ndimension() == 0);
      for (auto i = 0; i < 3; i++) {
        REQUIRE(y.size(i) == 2);
      }

      REQUIRE(model->parameters()["weight"].grad().numel() == 3 * 2 * 3);
    }
| SECTION("2d") { |
| SECTION("even") { |
| auto model = Conv2d(3, 2, 3).stride(2).build(); |
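        // Square case: each spatial dimension is (5 - 3) / 2 + 1 = 2, and the
        // weight gradient has 3 * 2 * 3 * 3 elements (C_in, C_out, kH, kW).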
        auto x = Var(at::CPU(at::kFloat).randn({2, 3, 5, 5}), true);
        auto y = model->forward({x})[0];
        Variable s = y.sum();

        s.backward();
        REQUIRE(y.ndimension() == 4);
        REQUIRE(s.ndimension() == 0);
        for (auto i = 0; i < 4; i++) {
          REQUIRE(y.size(i) == 2);
        }

        REQUIRE(
            model->parameters()["weight"].grad().numel() == 3 * 2 * 3 * 3);
      }

| SECTION("uneven") { |
| auto model = Conv2d(3, 2, {3, 2}).stride({2, 2}).build(); |
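        // Rectangular kernel on a (5, 4) input: H_out = (5 - 3) / 2 + 1 = 2
        // and W_out = (4 - 2) / 2 + 1 = 2, so all four dimensions are again 2.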
        auto x = Var(at::CPU(at::kFloat).randn({2, 3, 5, 4}), true);
        auto y = model->forward({x})[0];
        Variable s = y.sum();

        s.backward();
        REQUIRE(y.ndimension() == 4);
        REQUIRE(s.ndimension() == 0);
        for (auto i = 0; i < 4; i++) {
          REQUIRE(y.size(i) == 2);
        }

        REQUIRE(
            model->parameters()["weight"].grad().numel() == 3 * 2 * 3 * 2);
      }
    }
| SECTION("3d") { |
| auto model = Conv3d(3, 2, 3).stride(2).build(); |
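      // Same arithmetic in three spatial dimensions: depth, height and width
      // each become (5 - 3) / 2 + 1 = 2.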
      auto x = Var(at::CPU(at::kFloat).randn({2, 3, 5, 5, 5}), true);
      auto y = model->forward({x})[0];
      Variable s = y.sum();

      s.backward();
      REQUIRE(y.ndimension() == 5);
      REQUIRE(s.ndimension() == 0);
      for (auto i = 0; i < 5; i++) {
        REQUIRE(y.size(i) == 2);
      }

      REQUIRE(
          model->parameters()["weight"].grad().numel() ==
          3 * 2 * 3 * 3 * 3);
    }
  }
| SECTION("linear") { |
| SECTION("basic1") { |
| auto model = Linear(5, 2).build(); |
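      // Linear stores its weight as (out_features, in_features) = (2, 5), as
      // the "param" section below confirms, so the weight gradient should
      // have 2 * 5 elements after backward().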
      auto x = Var(at::CPU(at::kFloat).randn({10, 5}), true);
      auto y = model->forward({x})[0];
      Variable s = y.sum();

      s.backward();
      REQUIRE(y.ndimension() == 2);
      REQUIRE(s.ndimension() == 0);
      REQUIRE(y.size(0) == 10);
      REQUIRE(y.size(1) == 2);

      REQUIRE(model->parameters()["weight"].grad().numel() == 2 * 5);
    }
  }

| SECTION("simple") { |
| auto model = std::make_shared<SimpleContainer>(); |
| auto l1 = model->add(Linear(10, 3).build(), "l1"); |
| auto l2 = model->add(Linear(3, 5).build(), "l2"); |
| auto l3 = model->add(Linear(5, 100).build(), "l3"); |
| |
| auto x = Var(at::CPU(at::kFloat).randn({1000, 10})); |
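    // Chain the layers by hand, using clamp_min(0) as a ReLU nonlinearity.
    // The final REQUIRE relies on at least one activation being clipped to 0,
    // which is all but certain with 1000 * 100 outputs.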
    x = l1->forward({x})[0].clamp_min(0);
    x = l2->forward({x})[0].clamp_min(0);
    x = l3->forward({x})[0].clamp_min(0);

    x.backward();
    REQUIRE(x.ndimension() == 2);
    REQUIRE(x.size(0) == 1000);
    REQUIRE(x.size(1) == 100);
    REQUIRE(x.data().min().toCFloat() == 0);
  }

| SECTION("embedding") { |
| SECTION("basic") { |
| int dict_size = 10; |
| auto model = Embedding(dict_size, 2).build(); |
| // Cannot get gradients to change indices (input) - only for embedding |
| // params |
| auto x = Var(at::CPU(at::kLong).tensor({10}).fill_(dict_size - 1), false); |
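      // All ten lookups hit the last row of the table (index dict_size - 1).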
      auto y = model->forward({x})[0];
      Variable s = y.sum();

      s.backward();
      REQUIRE(y.ndimension() == 2);
      REQUIRE(s.ndimension() == 0);
      REQUIRE(y.size(0) == 10);
      REQUIRE(y.size(1) == 2);

      REQUIRE(
          model->parameters()["table"].grad().numel() == 2 * dict_size);
    }

| SECTION("list") { |
| auto model = Embedding(6, 4).build(); |
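      // A 2-D index tensor of shape (2, 3) should yield one 4-dimensional
      // embedding per index, i.e. an output of shape (2, 3, 4).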
      auto x = Var(at::CPU(at::kLong).tensor({2, 3}).fill_(5), false);
      auto y = model->forward({x})[0];
      Variable s = y.sum();

      s.backward();
      REQUIRE(y.ndimension() == 3);
      REQUIRE(y.size(0) == 2);
      REQUIRE(y.size(1) == 3);
      REQUIRE(y.size(2) == 4);
    }
  }

| SECTION("dropout") { |
| auto dropout = Dropout(0.5).build(); |
| Variable x = Var(at::CPU(at::kFloat).ones(100)); |
| Variable y = dropout->forward({x})[0]; |
| |
| y.backward(); |
| REQUIRE(y.ndimension() == 1); |
| REQUIRE(y.size(0) == 100); |
| // TODO: These two tests are flaky |
| // https://github.com/pytorch/pytorch/issues/7286 |
| // REQUIRE(y.sum().toCFloat() < 130); // Probably |
| // REQUIRE(y.sum().toCFloat() > 70); // Probably |
| |
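    // In evaluation mode dropout is the identity, so the sum of 100 ones is
    // exactly 100.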
    dropout->eval();
    y = dropout->forward({x})[0];
    REQUIRE(y.data().sum().toCFloat() == 100);
  }

  SECTION("param") {
    auto model = std::make_shared<NestedModel>();
    auto parameters = model->parameters();
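    // parameters() flattens the module hierarchy into a map keyed by dotted
    // paths: direct parameters by name, nested ones as "<submodule>.<name>".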
| REQUIRE(parameters["param"].size(0) == 3); |
| REQUIRE(parameters["param"].size(1) == 2); |
| REQUIRE(parameters["param"].size(2) == 21); |
| REQUIRE(parameters["l1.bias"].size(0) == 20); |
| REQUIRE(parameters["l1.weight"].size(0) == 20); |
| REQUIRE(parameters["l1.weight"].size(1) == 5); |
| REQUIRE(parameters["test.l1.bias"].size(0) == 3); |
| REQUIRE(parameters["test.l1.weight"].size(0) == 3); |
| REQUIRE(parameters["test.l1.weight"].size(1) == 10); |
| REQUIRE(parameters["test.l2.bias"].size(0) == 5); |
| REQUIRE(parameters["test.l2.weight"].size(0) == 5); |
| REQUIRE(parameters["test.l2.weight"].size(1) == 3); |
| REQUIRE(parameters["test.l3.bias"].size(0) == 100); |
| REQUIRE(parameters["test.l3.weight"].size(0) == 100); |
| REQUIRE(parameters["test.l3.weight"].size(1) == 5); |
| } |
| |
| SECTION("functional") { |
| bool was_called = false; |
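    // Functional adapts an arbitrary callable into a module; the lambda below
    // records that it was invoked and passes its input through unchanged.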
    // clang-format off
    auto functional = Functional([&was_called](std::vector<Variable> input) {
      was_called = true;
      return input;
    }).build();
    // clang-format on
    auto output = functional->forward({Var(at::CPU(at::kFloat).ones(5))});
    REQUIRE(was_called);
    REQUIRE(output.size() == 1);
    REQUIRE(output.front().equal(Var(at::CPU(at::kFloat).ones(5))));
  }
}

TEST_CASE("containers_cuda", "[cuda]") {
  SECTION("1") {
    auto model = Linear(5, 2).build();
    model->cuda();
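    // cuda() moves all parameters to the GPU, so forward() expects (and
    // returns) CUDA tensors.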
    auto x = Var(at::CUDA(at::kFloat).randn({10, 5}), true);
    auto y = model->forward({x})[0];
    Variable s = y.sum();

    s.backward();
    REQUIRE(y.ndimension() == 2);
    REQUIRE(s.ndimension() == 0);
    REQUIRE(y.size(0) == 10);
    REQUIRE(y.size(1) == 2);

    REQUIRE(model->parameters()["weight"].grad().numel() == 2 * 5);
  }

  SECTION("2") {
    auto model = Linear(5, 2).build();
    model->cuda();
    model->cpu();
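    // Round-trip: after cuda() followed by cpu(), the parameters live on the
    // CPU again and the module must accept CPU inputs.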
    auto x = Var(at::CPU(at::kFloat).randn({10, 5}), true);
    auto y = model->forward({x})[0];
    Variable s = y.sum();

    s.backward();
    REQUIRE(y.ndimension() == 2);
    REQUIRE(s.ndimension() == 0);
    REQUIRE(y.size(0) == 10);
    REQUIRE(y.size(1) == 2);

    REQUIRE(model->parameters()["weight"].grad().numel() == 2 * 5);
  }
}