#ifndef CAFFE2_OPERATORS_LOAD_SAVE_OP_H_
#define CAFFE2_OPERATORS_LOAD_SAVE_OP_H_
#include <cstdio>
#include <map>
#include <unordered_set>
#include "caffe2/core/context.h"
#include "caffe2/core/db.h"
#include "caffe2/core/logging.h"
#include "caffe2/core/operator.h"
#include "caffe2/utils/math.h"
#include "caffe2/utils/proto_utils.h"
namespace caffe2 {
using db::Cursor;
using db::DB;
using db::Transaction;
template <class Context>
class LoadOp final : public Operator<Context> {
public:
USE_OPERATOR_CONTEXT_FUNCTIONS;
LoadOp(const OperatorDef& operator_def, Workspace* ws)
: Operator<Context>(operator_def, ws),
ws_(ws),
absolute_path_(
OperatorBase::GetSingleArgument<int>("absolute_path", false)),
db_name_(OperatorBase::GetSingleArgument<string>("db", "")),
db_type_(OperatorBase::GetSingleArgument<string>("db_type", "")),
keep_device_(OperatorBase::GetSingleArgument<int>("keep_device", 0)),
load_all_(OperatorBase::GetSingleArgument<int>("load_all", 0)) {
if (InputSize() == 0) {
CAFFE_ENFORCE_GT(db_name_.size(), 0, "Must specify a db name.");
CAFFE_ENFORCE_GT(db_type_.size(), 0, "Must specify a db type.");
}
if (!load_all_) {
int idx = 0;
for (const string& output_name : this->def().output()) {
output_indices_[output_name] = idx++;
}
}
}
void SetCurrentDevice(BlobProto* proto);
bool RunOnDevice() override {
if (InputSize() == 1) {
const db::DBReader& reader = OperatorBase::Input<db::DBReader>(0);
extract(reader.cursor());
} else {
string full_db_name =
absolute_path_ ? db_name_ : (ws_->RootFolder() + "/" + db_name_);
std::unique_ptr<DB> in_db(
caffe2::db::CreateDB(db_type_, full_db_name, caffe2::db::READ));
    CAFFE_ENFORCE(in_db.get(), "Cannot open db: ", full_db_name);
std::unique_ptr<Cursor> cursor(in_db->NewCursor());
extract(cursor.get());
}
return true;
}
private:
void extract(Cursor* cursor) {
if (load_all_) {
extractAll(cursor);
} else {
extractFrom(cursor, OperatorBase::Outputs());
}
}
void extractAll(Cursor* cursor) {
CAFFE_ENFORCE(cursor, "cursor is not valid");
std::unordered_set<string> seen_blobs;
for (; cursor->Valid(); cursor->Next()) {
const string& key = cursor->key();
BlobProto proto;
CAFFE_ENFORCE(
proto.ParseFromString(cursor->value()), "Couldn't parse Proto");
if (!keep_device_) {
// If we are not keeping the device as the one specified in the
// proto, we will set the current device.
SetCurrentDevice(&proto);
}
if (seen_blobs.count(key) == 0 && ws_->GetBlob(key)) {
        // The blob already exists in the workspace and this is the first
        // chunk we see for it in this load: reset it so deserialization
        // starts from a clean slate (see the device placement note in
        // extractFrom below).
ws_->GetBlob(key)->Reset();
}
Blob* blob = ws_->CreateBlob(key);
CAFFE_ENFORCE(blob->Deserialize(proto), "Couldn't deserialize blob");
if (!blob->IsType<Tensor<Context>>()) {
// Only tensors can be seen multiple times as chunks.
CAFFE_ENFORCE(seen_blobs.count(key) == 0, "Blob duplicated");
}
seen_blobs.insert(key);
}
}
void extractFrom(Cursor* cursor, const vector<Blob*>& outputs) {
CAFFE_ENFORCE(cursor);
    // While reading data chunks we track how many elements of each tensor
    // have been read so far, so that at the end we can verify that all chunks
    // were loaded. blobSizes maps an output index to the current size of the
    // blob.
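    // For example, a tensor of 100 elements saved as two 50-element chunks
    // produces two db entries; their segment sizes must sum to 100 before the
    // blob counts as fully loaded.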
std::map<int, size_t> blobSizes;
std::unordered_set<string> loaded;
for (; cursor->Valid(); cursor->Next()) {
const string& key = cursor->key();
if (!output_indices_.count(key)) {
VLOG(1) << "Key " << key << " not used. Skipping.";
} else {
CAFFE_ENFORCE(
loaded.count(key) == 0,
"Multiple copies of blob ",
key,
" found in the db.");
VLOG(2) << "Deserializing blob " << key;
BlobProto proto;
CAFFE_ENFORCE(proto.ParseFromString(cursor->value()));
if (!keep_device_) {
// If we are not keeping the device as the one specified in the
// proto, we will set the current device.
SetCurrentDevice(&proto);
}
auto blobIndex = output_indices_[key];
Blob* blob = outputs.at(blobIndex);
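        // std::map::insert returns an {iterator, bool} pair; the bool is true
        // only if no entry existed for this index, i.e. this is the first
        // chunk we see for this output.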
auto blobSize = blobSizes.insert({blobIndex, 0});
if (blobSize.second) {
          // We reset the blob so that any existing content is destroyed. This
          // is to guarantee correct device placement: if we are deserializing
          // into a TensorCUDA, without an explicit Reset we might be loading
          // data into an existing TensorCUDA that has pre-allocated memory on
          // a different GPU.
blob->Reset();
}
CAFFE_ENFORCE(blob->Deserialize(proto));
if (!blob->IsType<Tensor<Context>>()) {
// Deal with non-tensors: we don't support chunking so we're done.
loaded.insert(key);
} else {
          // Deal with tensors: we are done once the total tensor size has
          // been read.
CAFFE_ENFORCE(proto.has_tensor());
auto tensorSize = blob->Get<Tensor<Context>>().size();
if (proto.tensor().has_segment()) {
blobSize.first->second += proto.tensor().segment().end() -
proto.tensor().segment().begin();
} else {
CAFFE_ENFORCE(blobSize.first->second == 0);
blobSize.first->second = tensorSize;
}
if (blobSize.first->second >= tensorSize) {
loaded.insert(key);
}
}
if (loaded.size() >= OutputSize()) {
break;
}
}
}
for (const auto& blobSize : blobSizes) {
Blob* blob = outputs.at(blobSize.first);
if (blob->IsType<Tensor<Context>>()) {
size_t tensorSize = blob->Get<Tensor<Context>>().size();
CAFFE_ENFORCE(
tensorSize == blobSize.second,
"Expected: ",
tensorSize,
" Read: ",
blobSize.second);
}
}
if (loaded.size() != OutputSize()) {
for (const string& output_name : this->def().output()) {
        if (loaded.count(output_name) == 0) {
LOG(ERROR) << "Failed to load blob: " << output_name;
}
}
CAFFE_THROW(
"Expected to load ", OutputSize(), " blobs, ", "got ", loaded.size());
}
}
private:
Workspace* ws_;
bool absolute_path_;
string db_name_;
string db_type_;
bool keep_device_;
bool load_all_;
std::map<string, int> output_indices_;
};
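// A minimal sketch of a Load op definition in OperatorDef text format; the
// blob names "W" and "b", the db path, and the "minidb" backend are
// illustrative, not prescribed by this header:
//
//   op {
//     type: "Load"
//     output: "W"
//     output: "b"
//     arg { name: "db" s: "/tmp/my_model.minidb" }
//     arg { name: "db_type" s: "minidb" }
//   }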
template <class Context>
class SaveOp final : public Operator<Context> {
public:
USE_OPERATOR_CONTEXT_FUNCTIONS;
SaveOp(const OperatorDef& operator_def, Workspace* ws)
: Operator<Context>(operator_def, ws),
ws_(ws),
absolute_path_(
OperatorBase::GetSingleArgument<int>("absolute_path", false)),
db_name_(OperatorBase::GetSingleArgument<string>("db", "")),
db_type_(OperatorBase::GetSingleArgument<string>("db_type", "")) {
CAFFE_ENFORCE_GT(db_name_.size(), 0, "Must specify a db name.");
CAFFE_ENFORCE_GT(db_type_.size(), 0, "Must specify a db type.");
}
bool RunOnDevice() override {
string full_db_name =
absolute_path_ ? db_name_ : (ws_->RootFolder() + "/" + db_name_);
std::unique_ptr<DB> out_db(
caffe2::db::CreateDB(db_type_, full_db_name, caffe2::db::NEW));
CAFFE_ENFORCE(out_db.get(), "Cannot open db for writing: ", full_db_name);
const vector<const Blob*>& inputs = OperatorBase::Inputs();
BlobSerializerBase::SerializationAcceptor acceptor = [&](
const std::string& blobName, const std::string& data) {
      // The transaction should take care of locking.
std::unique_ptr<Transaction> transaction(out_db->NewTransaction());
transaction->Put(blobName, data);
transaction->Commit();
};
std::set<std::string> input_names;
for (int i = 0; i < inputs.size(); ++i) {
CAFFE_ENFORCE(
input_names.insert(def().input(i)).second,
"Duplicated feature: ",
def().input(i));
}
for (int i = 0; i < inputs.size(); ++i) {
inputs[i]->Serialize(def().input(i), acceptor);
}
return true;
}
private:
Workspace* ws_;
bool absolute_path_;
string db_name_;
string db_type_;
};
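// A matching sketch of a Save op definition, again with illustrative names;
// the inputs must be unique, and each blob is written to the db under its
// input name:
//
//   op {
//     type: "Save"
//     input: "W"
//     input: "b"
//     arg { name: "db" s: "/tmp/my_model.minidb" }
//     arg { name: "db_type" s: "minidb" }
//   }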
template <typename... Ts>
string FormatString(const string& pattern, Ts... values) {
  // Note(Yangqing): We believe that 1024 is enough, but who are we to assert
  // that? As a result, if things go wrong, we'll just throw in the towel and
  // quit loudly. Yeah, I know that there is snprintf, but it is not present
  // on *some* platforms unfortunately.
char buffer[1024];
int written = sprintf(buffer, pattern.c_str(), values...);
if (written < 0 || written + 1 > 1024) {
LOG(FATAL) << "FormatString fails: total bytes written " << written;
}
return string(buffer);
  /*
   * The following is the snprintf version that is safe; enable it one day?
   * (A std::vector is used instead of a variable-length array, which is not
   * standard C++; this would also need #include <vector>.)
  int required =
      std::snprintf(nullptr, 0, pattern.c_str(), values...) + 1;
  std::vector<char> bytes(required);
  std::snprintf(bytes.data(), required, pattern.c_str(), values...);
  return string(bytes.data());
  */
}
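// Example: FormatString("snapshot_at_%d.pb", 1000) returns
// "snapshot_at_1000.pb".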
// SnapshotOp is a wrapper over a SaveOp that allows flexible naming over
// iterations.
// The file pattern in the "db" argument should be a format string that can be
// passed into sprintf with an int argument specifying the current iteration.
// An example: "/path/to/my/snapshot/snapshot_at_%d.pb"
template <class Context>
class SnapshotOp final : public Operator<Context> {
public:
SnapshotOp(const OperatorDef& operator_def, Workspace* ws)
: Operator<Context>(operator_def, ws),
db_pattern_(OperatorBase::GetSingleArgument<string>("db", "")),
every_(OperatorBase::GetSingleArgument<int>("every", 1)),
ws_(ws),
save_op_def_(operator_def) {
CAFFE_ENFORCE_GT(
db_pattern_.size(), 0, "Must specify a snapshot file pattern.");
CAFFE_ENFORCE_GT(every_, 0, "Snapshot interval should be positive.");
if (every_ == 1) {
// Just issue a warning, but it's totally legal so we don't do anything.
LOG(WARNING) << "It seems that we are snapshotting every iteration. "
<< "Is that intended?";
}
save_op_def_.set_type("Save");
}
bool RunOnDevice() override {
int64_t iter =
OperatorBase::Input<TensorCPU>(0).template data<int64_t>()[0];
if (iter % every_ == 0) {
GetMutableArgument("db", true, &save_op_def_)
->set_s(FormatString(db_pattern_, iter));
SaveOp<Context> sub_op(save_op_def_, ws_);
return sub_op.Run();
} else {
return true;
}
}
private:
string db_pattern_;
int every_;
Workspace* ws_;
OperatorDef save_op_def_;
};
} // namespace caffe2
#endif // CAFFE2_OPERATORS_LOAD_SAVE_OP_H_