blob: dd2ab9a4fb78f21630441840248e49288d7044b5 [file] [log] [blame]
/* Copyright 2015 The TensorFlow Authors. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
==============================================================================*/
#ifndef TENSORFLOW_CORE_PLATFORM_FILE_SYSTEM_H_
#define TENSORFLOW_CORE_PLATFORM_FILE_SYSTEM_H_
#include <stdint.h>
#include <functional>
#include <string>
#include <unordered_map>
#include <utility>
#include <vector>
#include "tensorflow/core/platform/cord.h"
#include "tensorflow/core/platform/errors.h"
#include "tensorflow/core/platform/file_statistics.h"
#include "tensorflow/core/platform/macros.h"
#include "tensorflow/core/platform/platform.h"
#include "tensorflow/core/platform/stringpiece.h"
#include "tensorflow/core/platform/types.h"
#ifdef PLATFORM_WINDOWS
#undef DeleteFile
#undef CopyFile
#undef TranslateName
#endif
namespace tensorflow {
class RandomAccessFile;
class ReadOnlyMemoryRegion;
class WritableFile;
class FileSystem;
struct TransactionToken {
FileSystem* owner;
void* token;
};
/// A generic interface for accessing a file system. Implementations
/// of custom filesystem adapters must implement this interface,
/// RandomAccessFile, WritableFile, and ReadOnlyMemoryRegion classes.
class FileSystem {
public:
/// \brief Creates a brand new random access read-only file with the
/// specified name.
///
/// On success, stores a pointer to the new file in
/// *result and returns OK. On failure stores NULL in *result and
/// returns non-OK. If the file does not exist, returns a non-OK
/// status.
///
/// The returned file may be concurrently accessed by multiple threads.
///
/// The ownership of the returned RandomAccessFile is passed to the caller
/// and the object should be deleted when is not used.
virtual tensorflow::Status NewRandomAccessFile(
const std::string& fname, std::unique_ptr<RandomAccessFile>* result) {
return NewRandomAccessFile(fname, nullptr, result);
}
virtual tensorflow::Status NewRandomAccessFile(
const std::string& fname, TransactionToken* token,
std::unique_ptr<RandomAccessFile>* result) {
// We duplicate these methods due to Google internal coding style prevents
// virtual functions with default arguments. See PR #41615.
return Status::OK();
}
/// \brief Creates an object that writes to a new file with the specified
/// name.
///
/// Deletes any existing file with the same name and creates a
/// new file. On success, stores a pointer to the new file in
/// *result and returns OK. On failure stores NULL in *result and
/// returns non-OK.
///
/// The returned file will only be accessed by one thread at a time.
///
/// The ownership of the returned WritableFile is passed to the caller
/// and the object should be deleted when is not used.
virtual tensorflow::Status NewWritableFile(
const std::string& fname, std::unique_ptr<WritableFile>* result) {
return NewWritableFile(fname, nullptr, result);
}
virtual tensorflow::Status NewWritableFile(
const std::string& fname, TransactionToken* token,
std::unique_ptr<WritableFile>* result) {
return Status::OK();
}
/// \brief Creates an object that either appends to an existing file, or
/// writes to a new file (if the file does not exist to begin with).
///
/// On success, stores a pointer to the new file in *result and
/// returns OK. On failure stores NULL in *result and returns
/// non-OK.
///
/// The returned file will only be accessed by one thread at a time.
///
/// The ownership of the returned WritableFile is passed to the caller
/// and the object should be deleted when is not used.
virtual tensorflow::Status NewAppendableFile(
const std::string& fname, std::unique_ptr<WritableFile>* result) {
return NewAppendableFile(fname, nullptr, result);
}
virtual tensorflow::Status NewAppendableFile(
const std::string& fname, TransactionToken* token,
std::unique_ptr<WritableFile>* result) {
return Status::OK();
}
/// \brief Creates a readonly region of memory with the file context.
///
/// On success, it returns a pointer to read-only memory region
/// from the content of file fname. The ownership of the region is passed to
/// the caller. On failure stores nullptr in *result and returns non-OK.
///
/// The returned memory region can be accessed from many threads in parallel.
///
/// The ownership of the returned ReadOnlyMemoryRegion is passed to the caller
/// and the object should be deleted when is not used.
virtual tensorflow::Status NewReadOnlyMemoryRegionFromFile(
const std::string& fname, std::unique_ptr<ReadOnlyMemoryRegion>* result) {
return NewReadOnlyMemoryRegionFromFile(fname, nullptr, result);
}
virtual tensorflow::Status NewReadOnlyMemoryRegionFromFile(
const std::string& fname, TransactionToken* token,
std::unique_ptr<ReadOnlyMemoryRegion>* result) {
return Status::OK();
}
/// Returns OK if the named path exists and NOT_FOUND otherwise.
virtual tensorflow::Status FileExists(const std::string& fname) {
return FileExists(fname, nullptr);
}
virtual tensorflow::Status FileExists(const std::string& fname,
TransactionToken* token) {
return Status::OK();
}
/// Returns true if all the listed files exist, false otherwise.
/// if status is not null, populate the vector with a detailed status
/// for each file.
virtual bool FilesExist(const std::vector<string>& files,
std::vector<Status>* status) {
return FilesExist(files, nullptr, status);
}
virtual bool FilesExist(const std::vector<string>& files,
TransactionToken* token, std::vector<Status>* status);
/// \brief Returns the immediate children in the given directory.
///
/// The returned paths are relative to 'dir'.
virtual tensorflow::Status GetChildren(const std::string& dir,
std::vector<string>* result) {
return GetChildren(dir, nullptr, result);
}
virtual tensorflow::Status GetChildren(const std::string& dir,
TransactionToken* token,
std::vector<string>* result) {
return Status::OK();
}
/// \brief Given a pattern, stores in *results the set of paths that matches
/// that pattern. *results is cleared.
///
/// pattern must match all of a name, not just a substring.
///
/// pattern: { term }
/// term:
/// '*': matches any sequence of non-'/' characters
/// '?': matches a single non-'/' character
/// '[' [ '^' ] { match-list } ']':
/// matches any single character (not) on the list
/// c: matches character c (c != '*', '?', '\\', '[')
/// '\\' c: matches character c
/// character-range:
/// c: matches character c (c != '\\', '-', ']')
/// '\\' c: matches character c
/// lo '-' hi: matches character c for lo <= c <= hi
///
/// Typical return codes:
/// * OK - no errors
/// * UNIMPLEMENTED - Some underlying functions (like GetChildren) are not
/// implemented
virtual tensorflow::Status GetMatchingPaths(const std::string& pattern,
std::vector<string>* results) {
return GetMatchingPaths(pattern, nullptr, results);
}
virtual tensorflow::Status GetMatchingPaths(const std::string& pattern,
TransactionToken* token,
std::vector<string>* results) {
return Status::OK();
}
/// \brief Checks if the given filename matches the pattern.
///
/// This function provides the equivalent of posix fnmatch, however it is
/// implemented without fnmatch to ensure that this can be used for cloud
/// filesystems on windows. For windows filesystems, it uses PathMatchSpec.
virtual bool Match(const std::string& filename, const std::string& pattern);
/// \brief Obtains statistics for the given path.
virtual tensorflow::Status Stat(const std::string& fname,
FileStatistics* stat) {
return Stat(fname, nullptr, stat);
}
virtual tensorflow::Status Stat(const std::string& fname,
TransactionToken* token,
FileStatistics* stat) {
return Status::OK();
}
/// \brief Deletes the named file.
virtual tensorflow::Status DeleteFile(const std::string& fname) {
return DeleteFile(fname, nullptr);
}
virtual tensorflow::Status DeleteFile(const std::string& fname,
TransactionToken* token) {
return Status::OK();
}
/// \brief Creates the specified directory.
/// Typical return codes:
/// * OK - successfully created the directory.
/// * ALREADY_EXISTS - directory with name dirname already exists.
/// * PERMISSION_DENIED - dirname is not writable.
virtual tensorflow::Status CreateDir(const std::string& dirname) {
return CreateDir(dirname, nullptr);
}
virtual tensorflow::Status CreateDir(const std::string& dirname,
TransactionToken* token) {
return Status::OK();
}
/// \brief Creates the specified directory and all the necessary
/// subdirectories.
/// Typical return codes:
/// * OK - successfully created the directory and sub directories, even if
/// they were already created.
/// * PERMISSION_DENIED - dirname or some subdirectory is not writable.
virtual tensorflow::Status RecursivelyCreateDir(const std::string& dirname) {
return RecursivelyCreateDir(dirname, nullptr);
}
virtual tensorflow::Status RecursivelyCreateDir(const std::string& dirname,
TransactionToken* token);
/// \brief Deletes the specified directory.
virtual tensorflow::Status DeleteDir(const std::string& dirname) {
return DeleteDir(dirname, nullptr);
}
virtual tensorflow::Status DeleteDir(const std::string& dirname,
TransactionToken* token) {
return Status::OK();
}
/// \brief Deletes the specified directory and all subdirectories and files
/// underneath it. This is accomplished by traversing the directory tree
/// rooted at dirname and deleting entries as they are encountered.
///
/// If dirname itself is not readable or does not exist, *undeleted_dir_count
/// is set to 1, *undeleted_file_count is set to 0 and an appropriate status
/// (e.g. NOT_FOUND) is returned.
///
/// If dirname and all its descendants were successfully deleted, TF_OK is
/// returned and both error counters are set to zero.
///
/// Otherwise, while traversing the tree, undeleted_file_count and
/// undeleted_dir_count are updated if an entry of the corresponding type
/// could not be deleted. The returned error status represents the reason that
/// any one of these entries could not be deleted.
///
/// REQUIRES: undeleted_files, undeleted_dirs to be not null.
///
/// Typical return codes:
/// * OK - dirname exists and we were able to delete everything underneath.
/// * NOT_FOUND - dirname doesn't exist
/// * PERMISSION_DENIED - dirname or some descendant is not writable
/// * UNIMPLEMENTED - Some underlying functions (like Delete) are not
/// implemented
virtual tensorflow::Status DeleteRecursively(const std::string& dirname,
int64_t* undeleted_files,
int64_t* undeleted_dirs) {
return DeleteRecursively(dirname, nullptr, undeleted_files, undeleted_dirs);
}
virtual tensorflow::Status DeleteRecursively(const std::string& dirname,
TransactionToken* token,
int64_t* undeleted_files,
int64_t* undeleted_dirs);
/// \brief Stores the size of `fname` in `*file_size`.
virtual tensorflow::Status GetFileSize(const std::string& fname,
uint64* file_size) {
return GetFileSize(fname, nullptr, file_size);
}
virtual tensorflow::Status GetFileSize(const std::string& fname,
TransactionToken* token,
uint64* file_size) {
return Status::OK();
}
/// \brief Overwrites the target if it exists.
virtual tensorflow::Status RenameFile(const std::string& src,
const std::string& target) {
return RenameFile(src, target, nullptr);
}
virtual tensorflow::Status RenameFile(const std::string& src,
const std::string& target,
TransactionToken* token) {
return Status::OK();
}
/// \brief Copy the src to target.
virtual tensorflow::Status CopyFile(const std::string& src,
const std::string& target) {
return CopyFile(src, target, nullptr);
}
virtual tensorflow::Status CopyFile(const std::string& src,
const std::string& target,
TransactionToken* token);
/// \brief Translate an URI to a filename for the FileSystem implementation.
///
/// The implementation in this class cleans up the path, removing
/// duplicate /'s, resolving .. and removing trailing '/'.
/// This respects relative vs. absolute paths, but does not
/// invoke any system calls (getcwd(2)) in order to resolve relative
/// paths with respect to the actual working directory. That is, this is
/// purely string manipulation, completely independent of process state.
virtual std::string TranslateName(const std::string& name) const;
/// \brief Returns whether the given path is a directory or not.
///
/// Typical return codes (not guaranteed exhaustive):
/// * OK - The path exists and is a directory.
/// * FAILED_PRECONDITION - The path exists and is not a directory.
/// * NOT_FOUND - The path entry does not exist.
/// * PERMISSION_DENIED - Insufficient permissions.
/// * UNIMPLEMENTED - The file factory doesn't support directories.
virtual tensorflow::Status IsDirectory(const std::string& fname) {
return IsDirectory(fname, nullptr);
}
virtual tensorflow::Status IsDirectory(const std::string& fname,
TransactionToken* token);
/// \brief Returns whether the given path is on a file system
/// that has atomic move capabilities. This can be used
/// to determine if there needs to be a temp location to safely write objects.
/// The second boolean argument has_atomic_move contains this information.
///
/// Returns one of the following status codes (not guaranteed exhaustive):
/// * OK - The path is on a recognized file system,
/// so has_atomic_move holds the above information.
/// * UNIMPLEMENTED - The file system of the path hasn't been implemented in
/// TF
virtual Status HasAtomicMove(const std::string& path, bool* has_atomic_move);
/// \brief Flushes any cached filesystem objects from memory.
virtual void FlushCaches() { FlushCaches(nullptr); }
virtual void FlushCaches(TransactionToken* token);
/// \brief The separator this filesystem uses.
///
/// This is implemented as a part of the filesystem, because even on windows,
/// a user may need access to filesystems with '/' separators, such as cloud
/// filesystems.
virtual char Separator() const;
/// \brief Split a path to its basename and dirname.
///
/// Helper function for Basename and Dirname.
std::pair<StringPiece, StringPiece> SplitPath(StringPiece uri) const;
/// \brief returns the final file name in the given path.
///
/// Returns the part of the path after the final "/". If there is no
/// "/" in the path, the result is the same as the input.
virtual StringPiece Basename(StringPiece path) const;
/// \brief Returns the part of the path before the final "/".
///
/// If there is a single leading "/" in the path, the result will be the
/// leading "/". If there is no "/" in the path, the result is the empty
/// prefix of the input.
StringPiece Dirname(StringPiece path) const;
/// \brief Returns the part of the basename of path after the final ".".
///
/// If there is no "." in the basename, the result is empty.
StringPiece Extension(StringPiece path) const;
/// \brief Clean duplicate and trailing, "/"s, and resolve ".." and ".".
///
/// NOTE: This respects relative vs. absolute paths, but does not
/// invoke any system calls (getcwd(2)) in order to resolve relative
/// paths with respect to the actual working directory. That is, this is
/// purely string manipulation, completely independent of process state.
std::string CleanPath(StringPiece path) const;
/// \brief Creates a URI from a scheme, host, and path.
///
/// If the scheme is empty, we just return the path.
std::string CreateURI(StringPiece scheme, StringPiece host,
StringPiece path) const;
/// \brief Creates a temporary file name with an extension.
std::string GetTempFilename(const std::string& extension) const;
/// \brief Return true if path is absolute.
bool IsAbsolutePath(tensorflow::StringPiece path) const;
#ifndef SWIG // variadic templates
/// \brief Join multiple paths together.
///
/// This function also removes the unnecessary path separators.
/// For example:
///
/// Arguments | JoinPath
/// ---------------------------+----------
/// '/foo', 'bar' | /foo/bar
/// '/foo/', 'bar' | /foo/bar
/// '/foo', '/bar' | /foo/bar
///
/// Usage:
/// string path = io::JoinPath("/mydir", filename);
/// string path = io::JoinPath(FLAGS_test_srcdir, filename);
/// string path = io::JoinPath("/full", "path", "to", "filename");
template <typename... T>
std::string JoinPath(const T&... args) {
return JoinPathImpl({args...});
}
#endif /* SWIG */
std::string JoinPathImpl(
std::initializer_list<tensorflow::StringPiece> paths);
/// \brief Populates the scheme, host, and path from a URI.
///
/// scheme, host, and path are guaranteed by this function to point into the
/// contents of uri, even if empty.
///
/// Corner cases:
/// - If the URI is invalid, scheme and host are set to empty strings and the
/// passed string is assumed to be a path
/// - If the URI omits the path (e.g. file://host), then the path is left
/// empty.
void ParseURI(StringPiece remaining, StringPiece* scheme, StringPiece* host,
StringPiece* path) const;
// Transaction related API
/// \brief Starts a new transaction
virtual tensorflow::Status StartTransaction(TransactionToken** token) {
*token = nullptr;
return Status::OK();
}
/// \brief Adds `path` to transaction in `token`
virtual tensorflow::Status AddToTransaction(const std::string& path,
TransactionToken* token) {
return Status::OK();
}
/// \brief Ends transaction
virtual tensorflow::Status EndTransaction(TransactionToken* token) {
return Status::OK();
}
/// \brief Get token for `path` or start a new transaction and add `path` to
/// it.
virtual tensorflow::Status GetTokenOrStartTransaction(
const std::string& path, TransactionToken** token) {
*token = nullptr;
return Status::OK();
}
/// \brief Return transaction for `path` or nullptr in `token`
virtual tensorflow::Status GetTransactionForPath(const std::string& path,
TransactionToken** token) {
*token = nullptr;
return Status::OK();
}
/// \brief Decode transaction to human readable string.
virtual std::string DecodeTransaction(const TransactionToken* token);
/// \brief Set File System Configuration Option
virtual tensorflow::Status SetOption(const std::string& name,
const std::vector<string>& values) {
return errors::Unimplemented("SetOption");
}
/// \brief Set File System Configuration Option
virtual tensorflow::Status SetOption(const std::string& name,
const std::vector<int64_t>& values) {
return errors::Unimplemented("SetOption");
}
/// \brief Set File System Configuration Option
virtual tensorflow::Status SetOption(const std::string& name,
const std::vector<double>& values) {
return errors::Unimplemented("SetOption");
}
FileSystem() {}
virtual ~FileSystem() = default;
};
/// This macro adds forwarding methods from FileSystem class to
/// used class since name hiding will prevent these to be accessed from
/// derived classes and would require all use locations to migrate to
/// Transactional API. This is an interim solution until ModularFileSystem class
/// becomes a singleton.
// TODO(sami): Remove this macro when filesystem plugins migration is complete.
#define TF_USE_FILESYSTEM_METHODS_WITH_NO_TRANSACTION_SUPPORT \
using FileSystem::NewRandomAccessFile; \
using FileSystem::NewWritableFile; \
using FileSystem::NewAppendableFile; \
using FileSystem::NewReadOnlyMemoryRegionFromFile; \
using FileSystem::FileExists; \
using FileSystem::GetChildren; \
using FileSystem::GetMatchingPaths; \
using FileSystem::Stat; \
using FileSystem::DeleteFile; \
using FileSystem::RecursivelyCreateDir; \
using FileSystem::DeleteDir; \
using FileSystem::DeleteRecursively; \
using FileSystem::GetFileSize; \
using FileSystem::RenameFile; \
using FileSystem::CopyFile; \
using FileSystem::IsDirectory; \
using FileSystem::FlushCaches
/// A Wrapper class for Transactional FileSystem support.
/// This provides means to make use of the transactions with minimal code change
/// Any operations that are done through this interface will be through the
/// transaction created at the time of construction of this instance.
/// See FileSystem documentation for method descriptions.
/// This class simply forwards all calls to wrapped filesystem either with given
/// transaction token or with token used in its construction. This allows doing
/// transactional filesystem access with minimal code change.
class WrappedFileSystem : public FileSystem {
public:
TF_USE_FILESYSTEM_METHODS_WITH_NO_TRANSACTION_SUPPORT;
tensorflow::Status NewRandomAccessFile(
const std::string& fname, TransactionToken* token,
std::unique_ptr<RandomAccessFile>* result) override {
return fs_->NewRandomAccessFile(fname, (token ? token : token_), result);
}
tensorflow::Status NewWritableFile(
const std::string& fname, TransactionToken* token,
std::unique_ptr<WritableFile>* result) override {
return fs_->NewWritableFile(fname, (token ? token : token_), result);
}
tensorflow::Status NewAppendableFile(
const std::string& fname, TransactionToken* token,
std::unique_ptr<WritableFile>* result) override {
return fs_->NewAppendableFile(fname, (token ? token : token_), result);
}
tensorflow::Status NewReadOnlyMemoryRegionFromFile(
const std::string& fname, TransactionToken* token,
std::unique_ptr<ReadOnlyMemoryRegion>* result) override {
return fs_->NewReadOnlyMemoryRegionFromFile(fname, (token ? token : token_),
result);
}
tensorflow::Status FileExists(const std::string& fname,
TransactionToken* token) override {
return fs_->FileExists(fname, (token ? token : token_));
}
bool FilesExist(const std::vector<string>& files, TransactionToken* token,
std::vector<Status>* status) override {
return fs_->FilesExist(files, (token ? token : token_), status);
}
tensorflow::Status GetChildren(const std::string& dir,
TransactionToken* token,
std::vector<string>* result) override {
return fs_->GetChildren(dir, (token ? token : token_), result);
}
tensorflow::Status GetMatchingPaths(const std::string& pattern,
TransactionToken* token,
std::vector<string>* results) override {
return fs_->GetMatchingPaths(pattern, (token ? token : token_), results);
}
bool Match(const std::string& filename, const std::string& pattern) override {
return fs_->Match(filename, pattern);
}
tensorflow::Status Stat(const std::string& fname, TransactionToken* token,
FileStatistics* stat) override {
return fs_->Stat(fname, (token ? token : token_), stat);
}
tensorflow::Status DeleteFile(const std::string& fname,
TransactionToken* token) override {
return fs_->DeleteFile(fname, (token ? token : token_));
}
tensorflow::Status CreateDir(const std::string& dirname,
TransactionToken* token) override {
return fs_->CreateDir(dirname, (token ? token : token_));
}
tensorflow::Status RecursivelyCreateDir(const std::string& dirname,
TransactionToken* token) override {
return fs_->RecursivelyCreateDir(dirname, (token ? token : token_));
}
tensorflow::Status DeleteDir(const std::string& dirname,
TransactionToken* token) override {
return fs_->DeleteDir(dirname, (token ? token : token_));
}
tensorflow::Status DeleteRecursively(const std::string& dirname,
TransactionToken* token,
int64_t* undeleted_files,
int64_t* undeleted_dirs) override {
return fs_->DeleteRecursively(dirname, (token ? token : token_),
undeleted_files, undeleted_dirs);
}
tensorflow::Status GetFileSize(const std::string& fname,
TransactionToken* token,
uint64* file_size) override {
return fs_->GetFileSize(fname, (token ? token : token_), file_size);
}
tensorflow::Status RenameFile(const std::string& src,
const std::string& target,
TransactionToken* token) override {
return fs_->RenameFile(src, target, (token ? token : token_));
}
tensorflow::Status CopyFile(const std::string& src, const std::string& target,
TransactionToken* token) override {
return fs_->CopyFile(src, target, (token ? token : token_));
}
std::string TranslateName(const std::string& name) const override {
return fs_->TranslateName(name);
}
tensorflow::Status IsDirectory(const std::string& fname,
TransactionToken* token) override {
return fs_->IsDirectory(fname, (token ? token : token_));
}
Status HasAtomicMove(const std::string& path,
bool* has_atomic_move) override {
return fs_->HasAtomicMove(path, has_atomic_move);
}
void FlushCaches(TransactionToken* token) override {
return fs_->FlushCaches((token ? token : token_));
}
char Separator() const override { return fs_->Separator(); }
StringPiece Basename(StringPiece path) const override {
return fs_->Basename(path);
}
tensorflow::Status StartTransaction(TransactionToken** token) override {
return fs_->StartTransaction(token);
}
tensorflow::Status AddToTransaction(const std::string& path,
TransactionToken* token) override {
return fs_->AddToTransaction(path, (token ? token : token_));
}
tensorflow::Status EndTransaction(TransactionToken* token) override {
return fs_->EndTransaction(token);
}
tensorflow::Status GetTransactionForPath(const std::string& path,
TransactionToken** token) override {
return fs_->GetTransactionForPath(path, token);
}
tensorflow::Status GetTokenOrStartTransaction(
const std::string& path, TransactionToken** token) override {
return fs_->GetTokenOrStartTransaction(path, token);
}
std::string DecodeTransaction(const TransactionToken* token) override {
return fs_->DecodeTransaction((token ? token : token_));
}
WrappedFileSystem(FileSystem* file_system, TransactionToken* token)
: fs_(file_system), token_(token) {}
~WrappedFileSystem() override = default;
private:
FileSystem* fs_;
TransactionToken* token_;
};
/// A file abstraction for randomly reading the contents of a file.
class RandomAccessFile {
public:
RandomAccessFile() {}
virtual ~RandomAccessFile() = default;
/// \brief Returns the name of the file.
///
/// This is an optional operation that may not be implemented by every
/// filesystem.
virtual tensorflow::Status Name(StringPiece* result) const {
return errors::Unimplemented("This filesystem does not support Name()");
}
/// \brief Reads up to `n` bytes from the file starting at `offset`.
///
/// `scratch[0..n-1]` may be written by this routine. Sets `*result`
/// to the data that was read (including if fewer than `n` bytes were
/// successfully read). May set `*result` to point at data in
/// `scratch[0..n-1]`, so `scratch[0..n-1]` must be live when
/// `*result` is used.
///
/// On OK returned status: `n` bytes have been stored in `*result`.
/// On non-OK returned status: `[0..n]` bytes have been stored in `*result`.
///
/// Returns `OUT_OF_RANGE` if fewer than n bytes were stored in `*result`
/// because of EOF.
///
/// Safe for concurrent use by multiple threads.
virtual tensorflow::Status Read(uint64 offset, size_t n, StringPiece* result,
char* scratch) const = 0;
#if defined(TF_CORD_SUPPORT)
/// \brief Read up to `n` bytes from the file starting at `offset`.
virtual tensorflow::Status Read(uint64 offset, size_t n,
absl::Cord* cord) const {
return errors::Unimplemented(
"Read(uint64, size_t, absl::Cord*) is not "
"implemented");
}
#endif
private:
TF_DISALLOW_COPY_AND_ASSIGN(RandomAccessFile);
};
/// \brief A file abstraction for sequential writing.
///
/// The implementation must provide buffering since callers may append
/// small fragments at a time to the file.
class WritableFile {
public:
WritableFile() {}
virtual ~WritableFile() = default;
/// \brief Append 'data' to the file.
virtual tensorflow::Status Append(StringPiece data) = 0;
#if defined(TF_CORD_SUPPORT)
// \brief Append 'data' to the file.
virtual tensorflow::Status Append(const absl::Cord& cord) {
for (StringPiece chunk : cord.Chunks()) {
TF_RETURN_IF_ERROR(Append(chunk));
}
return tensorflow::Status::OK();
}
#endif
/// \brief Close the file.
///
/// Flush() and de-allocate resources associated with this file
///
/// Typical return codes (not guaranteed to be exhaustive):
/// * OK
/// * Other codes, as returned from Flush()
virtual tensorflow::Status Close() = 0;
/// \brief Flushes the file and optionally syncs contents to filesystem.
///
/// This should flush any local buffers whose contents have not been
/// delivered to the filesystem.
///
/// If the process terminates after a successful flush, the contents
/// may still be persisted, since the underlying filesystem may
/// eventually flush the contents. If the OS or machine crashes
/// after a successful flush, the contents may or may not be
/// persisted, depending on the implementation.
virtual tensorflow::Status Flush() = 0;
// \brief Returns the name of the file.
///
/// This is an optional operation that may not be implemented by every
/// filesystem.
virtual tensorflow::Status Name(StringPiece* result) const {
return errors::Unimplemented("This filesystem does not support Name()");
}
/// \brief Syncs contents of file to filesystem.
///
/// This waits for confirmation from the filesystem that the contents
/// of the file have been persisted to the filesystem; if the OS
/// or machine crashes after a successful Sync, the contents should
/// be properly saved.
virtual tensorflow::Status Sync() = 0;
/// \brief Retrieves the current write position in the file, or -1 on
/// error.
///
/// This is an optional operation, subclasses may choose to return
/// errors::Unimplemented.
virtual tensorflow::Status Tell(int64_t* position) {
*position = -1;
return errors::Unimplemented("This filesystem does not support Tell()");
}
private:
TF_DISALLOW_COPY_AND_ASSIGN(WritableFile);
};
/// \brief A readonly memmapped file abstraction.
///
/// The implementation must guarantee that all memory is accessible when the
/// object exists, independently from the Env that created it.
class ReadOnlyMemoryRegion {
public:
ReadOnlyMemoryRegion() {}
virtual ~ReadOnlyMemoryRegion() = default;
/// \brief Returns a pointer to the memory region.
virtual const void* data() = 0;
/// \brief Returns the length of the memory region in bytes.
virtual uint64 length() = 0;
};
/// \brief A registry for file system implementations.
///
/// Filenames are specified as an URI, which is of the form
/// [scheme://]<filename>.
/// File system implementations are registered using the REGISTER_FILE_SYSTEM
/// macro, providing the 'scheme' as the key.
///
/// There are two `Register` methods: one using `Factory` for legacy filesystems
/// (deprecated mechanism of subclassing `FileSystem` and using
/// `REGISTER_FILE_SYSTEM` macro), and one using `std::unique_ptr<FileSystem>`
/// for the new modular approach.
///
/// Note that the new API expects a pointer to `ModularFileSystem` but this is
/// not checked as there should be exactly one caller to the API and doing the
/// check results in a circular dependency between `BUILD` targets.
///
/// Plan is to completely remove the filesystem registration from `Env` and
/// incorporate it into `ModularFileSystem` class (which will be renamed to be
/// the only `FileSystem` class and marked as `final`). But this will happen at
/// a later time, after we convert all filesystems to the new API.
///
/// TODO(mihaimaruseac): After all filesystems are converted, remove old
/// registration and update comment.
class FileSystemRegistry {
public:
typedef std::function<FileSystem*()> Factory;
virtual ~FileSystemRegistry() = default;
virtual tensorflow::Status Register(const std::string& scheme,
Factory factory) = 0;
virtual tensorflow::Status Register(
const std::string& scheme, std::unique_ptr<FileSystem> filesystem) = 0;
virtual FileSystem* Lookup(const std::string& scheme) = 0;
virtual tensorflow::Status GetRegisteredFileSystemSchemes(
std::vector<std::string>* schemes) = 0;
};
} // namespace tensorflow
#endif // TENSORFLOW_CORE_PLATFORM_FILE_SYSTEM_H_