blob: ddfa499221b8bb1e67a671a052b73e499bd6865e [file] [log] [blame]
/*
* Copyright (C) 2018 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#include "utils/resources.h"
#include "utils/base/logging.h"
#include "utils/zlib/buffer_generated.h"
#include "utils/zlib/zlib.h"
namespace libtextclassifier3 {
namespace {
bool isWildcardMatch(const flatbuffers::String* left,
const std::string& right) {
return (left == nullptr || right.empty());
}
bool isExactMatch(const flatbuffers::String* left, const std::string& right) {
if (left == nullptr) {
return right.empty();
}
return left->str() == right;
}
} // namespace
int Resources::LocaleMatch(const Locale& locale,
const LanguageTag* entry_locale) const {
int match = LOCALE_NO_MATCH;
if (isExactMatch(entry_locale->language(), locale.Language())) {
match |= LOCALE_LANGUAGE_MATCH;
} else if (isWildcardMatch(entry_locale->language(), locale.Language())) {
match |= LOCALE_LANGUAGE_WILDCARD_MATCH;
}
if (isExactMatch(entry_locale->script(), locale.Script())) {
match |= LOCALE_SCRIPT_MATCH;
} else if (isWildcardMatch(entry_locale->script(), locale.Script())) {
match |= LOCALE_SCRIPT_WILDCARD_MATCH;
}
if (isExactMatch(entry_locale->region(), locale.Region())) {
match |= LOCALE_REGION_MATCH;
} else if (isWildcardMatch(entry_locale->region(), locale.Region())) {
match |= LOCALE_REGION_WILDCARD_MATCH;
}
return match;
}
const ResourceEntry* Resources::FindResource(
const StringPiece resource_name) const {
if (resources_ == nullptr || resources_->resource_entry() == nullptr) {
TC3_LOG(ERROR) << "No resources defined.";
return nullptr;
}
const ResourceEntry* entry =
resources_->resource_entry()->LookupByKey(resource_name.data());
if (entry == nullptr) {
TC3_LOG(ERROR) << "Resource " << resource_name.ToString() << " not found";
return nullptr;
}
return entry;
}
int Resources::BestResourceForLocales(
const ResourceEntry* resource, const std::vector<Locale>& locales) const {
// Find best match based on locale.
int resource_id = -1;
int locale_match = LOCALE_NO_MATCH;
const auto* resources = resource->resource();
for (int user_locale = 0; user_locale < locales.size(); user_locale++) {
if (!locales[user_locale].IsValid()) {
continue;
}
for (int i = 0; i < resources->size(); i++) {
for (const int locale_id : *resources->Get(i)->locale()) {
const int candidate_match = LocaleMatch(
locales[user_locale], resources_->locale()->Get(locale_id));
// Only consider if at least the language matches.
if ((candidate_match & LOCALE_LANGUAGE_MATCH) == 0 &&
(candidate_match & LOCALE_LANGUAGE_WILDCARD_MATCH) == 0) {
continue;
}
if (candidate_match > locale_match) {
locale_match = candidate_match;
resource_id = i;
}
}
}
// If the language matches exactly, we are already finished.
// We found an exact language match.
if (locale_match & LOCALE_LANGUAGE_MATCH) {
return resource_id;
}
}
return resource_id;
}
bool Resources::GetResourceContent(const std::vector<Locale>& locales,
const StringPiece resource_name,
std::string* result) const {
const ResourceEntry* entry = FindResource(resource_name);
if (entry == nullptr || entry->resource() == nullptr) {
return false;
}
int resource_id = BestResourceForLocales(entry, locales);
if (resource_id < 0) {
return false;
}
const auto* resource = entry->resource()->Get(resource_id);
if (resource->content() != nullptr) {
*result = resource->content()->str();
return true;
} else if (resource->compressed_content() != nullptr) {
std::unique_ptr<ZlibDecompressor> decompressor = ZlibDecompressor::Instance(
resources_->compression_dictionary()->data(),
resources_->compression_dictionary()->size());
if (decompressor != nullptr &&
decompressor->MaybeDecompress(resource->compressed_content(), result)) {
return true;
}
}
return false;
}
bool CompressResources(ResourcePoolT* resources,
const bool build_compression_dictionary,
const int dictionary_sample_every) {
std::vector<unsigned char> dictionary;
if (build_compression_dictionary) {
{
// Build up a compression dictionary.
std::unique_ptr<ZlibCompressor> compressor = ZlibCompressor::Instance();
int i = 0;
for (auto& entry : resources->resource_entry) {
for (auto& resource : entry->resource) {
if (resource->content.empty()) {
continue;
}
i++;
// Use a sample of the entries to build up a custom compression
// dictionary. Using all entries will generally not give a benefit
// for small data sizes, so we subsample here.
if (i % dictionary_sample_every != 0) {
continue;
}
CompressedBufferT compressed_content;
compressor->Compress(resource->content, &compressed_content);
}
}
compressor->GetDictionary(&dictionary);
resources->compression_dictionary.assign(
dictionary.data(), dictionary.data() + dictionary.size());
}
}
for (auto& entry : resources->resource_entry) {
for (auto& resource : entry->resource) {
if (resource->content.empty()) {
continue;
}
// Try compressing the data.
std::unique_ptr<ZlibCompressor> compressor =
build_compression_dictionary
? ZlibCompressor::Instance(dictionary.data(), dictionary.size())
: ZlibCompressor::Instance();
if (!compressor) {
TC3_LOG(ERROR) << "Cannot create zlib compressor.";
return false;
}
CompressedBufferT compressed_content;
compressor->Compress(resource->content, &compressed_content);
// Only keep compressed version if smaller.
if (compressed_content.uncompressed_size >
compressed_content.buffer.size()) {
resource->content.clear();
resource->compressed_content.reset(new CompressedBufferT);
*resource->compressed_content = compressed_content;
}
}
}
return true;
}
std::string CompressSerializedResources(const std::string& resources,
const int dictionary_sample_every) {
std::unique_ptr<ResourcePoolT> unpacked_resources(
flatbuffers::GetRoot<ResourcePool>(resources.data())->UnPack());
TC3_CHECK(unpacked_resources != nullptr);
TC3_CHECK(
CompressResources(unpacked_resources.get(), dictionary_sample_every));
flatbuffers::FlatBufferBuilder builder;
builder.Finish(ResourcePool::Pack(builder, unpacked_resources.get()));
return std::string(reinterpret_cast<const char*>(builder.GetBufferPointer()),
builder.GetSize());
}
} // namespace libtextclassifier3