/*
|
* Copyright (C) 2018 The Android Open Source Project
|
*
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
* you may not use this file except in compliance with the License.
|
* You may obtain a copy of the License at
|
*
|
* http://www.apache.org/licenses/LICENSE-2.0
|
*
|
* Unless required by applicable law or agreed to in writing, software
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
* See the License for the specific language governing permissions and
|
* limitations under the License.
|
*/
|
|
#include "utils/resources.h"
|
#include "utils/base/logging.h"
|
#include "utils/zlib/buffer_generated.h"
|
#include "utils/zlib/zlib.h"
|
|
namespace libtextclassifier3 {
|
namespace {
|
bool isWildcardMatch(const flatbuffers::String* left,
|
const std::string& right) {
|
return (left == nullptr || right.empty());
|
}
|
|
bool isExactMatch(const flatbuffers::String* left, const std::string& right) {
|
if (left == nullptr) {
|
return right.empty();
|
}
|
return left->str() == right;
|
}
|
|
} // namespace
|
|
int Resources::LocaleMatch(const Locale& locale,
|
const LanguageTag* entry_locale) const {
|
int match = LOCALE_NO_MATCH;
|
if (isExactMatch(entry_locale->language(), locale.Language())) {
|
match |= LOCALE_LANGUAGE_MATCH;
|
} else if (isWildcardMatch(entry_locale->language(), locale.Language())) {
|
match |= LOCALE_LANGUAGE_WILDCARD_MATCH;
|
}
|
|
if (isExactMatch(entry_locale->script(), locale.Script())) {
|
match |= LOCALE_SCRIPT_MATCH;
|
} else if (isWildcardMatch(entry_locale->script(), locale.Script())) {
|
match |= LOCALE_SCRIPT_WILDCARD_MATCH;
|
}
|
|
if (isExactMatch(entry_locale->region(), locale.Region())) {
|
match |= LOCALE_REGION_MATCH;
|
} else if (isWildcardMatch(entry_locale->region(), locale.Region())) {
|
match |= LOCALE_REGION_WILDCARD_MATCH;
|
}
|
|
return match;
|
}
|
|
const ResourceEntry* Resources::FindResource(
|
const StringPiece resource_name) const {
|
if (resources_ == nullptr || resources_->resource_entry() == nullptr) {
|
TC3_LOG(ERROR) << "No resources defined.";
|
return nullptr;
|
}
|
const ResourceEntry* entry =
|
resources_->resource_entry()->LookupByKey(resource_name.data());
|
if (entry == nullptr) {
|
TC3_LOG(ERROR) << "Resource " << resource_name.ToString() << " not found";
|
return nullptr;
|
}
|
return entry;
|
}
|
|
int Resources::BestResourceForLocales(
|
const ResourceEntry* resource, const std::vector<Locale>& locales) const {
|
// Find best match based on locale.
|
int resource_id = -1;
|
int locale_match = LOCALE_NO_MATCH;
|
const auto* resources = resource->resource();
|
for (int user_locale = 0; user_locale < locales.size(); user_locale++) {
|
if (!locales[user_locale].IsValid()) {
|
continue;
|
}
|
for (int i = 0; i < resources->size(); i++) {
|
for (const int locale_id : *resources->Get(i)->locale()) {
|
const int candidate_match = LocaleMatch(
|
locales[user_locale], resources_->locale()->Get(locale_id));
|
|
// Only consider if at least the language matches.
|
if ((candidate_match & LOCALE_LANGUAGE_MATCH) == 0 &&
|
(candidate_match & LOCALE_LANGUAGE_WILDCARD_MATCH) == 0) {
|
continue;
|
}
|
|
if (candidate_match > locale_match) {
|
locale_match = candidate_match;
|
resource_id = i;
|
}
|
}
|
}
|
|
// If the language matches exactly, we are already finished.
|
// We found an exact language match.
|
if (locale_match & LOCALE_LANGUAGE_MATCH) {
|
return resource_id;
|
}
|
}
|
return resource_id;
|
}
|
|
bool Resources::GetResourceContent(const std::vector<Locale>& locales,
|
const StringPiece resource_name,
|
std::string* result) const {
|
const ResourceEntry* entry = FindResource(resource_name);
|
if (entry == nullptr || entry->resource() == nullptr) {
|
return false;
|
}
|
|
int resource_id = BestResourceForLocales(entry, locales);
|
if (resource_id < 0) {
|
return false;
|
}
|
const auto* resource = entry->resource()->Get(resource_id);
|
if (resource->content() != nullptr) {
|
*result = resource->content()->str();
|
return true;
|
} else if (resource->compressed_content() != nullptr) {
|
std::unique_ptr<ZlibDecompressor> decompressor = ZlibDecompressor::Instance(
|
resources_->compression_dictionary()->data(),
|
resources_->compression_dictionary()->size());
|
if (decompressor != nullptr &&
|
decompressor->MaybeDecompress(resource->compressed_content(), result)) {
|
return true;
|
}
|
}
|
return false;
|
}
|
|
bool CompressResources(ResourcePoolT* resources,
|
const bool build_compression_dictionary,
|
const int dictionary_sample_every) {
|
std::vector<unsigned char> dictionary;
|
if (build_compression_dictionary) {
|
{
|
// Build up a compression dictionary.
|
std::unique_ptr<ZlibCompressor> compressor = ZlibCompressor::Instance();
|
int i = 0;
|
for (auto& entry : resources->resource_entry) {
|
for (auto& resource : entry->resource) {
|
if (resource->content.empty()) {
|
continue;
|
}
|
i++;
|
|
// Use a sample of the entries to build up a custom compression
|
// dictionary. Using all entries will generally not give a benefit
|
// for small data sizes, so we subsample here.
|
if (i % dictionary_sample_every != 0) {
|
continue;
|
}
|
CompressedBufferT compressed_content;
|
compressor->Compress(resource->content, &compressed_content);
|
}
|
}
|
compressor->GetDictionary(&dictionary);
|
resources->compression_dictionary.assign(
|
dictionary.data(), dictionary.data() + dictionary.size());
|
}
|
}
|
|
for (auto& entry : resources->resource_entry) {
|
for (auto& resource : entry->resource) {
|
if (resource->content.empty()) {
|
continue;
|
}
|
// Try compressing the data.
|
std::unique_ptr<ZlibCompressor> compressor =
|
build_compression_dictionary
|
? ZlibCompressor::Instance(dictionary.data(), dictionary.size())
|
: ZlibCompressor::Instance();
|
if (!compressor) {
|
TC3_LOG(ERROR) << "Cannot create zlib compressor.";
|
return false;
|
}
|
|
CompressedBufferT compressed_content;
|
compressor->Compress(resource->content, &compressed_content);
|
|
// Only keep compressed version if smaller.
|
if (compressed_content.uncompressed_size >
|
compressed_content.buffer.size()) {
|
resource->content.clear();
|
resource->compressed_content.reset(new CompressedBufferT);
|
*resource->compressed_content = compressed_content;
|
}
|
}
|
}
|
return true;
|
}
|
|
std::string CompressSerializedResources(const std::string& resources,
|
const int dictionary_sample_every) {
|
std::unique_ptr<ResourcePoolT> unpacked_resources(
|
flatbuffers::GetRoot<ResourcePool>(resources.data())->UnPack());
|
TC3_CHECK(unpacked_resources != nullptr);
|
TC3_CHECK(
|
CompressResources(unpacked_resources.get(), dictionary_sample_every));
|
flatbuffers::FlatBufferBuilder builder;
|
builder.Finish(ResourcePool::Pack(builder, unpacked_resources.get()));
|
return std::string(reinterpret_cast<const char*>(builder.GetBufferPointer()),
|
builder.GetSize());
|
}
|
|
} // namespace libtextclassifier3
|