/*
|
* Copyright (C) 2018 The Android Open Source Project
|
*
|
* Licensed under the Apache License, Version 2.0 (the "License");
|
* you may not use this file except in compliance with the License.
|
* You may obtain a copy of the License at
|
*
|
* http://www.apache.org/licenses/LICENSE-2.0
|
*
|
* Unless required by applicable law or agreed to in writing, software
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
* See the License for the specific language governing permissions and
|
* limitations under the License.
|
*/
|
|
// Utility functions for working with FlatBuffers.
|
|
#ifndef LIBTEXTCLASSIFIER_UTILS_FLATBUFFERS_H_
|
#define LIBTEXTCLASSIFIER_UTILS_FLATBUFFERS_H_
|
|
#include <map>
|
#include <memory>
|
#include <string>
|
|
#include "annotator/model_generated.h"
|
#include "utils/strings/stringpiece.h"
|
#include "utils/variant.h"
|
#include "flatbuffers/flatbuffers.h"
|
#include "flatbuffers/reflection.h"
|
|
namespace libtextclassifier3 {
|
|
// Loads and interprets the buffer as 'FlatbufferMessage' and verifies its
|
// integrity.
|
template <typename FlatbufferMessage>
|
const FlatbufferMessage* LoadAndVerifyFlatbuffer(const void* buffer, int size) {
|
const FlatbufferMessage* message =
|
flatbuffers::GetRoot<FlatbufferMessage>(buffer);
|
if (message == nullptr) {
|
return nullptr;
|
}
|
flatbuffers::Verifier verifier(reinterpret_cast<const uint8_t*>(buffer),
|
size);
|
if (message->Verify(verifier)) {
|
return message;
|
} else {
|
return nullptr;
|
}
|
}
|
|
// Same as above but takes string.
|
template <typename FlatbufferMessage>
|
const FlatbufferMessage* LoadAndVerifyFlatbuffer(const std::string& buffer) {
|
return LoadAndVerifyFlatbuffer<FlatbufferMessage>(buffer.c_str(),
|
buffer.size());
|
}
|
|
// Loads and interprets the buffer as 'FlatbufferMessage', verifies its
|
// integrity and returns its mutable version.
|
template <typename FlatbufferMessage>
|
std::unique_ptr<typename FlatbufferMessage::NativeTableType>
|
LoadAndVerifyMutableFlatbuffer(const void* buffer, int size) {
|
const FlatbufferMessage* message =
|
LoadAndVerifyFlatbuffer<FlatbufferMessage>(buffer, size);
|
if (message == nullptr) {
|
return nullptr;
|
}
|
return std::unique_ptr<typename FlatbufferMessage::NativeTableType>(
|
message->UnPack());
|
}
|
|
// Same as above but takes string.
|
template <typename FlatbufferMessage>
|
std::unique_ptr<typename FlatbufferMessage::NativeTableType>
|
LoadAndVerifyMutableFlatbuffer(const std::string& buffer) {
|
return LoadAndVerifyMutableFlatbuffer<FlatbufferMessage>(buffer.c_str(),
|
buffer.size());
|
}
|
|
template <typename FlatbufferMessage>
|
const char* FlatbufferFileIdentifier() {
|
return nullptr;
|
}
|
|
template <>
|
const char* FlatbufferFileIdentifier<Model>();
|
|
// Packs the mutable flatbuffer message to string.
|
template <typename FlatbufferMessage>
|
std::string PackFlatbuffer(
|
const typename FlatbufferMessage::NativeTableType* mutable_message) {
|
flatbuffers::FlatBufferBuilder builder;
|
builder.Finish(FlatbufferMessage::Pack(builder, mutable_message),
|
FlatbufferFileIdentifier<FlatbufferMessage>());
|
return std::string(reinterpret_cast<const char*>(builder.GetBufferPointer()),
|
builder.GetSize());
|
}
|
|
// A flatbuffer that can be built using flatbuffer reflection data of the
|
// schema.
|
// Normally, field information is hard-coded in code generated from a flatbuffer
|
// schema. Here we lookup the necessary information for building a flatbuffer
|
// from the provided reflection meta data.
|
// When serializing a flatbuffer, the library requires that the sub messages
|
// are already serialized, therefore we explicitly keep the field values and
|
// serialize the message in (reverse) topological dependency order.
|
class ReflectiveFlatbuffer {
|
public:
|
ReflectiveFlatbuffer(const reflection::Schema* schema,
|
const reflection::Object* type)
|
: schema_(schema), type_(type) {}
|
|
// Encapsulates a repeated field.
|
// Serves as a common base class for repeated fields.
|
class RepeatedField {
|
public:
|
virtual ~RepeatedField() {}
|
|
virtual flatbuffers::uoffset_t Serialize(
|
flatbuffers::FlatBufferBuilder* builder) const = 0;
|
};
|
|
// Represents a repeated field of particular type.
|
template <typename T>
|
class TypedRepeatedField : public RepeatedField {
|
public:
|
void Add(const T value) { items_.push_back(value); }
|
|
flatbuffers::uoffset_t Serialize(
|
flatbuffers::FlatBufferBuilder* builder) const override {
|
return builder->CreateVector(items_).o;
|
}
|
|
private:
|
std::vector<T> items_;
|
};
|
|
// Specialization for strings.
|
template <>
|
class TypedRepeatedField<std::string> : public RepeatedField {
|
public:
|
void Add(const std::string& value) { items_.push_back(value); }
|
|
flatbuffers::uoffset_t Serialize(
|
flatbuffers::FlatBufferBuilder* builder) const override {
|
std::vector<flatbuffers::Offset<flatbuffers::String>> offsets(
|
items_.size());
|
for (int i = 0; i < items_.size(); i++) {
|
offsets[i] = builder->CreateString(items_[i]);
|
}
|
return builder->CreateVector(offsets).o;
|
}
|
|
private:
|
std::vector<std::string> items_;
|
};
|
|
// Specialization for repeated sub-messages.
|
template <>
|
class TypedRepeatedField<ReflectiveFlatbuffer> : public RepeatedField {
|
public:
|
TypedRepeatedField<ReflectiveFlatbuffer>(
|
const reflection::Schema* const schema,
|
const reflection::Type* const type)
|
: schema_(schema), type_(type) {}
|
|
ReflectiveFlatbuffer* Add() {
|
items_.emplace_back(new ReflectiveFlatbuffer(
|
schema_, schema_->objects()->Get(type_->index())));
|
return items_.back().get();
|
}
|
|
flatbuffers::uoffset_t Serialize(
|
flatbuffers::FlatBufferBuilder* builder) const override {
|
std::vector<flatbuffers::Offset<void>> offsets(items_.size());
|
for (int i = 0; i < items_.size(); i++) {
|
offsets[i] = items_[i]->Serialize(builder);
|
}
|
return builder->CreateVector(offsets).o;
|
}
|
|
private:
|
const reflection::Schema* const schema_;
|
const reflection::Type* const type_;
|
std::vector<std::unique_ptr<ReflectiveFlatbuffer>> items_;
|
};
|
|
// Gets the field information for a field name, returns nullptr if the
|
// field was not defined.
|
const reflection::Field* GetFieldOrNull(const StringPiece field_name) const;
|
const reflection::Field* GetFieldOrNull(const FlatbufferField* field) const;
|
const reflection::Field* GetFieldByOffsetOrNull(const int field_offset) const;
|
|
// Gets a nested field and the message it is defined on.
|
bool GetFieldWithParent(const FlatbufferFieldPath* field_path,
|
ReflectiveFlatbuffer** parent,
|
reflection::Field const** field);
|
|
// Checks whether a variant value type agrees with a field type.
|
bool IsMatchingType(const reflection::Field* field,
|
const Variant& value) const;
|
|
// Sets a (primitive) field to a specific value.
|
// Returns true if successful, and false if the field was not found or the
|
// expected type doesn't match.
|
template <typename T>
|
bool Set(StringPiece field_name, T value) {
|
if (const reflection::Field* field = GetFieldOrNull(field_name)) {
|
return Set<T>(field, value);
|
}
|
return false;
|
}
|
|
// Sets a (primitive) field to a specific value.
|
// Returns true if successful, and false if the expected type doesn't match.
|
// Expects `field` to be non-null.
|
template <typename T>
|
bool Set(const reflection::Field* field, T value) {
|
if (field == nullptr) {
|
TC3_LOG(ERROR) << "Expected non-null field.";
|
return false;
|
}
|
Variant variant_value(value);
|
if (!IsMatchingType(field, variant_value)) {
|
TC3_LOG(ERROR) << "Type mismatch for field `" << field->name()->str()
|
<< "`, expected: " << field->type()->base_type()
|
<< ", got: " << variant_value.GetType();
|
return false;
|
}
|
fields_[field] = variant_value;
|
return true;
|
}
|
|
template <typename T>
|
bool Set(const FlatbufferFieldPath* path, T value) {
|
ReflectiveFlatbuffer* parent;
|
const reflection::Field* field;
|
if (!GetFieldWithParent(path, &parent, &field)) {
|
return false;
|
}
|
return parent->Set<T>(field, value);
|
}
|
|
// Sets a (primitive) field to a specific value.
|
// Parses the string value according to the field type.
|
bool ParseAndSet(const reflection::Field* field, const std::string& value);
|
bool ParseAndSet(const FlatbufferFieldPath* path, const std::string& value);
|
|
// Gets the reflective flatbuffer for a table field.
|
// Returns nullptr if the field was not found, or the field type was not a
|
// table.
|
ReflectiveFlatbuffer* Mutable(StringPiece field_name);
|
ReflectiveFlatbuffer* Mutable(const reflection::Field* field);
|
|
// Gets the reflective flatbuffer for a repeated field.
|
// Returns nullptr if the field was not found, or the field type was not a
|
// vector.
|
RepeatedField* Repeated(StringPiece field_name);
|
RepeatedField* Repeated(const reflection::Field* field);
|
|
template <typename T>
|
TypedRepeatedField<T>* Repeated(const reflection::Field* field) {
|
return static_cast<TypedRepeatedField<T>*>(Repeated(field));
|
}
|
|
template <typename T>
|
TypedRepeatedField<T>* Repeated(StringPiece field_name) {
|
return static_cast<TypedRepeatedField<T>*>(Repeated(field_name));
|
}
|
|
// Serializes the flatbuffer.
|
flatbuffers::uoffset_t Serialize(
|
flatbuffers::FlatBufferBuilder* builder) const;
|
std::string Serialize() const;
|
|
// Merges the fields from the given flatbuffer table into this flatbuffer.
|
// Scalar fields will be overwritten, if present in `from`.
|
// Embedded messages will be merged.
|
bool MergeFrom(const flatbuffers::Table* from);
|
bool MergeFromSerializedFlatbuffer(StringPiece from);
|
|
// Flattens the flatbuffer as a flat map.
|
// (Nested) fields names are joined by `key_separator`.
|
std::map<std::string, Variant> AsFlatMap(
|
const std::string& key_separator = ".") const {
|
std::map<std::string, Variant> result;
|
AsFlatMap(key_separator, /*key_prefix=*/"", &result);
|
return result;
|
}
|
|
private:
|
const reflection::Schema* const schema_;
|
const reflection::Object* const type_;
|
|
// Cached primitive fields (scalars and strings).
|
std::map<const reflection::Field*, Variant> fields_;
|
|
// Cached sub-messages.
|
std::map<const reflection::Field*, std::unique_ptr<ReflectiveFlatbuffer>>
|
children_;
|
|
// Cached repeated fields.
|
std::map<const reflection::Field*, std::unique_ptr<RepeatedField>>
|
repeated_fields_;
|
|
// Flattens the flatbuffer as a flat map.
|
// (Nested) fields names are joined by `key_separator` and prefixed by
|
// `key_prefix`.
|
void AsFlatMap(const std::string& key_separator,
|
const std::string& key_prefix,
|
std::map<std::string, Variant>* result) const;
|
};
|
|
// A helper class to build flatbuffers based on schema reflection data.
|
// Can be used to a `ReflectiveFlatbuffer` for the root message of the
|
// schema, or any defined table via name.
|
class ReflectiveFlatbufferBuilder {
|
public:
|
explicit ReflectiveFlatbufferBuilder(const reflection::Schema* schema)
|
: schema_(schema) {}
|
|
// Starts a new root table message.
|
std::unique_ptr<ReflectiveFlatbuffer> NewRoot() const;
|
|
// Starts a new table message. Returns nullptr if no table with given name is
|
// found in the schema.
|
std::unique_ptr<ReflectiveFlatbuffer> NewTable(
|
const StringPiece table_name) const;
|
|
private:
|
const reflection::Schema* const schema_;
|
};
|
|
} // namespace libtextclassifier3
|
|
#endif // LIBTEXTCLASSIFIER_UTILS_FLATBUFFERS_H_
|