STT-tensorflow/tensorflow/lite/delegates/gpu/cl/serialization.cc
Raman Sarokin 465aeca042 Serialization of OpenCL InferenceContext.
PiperOrigin-RevId: 337185119
Change-Id: I3841fd093a692a4acd851792f723381fd29e53bc
2020-10-14 15:31:13 -07:00

1050 lines
40 KiB
C++

/* Copyright 2020 The TensorFlow Authors. All Rights Reserved.
Licensed under the Apache License, Version 2.0 (the "License");
you may not use this file except in compliance with the License.
You may obtain a copy of the License at
http://www.apache.org/licenses/LICENSE-2.0
Unless required by applicable law or agreed to in writing, software
distributed under the License is distributed on an "AS IS" BASIS,
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
See the License for the specific language governing permissions and
limitations under the License.
==============================================================================*/
#include "tensorflow/lite/delegates/gpu/cl/serialization.h"
#include <cstdint>
#include "tensorflow/lite/delegates/gpu/cl/arguments.h"
#include "tensorflow/lite/delegates/gpu/cl/buffer.h"
#include "tensorflow/lite/delegates/gpu/cl/gpu_object.h"
#include "tensorflow/lite/delegates/gpu/cl/inference_context.h"
#include "tensorflow/lite/delegates/gpu/cl/kernels/gpu_operation.h"
#include "tensorflow/lite/delegates/gpu/cl/linear_storage.h"
#include "tensorflow/lite/delegates/gpu/cl/precision.h"
#include "tensorflow/lite/delegates/gpu/cl/serialization_generated.h"
#include "tensorflow/lite/delegates/gpu/cl/tensor_type.h"
#include "tensorflow/lite/delegates/gpu/cl/texture2d.h"
#include "tensorflow/lite/delegates/gpu/common/model.h"
namespace tflite {
namespace gpu {
namespace cl {
namespace {
data::AccessType ToFB(AccessType type) {
switch (type) {
case AccessType::READ:
return data::AccessType::READ;
case AccessType::WRITE:
return data::AccessType::WRITE;
case AccessType::READ_WRITE:
return data::AccessType::READ_WRITE;
default:
return data::AccessType::READ_WRITE;
}
}
data::DataType ToFB(DataType type) {
switch (type) {
case DataType::FLOAT16:
return data::DataType::FLOAT16;
case DataType::FLOAT32:
return data::DataType::FLOAT32;
default:
return data::DataType::UNKNOWN;
}
}
data::MemoryType ToFB(MemoryType type) {
switch (type) {
case MemoryType::CONSTANT:
return data::MemoryType::CONSTANT;
case MemoryType::GLOBAL:
return data::MemoryType::GLOBAL;
case MemoryType::LOCAL:
return data::MemoryType::LOCAL;
}
}
data::LinearStorageType ToFB(LinearStorageType type) {
switch (type) {
case LinearStorageType::BUFFER:
return data::LinearStorageType::BUFFER;
case LinearStorageType::TEXTURE_2D:
return data::LinearStorageType::TEXTURE_2D;
}
}
data::TensorStorageType ToFB(TensorStorageType type) {
switch (type) {
case TensorStorageType::BUFFER:
return data::TensorStorageType::BUFFER;
case TensorStorageType::IMAGE_BUFFER:
return data::TensorStorageType::IMAGE_BUFFER;
case TensorStorageType::TEXTURE_2D:
return data::TensorStorageType::TEXTURE_2D;
case TensorStorageType::TEXTURE_ARRAY:
return data::TensorStorageType::TEXTURE_ARRAY;
case TensorStorageType::TEXTURE_3D:
return data::TensorStorageType::TEXTURE_3D;
case TensorStorageType::SINGLE_TEXTURE_2D:
return data::TensorStorageType::SINGLE_TEXTURE_2D;
case TensorStorageType::UNKNOWN:
return data::TensorStorageType::UNKNOWN;
}
}
data::Layout ToFB(Layout type) {
switch (type) {
case Layout::HWC:
return data::Layout::HWC;
case Layout::BHWC:
return data::Layout::BHWC;
case Layout::HWDC:
return data::Layout::HWDC;
case Layout::BHWDC:
return data::Layout::BHWDC;
default:
return data::Layout::UNKNOWN;
}
}
data::CalculationsPrecision ToFB(CalculationsPrecision type) {
switch (type) {
case CalculationsPrecision::F32:
return data::CalculationsPrecision::F32;
case CalculationsPrecision::F32_F16:
return data::CalculationsPrecision::F32_F16;
case CalculationsPrecision::F16:
return data::CalculationsPrecision::F16;
}
}
data::TensorToGrid ToFB(TensorToGrid type) {
switch (type) {
case TensorToGrid::kCustom:
return data::TensorToGrid::CUSTOM;
case TensorToGrid::kWBToX_HDToY_SToZ:
return data::TensorToGrid::WB_TO_X_HD_TO_Y_S_TO_Z;
case TensorToGrid::kWBToX_HDToY_ZIs1:
return data::TensorToGrid::WB_TO_X_HD_TO_Y_Z_IS_1;
case TensorToGrid::kWBToX_HToY_DToZ:
return data::TensorToGrid::WB_TO_X_H_TO_Y_D_TO_Z;
case TensorToGrid::kBToX_YIs1_ZIs1:
return data::TensorToGrid::B_TO_X_Y_IS_1_Z_IS_1;
}
}
data::CompilerOptions ToFB(CompilerOptions type) {
switch (type) {
case CompilerOptions::ADRENO_FULL_SIMD_LINE:
return data::CompilerOptions::ADRENO_FULL_SIMD_LINE;
case CompilerOptions::ADRENO_MORE_WAVES:
return data::CompilerOptions::ADRENO_MORE_WAVES;
case CompilerOptions::POWERVR_FP16:
return data::CompilerOptions::POWERVR_FP16;
case CompilerOptions::CL_OPT_DISABLE:
return data::CompilerOptions::CL_OPT_DISABLE;
case CompilerOptions::CL_2_0:
return data::CompilerOptions::CL_2_0;
case CompilerOptions::CL_3_0:
return data::CompilerOptions::CL_3_0;
}
}
DataType ToEnum(data::DataType type) {
switch (type) {
case data::DataType::FLOAT16:
return DataType::FLOAT16;
case data::DataType::FLOAT32:
return DataType::FLOAT32;
default:
return DataType::UNKNOWN;
}
}
AccessType ToEnum(data::AccessType type) {
switch (type) {
case data::AccessType::READ:
return AccessType::READ;
case data::AccessType::WRITE:
return AccessType::WRITE;
case data::AccessType::READ_WRITE:
return AccessType::READ_WRITE;
}
}
MemoryType ToEnum(data::MemoryType type) {
switch (type) {
case data::MemoryType::CONSTANT:
return MemoryType::CONSTANT;
case data::MemoryType::GLOBAL:
return MemoryType::GLOBAL;
case data::MemoryType::LOCAL:
return MemoryType::LOCAL;
}
}
LinearStorageType ToEnum(data::LinearStorageType type) {
switch (type) {
case data::LinearStorageType::BUFFER:
return LinearStorageType::BUFFER;
case data::LinearStorageType::TEXTURE_2D:
return LinearStorageType::TEXTURE_2D;
}
}
TensorStorageType ToEnum(data::TensorStorageType type) {
switch (type) {
case data::TensorStorageType::BUFFER:
return TensorStorageType::BUFFER;
case data::TensorStorageType::IMAGE_BUFFER:
return TensorStorageType::IMAGE_BUFFER;
case data::TensorStorageType::TEXTURE_2D:
return TensorStorageType::TEXTURE_2D;
case data::TensorStorageType::TEXTURE_ARRAY:
return TensorStorageType::TEXTURE_ARRAY;
case data::TensorStorageType::TEXTURE_3D:
return TensorStorageType::TEXTURE_3D;
case data::TensorStorageType::SINGLE_TEXTURE_2D:
return TensorStorageType::SINGLE_TEXTURE_2D;
case data::TensorStorageType::UNKNOWN:
return TensorStorageType::UNKNOWN;
}
}
Layout ToEnum(data::Layout type) {
switch (type) {
case data::Layout::HWC:
return Layout::HWC;
case data::Layout::BHWC:
return Layout::BHWC;
case data::Layout::HWDC:
return Layout::HWDC;
case data::Layout::BHWDC:
return Layout::BHWDC;
default:
return Layout::UNKNOWN;
}
}
CalculationsPrecision ToEnum(data::CalculationsPrecision type) {
switch (type) {
case data::CalculationsPrecision::F32:
return CalculationsPrecision::F32;
case data::CalculationsPrecision::F32_F16:
return CalculationsPrecision::F32_F16;
case data::CalculationsPrecision::F16:
return CalculationsPrecision::F16;
}
}
TensorToGrid ToEnum(data::TensorToGrid type) {
switch (type) {
case data::TensorToGrid::CUSTOM:
return TensorToGrid::kCustom;
case data::TensorToGrid::WB_TO_X_HD_TO_Y_S_TO_Z:
return TensorToGrid::kWBToX_HDToY_SToZ;
case data::TensorToGrid::WB_TO_X_HD_TO_Y_Z_IS_1:
return TensorToGrid::kWBToX_HDToY_ZIs1;
case data::TensorToGrid::WB_TO_X_H_TO_Y_D_TO_Z:
return TensorToGrid::kWBToX_HToY_DToZ;
case data::TensorToGrid::B_TO_X_Y_IS_1_Z_IS_1:
return TensorToGrid::kBToX_YIs1_ZIs1;
}
}
CompilerOptions ToEnum(data::CompilerOptions type) {
switch (type) {
case data::CompilerOptions::ADRENO_FULL_SIMD_LINE:
return CompilerOptions::ADRENO_FULL_SIMD_LINE;
case data::CompilerOptions::ADRENO_MORE_WAVES:
return CompilerOptions::ADRENO_MORE_WAVES;
case data::CompilerOptions::POWERVR_FP16:
return CompilerOptions::POWERVR_FP16;
case data::CompilerOptions::CL_OPT_DISABLE:
return CompilerOptions::CL_OPT_DISABLE;
case data::CompilerOptions::CL_2_0:
return CompilerOptions::CL_2_0;
case data::CompilerOptions::CL_3_0:
return CompilerOptions::CL_3_0;
}
}
} // namespace
flatbuffers::Offset<data::Int2> Encode(
const int2& v, flatbuffers::FlatBufferBuilder* builder) {
data::Int2Builder int2_builder(*builder);
int2_builder.add_x(v.x);
int2_builder.add_y(v.y);
return int2_builder.Finish();
}
flatbuffers::Offset<data::Int3> Encode(
const int3& v, flatbuffers::FlatBufferBuilder* builder) {
data::Int3Builder int3_builder(*builder);
int3_builder.add_x(v.x);
int3_builder.add_y(v.y);
int3_builder.add_z(v.z);
return int3_builder.Finish();
}
flatbuffers::Offset<data::GPUObjectDescriptor> Encode(
const GPUObjectDescriptor& desc, flatbuffers::FlatBufferBuilder* builder) {
std::vector<flatbuffers::Offset<data::StateVariable>> state_vars_fb;
for (auto& v0 : desc.state_vars_) {
auto key_fb = builder->CreateString(v0.first);
auto value_fb = builder->CreateString(v0.second);
data::StateVariableBuilder state_builder(*builder);
state_builder.add_key(key_fb);
state_builder.add_value(value_fb);
state_vars_fb.push_back(state_builder.Finish());
}
auto state_vars_fb_vec = builder->CreateVector(state_vars_fb);
data::GPUObjectDescriptorBuilder obj_builder(*builder);
obj_builder.add_state_vars(state_vars_fb_vec);
obj_builder.add_access_type(ToFB(desc.access_type_));
return obj_builder.Finish();
}
void Decode(const data::GPUObjectDescriptor* fb_obj, GPUObjectDescriptor* obj) {
obj->access_type_ = ToEnum(fb_obj->access_type());
for (auto state_fb : *fb_obj->state_vars()) {
std::string key(state_fb->key()->c_str(), state_fb->key()->size());
std::string value(state_fb->value()->c_str(), state_fb->value()->size());
obj->state_vars_[key] = value;
}
}
flatbuffers::Offset<data::BufferDescriptor> Encode(
const BufferDescriptor& desc, flatbuffers::FlatBufferBuilder* builder) {
auto obj_fb =
Encode(*static_cast<const GPUObjectDescriptor*>(&desc), builder);
std::vector<flatbuffers::Offset<flatbuffers::String>> attributes_fb;
for (auto& attr : desc.attributes) {
attributes_fb.push_back(builder->CreateString(attr));
}
auto attributes_fb_vec = builder->CreateVector(attributes_fb);
auto data_fb = builder->CreateVector(desc.data);
data::BufferDescriptorBuilder buf_builder(*builder);
buf_builder.add_base_obj(obj_fb);
buf_builder.add_element_type(ToFB(desc.element_type));
buf_builder.add_element_size(desc.element_size);
buf_builder.add_memory_type(ToFB(desc.memory_type));
buf_builder.add_attributes(attributes_fb_vec);
buf_builder.add_size(desc.size);
buf_builder.add_data(data_fb);
return buf_builder.Finish();
}
void Decode(const data::BufferDescriptor* fb_desc, BufferDescriptor* desc) {
Decode(fb_desc->base_obj(), desc);
desc->element_type = ToEnum(fb_desc->element_type());
desc->element_size = fb_desc->element_size();
desc->memory_type = ToEnum(fb_desc->memory_type());
for (auto attr_fb : *fb_desc->attributes()) {
std::string attr(attr_fb->c_str(), attr_fb->size());
desc->attributes.push_back(attr);
}
desc->size = fb_desc->size();
desc->data =
std::vector<uint8_t>(fb_desc->data()->data(),
fb_desc->data()->data() + fb_desc->data()->size());
}
flatbuffers::Offset<data::Texture2DDescriptor> Encode(
const Texture2DDescriptor& desc, flatbuffers::FlatBufferBuilder* builder) {
auto obj_fb =
Encode(*static_cast<const GPUObjectDescriptor*>(&desc), builder);
auto data_fb = builder->CreateVector(desc.data);
auto size_fb = Encode(desc.size, builder);
data::Texture2DDescriptorBuilder tex_builder(*builder);
tex_builder.add_base_obj(obj_fb);
tex_builder.add_element_type(ToFB(desc.element_type));
tex_builder.add_normalized(desc.normalized);
tex_builder.add_normalized_type(ToFB(desc.normalized_type));
tex_builder.add_size(size_fb);
tex_builder.add_data(data_fb);
return tex_builder.Finish();
}
void Decode(const data::Texture2DDescriptor* fb_desc,
Texture2DDescriptor* desc) {
Decode(fb_desc->base_obj(), desc);
desc->element_type = ToEnum(fb_desc->element_type());
desc->normalized = fb_desc->normalized();
desc->normalized_type = ToEnum(fb_desc->normalized_type());
desc->size.x = fb_desc->size()->x();
desc->size.y = fb_desc->size()->y();
desc->data =
std::vector<uint8_t>(fb_desc->data()->data(),
fb_desc->data()->data() + fb_desc->data()->size());
}
flatbuffers::Offset<data::TensorLinearDescriptor> Encode(
const TensorLinearDescriptor& desc,
flatbuffers::FlatBufferBuilder* builder) {
auto obj_fb =
Encode(*static_cast<const GPUObjectDescriptor*>(&desc), builder);
auto data_fb = builder->CreateVector(desc.data);
data::TensorLinearDescriptorBuilder tensor_builder(*builder);
tensor_builder.add_base_obj(obj_fb);
tensor_builder.add_element_type(ToFB(desc.element_type));
tensor_builder.add_storage_type(ToFB(desc.storage_type));
tensor_builder.add_memory_type(ToFB(desc.memory_type));
tensor_builder.add_size(desc.size);
tensor_builder.add_data(data_fb);
return tensor_builder.Finish();
}
void Decode(const data::TensorLinearDescriptor* fb_desc,
TensorLinearDescriptor* desc) {
Decode(fb_desc->base_obj(), desc);
desc->element_type = ToEnum(fb_desc->element_type());
desc->storage_type = ToEnum(fb_desc->storage_type());
desc->memory_type = ToEnum(fb_desc->memory_type());
desc->size = fb_desc->size();
desc->data =
std::vector<uint8_t>(fb_desc->data()->data(),
fb_desc->data()->data() + fb_desc->data()->size());
}
flatbuffers::Offset<data::TensorDescriptor> Encode(
const TensorDescriptor& desc, flatbuffers::FlatBufferBuilder* builder) {
auto obj_fb =
Encode(*static_cast<const GPUObjectDescriptor*>(&desc), builder);
data::BHWDCBuilder shape_builder(*builder);
shape_builder.add_b(desc.shape.b);
shape_builder.add_h(desc.shape.h);
shape_builder.add_w(desc.shape.w);
shape_builder.add_d(desc.shape.d);
shape_builder.add_c(desc.shape.c);
auto shape_fb = shape_builder.Finish();
auto data_fb = builder->CreateVector(desc.data);
data::TensorDescriptorBuilder tensor_builder(*builder);
tensor_builder.add_base_obj(obj_fb);
tensor_builder.add_data_type(ToFB(desc.data_type));
tensor_builder.add_storage_type(ToFB(desc.storage_type));
tensor_builder.add_layout(ToFB(desc.layout));
tensor_builder.add_shape(shape_fb);
tensor_builder.add_data(data_fb);
return tensor_builder.Finish();
}
void Decode(const data::TensorDescriptor* fb_desc, TensorDescriptor* desc) {
Decode(fb_desc->base_obj(), desc);
desc->data_type = ToEnum(fb_desc->data_type());
desc->storage_type = ToEnum(fb_desc->storage_type());
desc->layout = ToEnum(fb_desc->layout());
desc->shape.b = fb_desc->shape()->b();
desc->shape.h = fb_desc->shape()->h();
desc->shape.w = fb_desc->shape()->w();
desc->shape.d = fb_desc->shape()->d();
desc->shape.c = fb_desc->shape()->c();
desc->data =
std::vector<uint8_t>(fb_desc->data()->data(),
fb_desc->data()->data() + fb_desc->data()->size());
}
flatbuffers::Offset<data::OperationDef> Encode(
const OperationDef& def, flatbuffers::FlatBufferBuilder* builder) {
std::vector<flatbuffers::Offset<data::TensorDescriptor>> src_tensors_fb;
for (auto& desc : def.src_tensors) {
auto desc_fb = Encode(desc, builder);
src_tensors_fb.push_back(desc_fb);
}
std::vector<flatbuffers::Offset<data::TensorDescriptor>> dst_tensors_fb;
for (auto& desc : def.dst_tensors) {
auto desc_fb = Encode(desc, builder);
dst_tensors_fb.push_back(desc_fb);
}
auto src_tensors_fb_vec = builder->CreateVector(src_tensors_fb);
auto dst_tensors_fb_vec = builder->CreateVector(dst_tensors_fb);
data::OperationDefBuilder def_builder(*builder);
def_builder.add_precision(ToFB(def.precision));
def_builder.add_src_tensors(src_tensors_fb_vec);
def_builder.add_dst_tensors(dst_tensors_fb_vec);
return def_builder.Finish();
}
void Decode(const data::OperationDef* fb_def, OperationDef* def) {
for (auto src_fb : *fb_def->src_tensors()) {
TensorDescriptor desc;
Decode(src_fb, &desc);
def->src_tensors.push_back(std::move(desc));
}
for (auto dst_fb : *fb_def->dst_tensors()) {
TensorDescriptor desc;
Decode(dst_fb, &desc);
def->dst_tensors.push_back(std::move(desc));
}
def->precision = ToEnum(fb_def->precision());
}
flatbuffers::Offset<data::TensorDescWithId> Encode(
const TensorDescriptor& desc, const ValueId& id,
flatbuffers::FlatBufferBuilder* builder) {
auto desc_fb = Encode(desc, builder);
data::TensorDescWithIdBuilder desc_builder(*builder);
desc_builder.add_desc(desc_fb);
desc_builder.add_id(id);
return desc_builder.Finish();
}
void Decode(const data::TensorDescWithId* fb_desc, TensorDescriptor* desc,
ValueId* id) {
Decode(fb_desc->desc(), desc);
*id = fb_desc->id();
}
absl::Status Decode(CLContext* context, const data::Arguments* fb_args,
Arguments* args) {
args->shared_int4s_data_ = std::vector<int32_t>(
fb_args->shared_int4s()->data(),
fb_args->shared_int4s()->data() + fb_args->shared_int4s()->size());
args->shared_float4s_data_ = std::vector<float>(
fb_args->shared_float4s()->data(),
fb_args->shared_float4s()->data() + fb_args->shared_float4s()->size());
std::vector<float> tmp = std::vector<float>(
fb_args->shared_half4s()->data(),
fb_args->shared_half4s()->data() + fb_args->shared_half4s()->size());
args->shared_half4s_data_.resize(tmp.size());
for (int i = 0; i < tmp.size(); ++i) {
args->shared_half4s_data_[i] = tmp[i];
}
args->int_values_.clear();
for (auto int_values_fb : *fb_args->int_values()) {
Arguments::IntValue value;
value.value = int_values_fb->value();
value.offset = int_values_fb->offset();
value.active = int_values_fb->active();
std::string name(int_values_fb->name()->c_str(),
int_values_fb->name()->size());
args->int_values_[name] = value;
}
args->float_values_.clear();
for (auto float_values_fb : *fb_args->float_values()) {
Arguments::FloatValue value;
value.value = float_values_fb->value();
value.offset = float_values_fb->offset();
value.active = float_values_fb->active();
std::string name(float_values_fb->name()->c_str(),
float_values_fb->name()->size());
args->float_values_[name] = value;
}
args->half_values_.clear();
for (auto half_values_fb : *fb_args->half_values()) {
Arguments::HalfValue value;
value.value = half_values_fb->value();
value.offset = half_values_fb->offset();
value.active = half_values_fb->active();
value.store_as_f32 = half_values_fb->store_as_f32();
std::string name(half_values_fb->name()->c_str(),
half_values_fb->name()->size());
args->half_values_[name] = value;
}
for (auto buffer_pair_fb : *fb_args->buffer_objects()) {
std::string key(buffer_pair_fb->key()->c_str(),
buffer_pair_fb->key()->size());
BufferDescriptor desc;
Decode(buffer_pair_fb->value(), &desc);
args->AddObject(key, absl::make_unique<BufferDescriptor>(std::move(desc)));
}
for (auto texture_pair_fb : *fb_args->texture2d_objects()) {
std::string key(texture_pair_fb->key()->c_str(),
texture_pair_fb->key()->size());
Texture2DDescriptor desc;
Decode(texture_pair_fb->value(), &desc);
args->AddObject(key,
absl::make_unique<Texture2DDescriptor>(std::move(desc)));
}
for (auto tensor_pair_fb : *fb_args->tensor_linear_objects()) {
std::string key(tensor_pair_fb->key()->c_str(),
tensor_pair_fb->key()->size());
TensorLinearDescriptor desc;
Decode(tensor_pair_fb->value(), &desc);
args->AddObject(key,
absl::make_unique<TensorLinearDescriptor>(std::move(desc)));
}
for (auto tensor_pair_fb : *fb_args->tensor_objects()) {
std::string key(tensor_pair_fb->key()->c_str(),
tensor_pair_fb->key()->size());
TensorDescriptor desc;
Decode(tensor_pair_fb->value(), &desc);
args->AddObject(key, absl::make_unique<TensorDescriptor>(std::move(desc)));
}
for (auto buffer_pair_fb : *fb_args->buffer_refs()) {
std::string key(buffer_pair_fb->key()->c_str(),
buffer_pair_fb->key()->size());
BufferDescriptor desc;
Decode(buffer_pair_fb->value(), &desc);
auto access_type = desc.GetAccess();
args->AddObjectRef(key, access_type,
absl::make_unique<BufferDescriptor>(std::move(desc)));
}
for (auto texture_pair_fb : *fb_args->texture2d_refs()) {
std::string key(texture_pair_fb->key()->c_str(),
texture_pair_fb->key()->size());
Texture2DDescriptor desc;
Decode(texture_pair_fb->value(), &desc);
auto access_type = desc.GetAccess();
args->AddObjectRef(key, access_type,
absl::make_unique<Texture2DDescriptor>(std::move(desc)));
}
for (auto tensor_pair_fb : *fb_args->tensor_linear_refs()) {
std::string key(tensor_pair_fb->key()->c_str(),
tensor_pair_fb->key()->size());
TensorLinearDescriptor desc;
Decode(tensor_pair_fb->value(), &desc);
auto access_type = desc.GetAccess();
args->AddObjectRef(
key, access_type,
absl::make_unique<TensorLinearDescriptor>(std::move(desc)));
}
for (auto tensor_pair_fb : *fb_args->tensor_refs()) {
std::string key(tensor_pair_fb->key()->c_str(),
tensor_pair_fb->key()->size());
TensorDescriptor desc;
Decode(tensor_pair_fb->value(), &desc);
auto access_type = desc.GetAccess();
args->AddObjectRef(key, access_type,
absl::make_unique<TensorDescriptor>(std::move(desc)));
}
RETURN_IF_ERROR(args->AllocateObjects(context));
RETURN_IF_ERROR(args->AddObjectArgs());
return absl::OkStatus();
}
flatbuffers::Offset<data::Arguments> Encode(
const Arguments& args, flatbuffers::FlatBufferBuilder* builder) {
std::vector<flatbuffers::Offset<data::IntValue>> int_values_fb;
for (auto& value : args.int_values_) {
auto name_fb = builder->CreateString(value.first);
data::IntValueBuilder value_builder(*builder);
value_builder.add_name(name_fb);
value_builder.add_value(value.second.value);
value_builder.add_offset(value.second.offset);
value_builder.add_active(value.second.active);
int_values_fb.push_back(value_builder.Finish());
}
std::vector<flatbuffers::Offset<data::FloatValue>> float_values_fb;
for (auto& value : args.float_values_) {
auto name_fb = builder->CreateString(value.first);
data::FloatValueBuilder value_builder(*builder);
value_builder.add_name(name_fb);
value_builder.add_value(value.second.value);
value_builder.add_offset(value.second.offset);
value_builder.add_active(value.second.active);
float_values_fb.push_back(value_builder.Finish());
}
std::vector<flatbuffers::Offset<data::HalfValue>> half_values_fb;
for (auto& value : args.half_values_) {
auto name_fb = builder->CreateString(value.first);
data::HalfValueBuilder value_builder(*builder);
value_builder.add_name(name_fb);
value_builder.add_value(value.second.value);
value_builder.add_offset(value.second.offset);
value_builder.add_active(value.second.active);
value_builder.add_store_as_f32(value.second.store_as_f32);
half_values_fb.push_back(value_builder.Finish());
}
std::vector<flatbuffers::Offset<data::BufferDescriptorMapValue>>
buffer_objs_fb;
for (auto& value : args.objects_) {
const auto* buffer_desc =
dynamic_cast<const BufferDescriptor*>(value.second.descriptor.get());
if (!buffer_desc) continue;
auto desc_fb = Encode(*buffer_desc, builder);
auto key_fb = builder->CreateString(value.first);
data::BufferDescriptorMapValueBuilder buf_map_builder(*builder);
buf_map_builder.add_key(key_fb);
buf_map_builder.add_value(desc_fb);
buffer_objs_fb.push_back(buf_map_builder.Finish());
}
std::vector<flatbuffers::Offset<data::Texture2DDescriptorMapValue>>
texture2d_objs_fb;
for (auto& value : args.objects_) {
const auto* texture_desc =
dynamic_cast<const Texture2DDescriptor*>(value.second.descriptor.get());
if (!texture_desc) continue;
auto desc_fb = Encode(*texture_desc, builder);
auto key_fb = builder->CreateString(value.first);
data::Texture2DDescriptorMapValueBuilder tex_map_builder(*builder);
tex_map_builder.add_key(key_fb);
tex_map_builder.add_value(desc_fb);
texture2d_objs_fb.push_back(tex_map_builder.Finish());
}
std::vector<flatbuffers::Offset<data::TensorLinearDescriptorMapValue>>
tensor_linear_objs_fb;
for (auto& value : args.objects_) {
const auto* tensor_desc = dynamic_cast<const TensorLinearDescriptor*>(
value.second.descriptor.get());
if (!tensor_desc) continue;
auto desc_fb = Encode(*tensor_desc, builder);
auto key_fb = builder->CreateString(value.first);
data::TensorLinearDescriptorMapValueBuilder ten_map_builder(*builder);
ten_map_builder.add_key(key_fb);
ten_map_builder.add_value(desc_fb);
tensor_linear_objs_fb.push_back(ten_map_builder.Finish());
}
std::vector<flatbuffers::Offset<data::TensorDescriptorMapValue>>
tensor_objs_fb;
for (auto& value : args.objects_) {
const auto* tensor_desc =
dynamic_cast<const TensorDescriptor*>(value.second.descriptor.get());
if (!tensor_desc) continue;
auto desc_fb = Encode(*tensor_desc, builder);
auto key_fb = builder->CreateString(value.first);
data::TensorDescriptorMapValueBuilder ten_map_builder(*builder);
ten_map_builder.add_key(key_fb);
ten_map_builder.add_value(desc_fb);
tensor_objs_fb.push_back(ten_map_builder.Finish());
}
std::vector<flatbuffers::Offset<data::BufferDescriptorMapValue>>
buffer_refs_fb;
for (auto& value : args.object_refs_) {
const auto* buffer_desc =
dynamic_cast<const BufferDescriptor*>(value.second.descriptor.get());
if (!buffer_desc) continue;
auto desc_fb = Encode(*buffer_desc, builder);
auto key_fb = builder->CreateString(value.first);
data::BufferDescriptorMapValueBuilder buf_map_builder(*builder);
buf_map_builder.add_key(key_fb);
buf_map_builder.add_value(desc_fb);
buffer_refs_fb.push_back(buf_map_builder.Finish());
}
std::vector<flatbuffers::Offset<data::Texture2DDescriptorMapValue>>
texture2d_refs_fb;
for (auto& value : args.object_refs_) {
const auto* texture_desc =
dynamic_cast<const Texture2DDescriptor*>(value.second.descriptor.get());
if (!texture_desc) continue;
auto desc_fb = Encode(*texture_desc, builder);
auto key_fb = builder->CreateString(value.first);
data::Texture2DDescriptorMapValueBuilder tex_map_builder(*builder);
tex_map_builder.add_key(key_fb);
tex_map_builder.add_value(desc_fb);
texture2d_refs_fb.push_back(tex_map_builder.Finish());
}
std::vector<flatbuffers::Offset<data::TensorLinearDescriptorMapValue>>
tensor_linear_refs_fb;
for (auto& value : args.object_refs_) {
const auto* tensor_desc = dynamic_cast<const TensorLinearDescriptor*>(
value.second.descriptor.get());
if (!tensor_desc) continue;
auto desc_fb = Encode(*tensor_desc, builder);
auto key_fb = builder->CreateString(value.first);
data::TensorLinearDescriptorMapValueBuilder ten_map_builder(*builder);
ten_map_builder.add_key(key_fb);
ten_map_builder.add_value(desc_fb);
tensor_linear_refs_fb.push_back(ten_map_builder.Finish());
}
std::vector<flatbuffers::Offset<data::TensorDescriptorMapValue>>
tensor_refs_fb;
for (auto& value : args.object_refs_) {
const auto* tensor_desc =
dynamic_cast<const TensorDescriptor*>(value.second.descriptor.get());
if (!tensor_desc) continue;
auto desc_fb = Encode(*tensor_desc, builder);
auto key_fb = builder->CreateString(value.first);
data::TensorDescriptorMapValueBuilder ten_map_builder(*builder);
ten_map_builder.add_key(key_fb);
ten_map_builder.add_value(desc_fb);
tensor_refs_fb.push_back(ten_map_builder.Finish());
}
auto shared_int4s_data_fb = builder->CreateVector(args.shared_int4s_data_);
auto shared_float4s_data_fb =
builder->CreateVector(args.shared_float4s_data_);
std::vector<float> tmp(args.shared_half4s_data_.size());
for (int i = 0; i < tmp.size(); ++i) {
tmp[i] = args.shared_half4s_data_[i];
}
auto shared_half4s_data_fb = builder->CreateVector(tmp);
auto int_values_fb_vec = builder->CreateVector(int_values_fb);
auto float_values_fb_vec = builder->CreateVector(float_values_fb);
auto half_values_fb_vec = builder->CreateVector(half_values_fb);
auto buffer_objs_fb_vec = builder->CreateVector(buffer_objs_fb);
auto texture2d_objs_fb_vec = builder->CreateVector(texture2d_objs_fb);
auto tensor_linear_objs_fb_vec = builder->CreateVector(tensor_linear_objs_fb);
auto tensor_objs_fb_vec = builder->CreateVector(tensor_objs_fb);
auto buffer_refs_fb_vec = builder->CreateVector(buffer_refs_fb);
auto texture2d_refs_fb_vec = builder->CreateVector(texture2d_refs_fb);
auto tensor_linear_refs_fb_vec = builder->CreateVector(tensor_linear_refs_fb);
auto tensor_refs_fb_vec = builder->CreateVector(tensor_refs_fb);
data::ArgumentsBuilder arguments_builder(*builder);
arguments_builder.add_shared_int4s(shared_int4s_data_fb);
arguments_builder.add_shared_float4s(shared_float4s_data_fb);
arguments_builder.add_shared_half4s(shared_half4s_data_fb);
arguments_builder.add_int_values(int_values_fb_vec);
arguments_builder.add_float_values(float_values_fb_vec);
arguments_builder.add_half_values(half_values_fb_vec);
arguments_builder.add_buffer_objects(buffer_objs_fb_vec);
arguments_builder.add_texture2d_objects(texture2d_objs_fb_vec);
arguments_builder.add_tensor_linear_objects(tensor_linear_objs_fb_vec);
arguments_builder.add_tensor_objects(tensor_objs_fb_vec);
arguments_builder.add_buffer_refs(buffer_refs_fb_vec);
arguments_builder.add_texture2d_refs(texture2d_refs_fb_vec);
arguments_builder.add_tensor_linear_refs(tensor_linear_refs_fb_vec);
arguments_builder.add_tensor_refs(tensor_refs_fb_vec);
return arguments_builder.Finish();
}
absl::Status Decode(CLContext* context, const data::GPUOperation* fb_op,
GPUOperation* op) {
RETURN_IF_ERROR(Decode(context, fb_op->arguments(), &op->args_));
op->code_ = std::string(fb_op->code()->c_str(), fb_op->code()->size());
op->work_group_size_.x = fb_op->work_group_size()->x();
op->work_group_size_.y = fb_op->work_group_size()->y();
op->work_group_size_.z = fb_op->work_group_size()->z();
for (auto option_fb : *fb_op->compiler_options()) {
op->compiler_options_.push_back(ToEnum(option_fb->option()));
}
op->tensor_to_grid_ = ToEnum(fb_op->tensor_to_grid());
op->elementwise_ = fb_op->elementwise();
op->linkable_ = fb_op->linkable();
op->check_src_channels_size_ = fb_op->check_src_channels_size();
Decode(fb_op->definition(), &op->definition_);
op->grid_dimension_ = fb_op->grid_dimension();
op->work_group_launch_order_.x = fb_op->work_group_launch_order()->x();
op->work_group_launch_order_.y = fb_op->work_group_launch_order()->y();
op->work_group_launch_order_.z = fb_op->work_group_launch_order()->z();
op->grid_size_.x = fb_op->grid_size()->x();
op->grid_size_.y = fb_op->grid_size()->y();
op->grid_size_.z = fb_op->grid_size()->z();
for (auto name_fb : *fb_op->src_tensors_names()) {
std::string name(name_fb->c_str(), name_fb->size());
op->src_tensors_names_.push_back(std::move(name));
}
for (auto name_fb : *fb_op->dst_tensors_names()) {
std::string name(name_fb->c_str(), name_fb->size());
op->dst_tensors_names_.push_back(std::move(name));
}
op->work_groups_count_.x = fb_op->work_groups_count()->x();
op->work_groups_count_.y = fb_op->work_groups_count()->y();
op->work_groups_count_.z = fb_op->work_groups_count()->z();
op->linkable_count_ = fb_op->linkable_count();
op->elementwise_code_ = std::string(fb_op->elementwise_code()->c_str(),
fb_op->elementwise_code()->size());
return absl::OkStatus();
}
flatbuffers::Offset<data::GPUOperation> Encode(
const GPUOperation& op, flatbuffers::FlatBufferBuilder* builder) {
auto args_fb = Encode(op.args_, builder);
auto code_fb = builder->CreateString(op.code_);
auto work_group_size_fb = Encode(op.work_group_size_, builder);
std::vector<flatbuffers::Offset<data::CompilerOption>> compiler_options_fb;
for (int i = 0; i < op.compiler_options_.size(); ++i) {
data::CompilerOptionBuilder option_builder(*builder);
option_builder.add_option(ToFB(op.compiler_options_[i]));
compiler_options_fb.push_back(option_builder.Finish());
}
auto compiler_options_fb_vec = builder->CreateVector(compiler_options_fb);
auto def_fb = Encode(op.definition_, builder);
auto work_group_launch_order_fb =
Encode(op.work_group_launch_order_, builder);
auto grid_size_fb = Encode(op.grid_size_, builder);
auto work_groups_count_fb = Encode(op.work_groups_count_, builder);
std::vector<flatbuffers::Offset<flatbuffers::String>> src_names_fb;
for (auto& name : op.src_tensors_names_) {
src_names_fb.push_back(builder->CreateString(name));
}
auto src_names_fb_vec = builder->CreateVector(src_names_fb);
std::vector<flatbuffers::Offset<flatbuffers::String>> dst_names_fb;
for (auto& name : op.dst_tensors_names_) {
dst_names_fb.push_back(builder->CreateString(name));
}
auto dst_names_fb_vec = builder->CreateVector(dst_names_fb);
auto elementwise_code_fb = builder->CreateString(op.elementwise_code_);
data::GPUOperationBuilder op_builder(*builder);
op_builder.add_arguments(args_fb);
op_builder.add_code(code_fb);
op_builder.add_work_group_size(work_group_size_fb);
op_builder.add_compiler_options(compiler_options_fb_vec);
op_builder.add_tensor_to_grid(ToFB(op.tensor_to_grid_));
op_builder.add_elementwise(op.elementwise_);
op_builder.add_linkable(op.linkable_);
op_builder.add_check_src_channels_size(op.check_src_channels_size_);
op_builder.add_definition(def_fb);
op_builder.add_grid_dimension(op.grid_dimension_);
op_builder.add_work_group_launch_order(work_group_launch_order_fb);
op_builder.add_grid_size(grid_size_fb);
op_builder.add_src_tensors_names(src_names_fb_vec);
op_builder.add_dst_tensors_names(dst_names_fb_vec);
op_builder.add_work_groups_count(work_groups_count_fb);
op_builder.add_linkable_count(op.linkable_count_);
op_builder.add_elementwise_code(elementwise_code_fb);
return op_builder.Finish();
}
flatbuffers::Offset<data::CLNode> Encode(
const CLNode& node, flatbuffers::FlatBufferBuilder* builder) {
auto op_fb = Encode(*node.operation, builder);
std::vector<int32_t> in_ids(node.inputs.size());
for (int i = 0; i < in_ids.size(); ++i) {
in_ids[i] = node.inputs[i];
}
std::vector<int32_t> out_ids(node.outputs.size());
for (int i = 0; i < out_ids.size(); ++i) {
out_ids[i] = node.outputs[i];
}
auto in_ids_fb = builder->CreateVector(in_ids);
auto out_ids_fb = builder->CreateVector(out_ids);
auto name_fb = builder->CreateString(node.name);
data::CLNodeBuilder node_builder(*builder);
node_builder.add_gpu_op(op_fb);
node_builder.add_input_ids(in_ids_fb);
node_builder.add_output_ids(out_ids_fb);
node_builder.add_name(name_fb);
return node_builder.Finish();
}
absl::Status Decode(CLContext* context, const data::CLNode* fb_node,
CLNode* node) {
GPUOperation op;
RETURN_IF_ERROR(Decode(context, fb_node->gpu_op(), &op));
node->operation = absl::make_unique<GPUOperation>(std::move(op));
for (auto in_fb : *fb_node->input_ids()) {
node->inputs.push_back(in_fb);
}
for (auto out_fb : *fb_node->output_ids()) {
node->outputs.push_back(out_fb);
}
node->name = std::string(fb_node->name()->c_str(), fb_node->name()->size());
return absl::OkStatus();
}
flatbuffers::Offset<data::InferenceContext> Encode(
const InferenceContext& inference,
flatbuffers::FlatBufferBuilder* builder) {
std::vector<int32_t> in_ids(inference.input_ids_.size());
for (int i = 0; i < in_ids.size(); ++i) {
in_ids[i] = inference.input_ids_[i];
}
std::vector<int32_t> out_ids(inference.output_ids_.size());
for (int i = 0; i < out_ids.size(); ++i) {
out_ids[i] = inference.output_ids_[i];
}
auto in_ids_fb = builder->CreateVector(in_ids);
auto out_ids_fb = builder->CreateVector(out_ids);
std::vector<flatbuffers::Offset<data::CLNode>> nodes_fb;
for (int i = 0; i < inference.nodes_.size(); ++i) {
auto node_fb = Encode(inference.nodes_[i], builder);
nodes_fb.push_back(node_fb);
}
auto nodes_fb_vec = builder->CreateVector(nodes_fb);
std::vector<flatbuffers::Offset<data::TensorDescWithId>> tensors_fb;
auto tensors = inference.tensor_reserver_.GetTensorDescs();
for (auto& tensor : tensors) {
auto tensor_fb = Encode(tensor.second, tensor.first, builder);
tensors_fb.push_back(tensor_fb);
}
auto tensors_fb_vec = builder->CreateVector(tensors_fb);
std::vector<flatbuffers::Offset<data::PairOfValueIds>>
variable_ids_and_refs_fb;
for (auto& pair : inference.variable_ids_and_refs_) {
data::PairOfValueIdsBuilder pair_builder(*builder);
pair_builder.add_first(pair.first);
pair_builder.add_second(pair.second);
variable_ids_and_refs_fb.push_back(pair_builder.Finish());
}
auto variable_ids_and_refs_fb_vec =
builder->CreateVector(variable_ids_and_refs_fb);
data::InferenceContextBuilder inf_builder(*builder);
inf_builder.add_need_flush(inference.need_flush_);
inf_builder.add_flush_periodically(inference.flush_periodically_);
inf_builder.add_flush_period(inference.flush_period_);
inf_builder.add_need_manual_release(inference.need_manual_release_);
inf_builder.add_precision(ToFB(inference.precision_));
inf_builder.add_storage_type(ToFB(inference.storage_type_));
inf_builder.add_nodes(nodes_fb_vec);
inf_builder.add_tensors(tensors_fb_vec);
inf_builder.add_input_ids(in_ids_fb);
inf_builder.add_output_ids(out_ids_fb);
inf_builder.add_variable_ids_and_refs(variable_ids_and_refs_fb_vec);
return inf_builder.Finish();
}
absl::Status Decode(CLContext* context,
const data::InferenceContext* fb_inference,
InferenceContext* inference) {
inference->need_flush_ = fb_inference->need_flush();
inference->flush_periodically_ = fb_inference->flush_periodically();
inference->flush_period_ = fb_inference->flush_period();
inference->need_manual_release_ = fb_inference->need_manual_release();
inference->precision_ = ToEnum(fb_inference->precision());
inference->storage_type_ = ToEnum(fb_inference->storage_type());
inference->nodes_.resize(fb_inference->nodes()->size());
int counter = 0;
for (auto node_fb : *fb_inference->nodes()) {
RETURN_IF_ERROR(Decode(context, node_fb, &inference->nodes_[counter]));
counter++;
}
std::vector<std::pair<ValueId, TensorDescriptor>> tensors;
for (auto tensor_fb : *fb_inference->tensors()) {
TensorDescriptor desc;
Decode(tensor_fb->desc(), &desc);
tensors.push_back({tensor_fb->id(), std::move(desc)});
}
inference->tensor_reserver_.Add(tensors);
for (auto in_fb : *fb_inference->input_ids()) {
inference->input_ids_.push_back(in_fb);
}
for (auto out_fb : *fb_inference->output_ids()) {
inference->output_ids_.push_back(out_fb);
}
for (auto variable_id : *fb_inference->variable_ids_and_refs()) {
inference->variable_ids_and_refs_[variable_id->first()] =
variable_id->second();
}
return absl::OkStatus();
}
} // namespace cl
} // namespace gpu
} // namespace tflite