Buffer implements GPUObject. PiperOrigin-RevId: 317746356 Change-Id: I715d37a924298e54e9fe68e5c7b719ab592237a1
122 lines
4.2 KiB
C++
122 lines
4.2 KiB
C++
/* Copyright 2019 The TensorFlow Authors. All Rights Reserved.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
==============================================================================*/
|
|
|
|
#ifndef TENSORFLOW_LITE_DELEGATES_GPU_CL_BUFFER_H_
|
|
#define TENSORFLOW_LITE_DELEGATES_GPU_CL_BUFFER_H_
|
|
|
|
#include <cstddef>
#include <cstdint>
#include <string>
#include <vector>

#include "absl/strings/str_cat.h"
#include "absl/types/span.h"
#include "tensorflow/lite/delegates/gpu/cl/cl_command_queue.h"
#include "tensorflow/lite/delegates/gpu/cl/cl_context.h"
#include "tensorflow/lite/delegates/gpu/cl/gpu_object.h"
#include "tensorflow/lite/delegates/gpu/cl/opencl_wrapper.h"
#include "tensorflow/lite/delegates/gpu/cl/util.h"
#include "tensorflow/lite/delegates/gpu/common/status.h"
|
|
|
|
namespace tflite {
|
|
namespace gpu {
|
|
namespace cl {
|
|
|
|
struct BufferDescriptor : public GPUObjectDescriptor {
|
|
DataType element_type; // FLOAT32 or FLOAT16
|
|
int element_size;
|
|
|
|
absl::Status PerformSelector(const std::string& selector,
|
|
const std::vector<std::string>& args,
|
|
const std::vector<std::string>& template_args,
|
|
std::string* result) const override;
|
|
|
|
GPUResources GetGPUResources(AccessType access_type) const override;
|
|
absl::Status PerformReadSelector(const std::vector<std::string>& args,
|
|
std::string* result) const;
|
|
};
|
|
|
|
// Buffer represents linear GPU data storage with arbitrary data format.
|
|
// Buffer is moveable but not copyable.
|
|
class Buffer : public GPUObject {
|
|
public:
|
|
Buffer() {} // just for using Buffer as a class members
|
|
Buffer(cl_mem buffer, size_t size_in_bytes);
|
|
|
|
// Move only
|
|
Buffer(Buffer&& buffer);
|
|
Buffer& operator=(Buffer&& buffer);
|
|
Buffer(const Buffer&) = delete;
|
|
Buffer& operator=(const Buffer&) = delete;
|
|
|
|
~Buffer();
|
|
|
|
// for profiling and memory statistics
|
|
uint64_t GetMemorySizeInBytes() const { return size_; }
|
|
|
|
cl_mem GetMemoryPtr() const { return buffer_; }
|
|
|
|
// Writes data to a buffer. Data should point to a region that
|
|
// has exact size in bytes as size_in_bytes(constructor parameter).
|
|
template <typename T>
|
|
absl::Status WriteData(CLCommandQueue* queue, const absl::Span<T> data);
|
|
|
|
// Reads data from Buffer into CPU memory.
|
|
template <typename T>
|
|
absl::Status ReadData(CLCommandQueue* queue, std::vector<T>* result) const;
|
|
|
|
GPUResourcesWithValue GetGPUResources(AccessType access_type) const override;
|
|
|
|
private:
|
|
void Release();
|
|
|
|
cl_mem buffer_ = nullptr;
|
|
size_t size_;
|
|
};
|
|
|
|
// Buffer factory functions. Only the declarations are visible in this header;
// each one reports success or failure through the returned absl::Status and
// delivers the new object through `result`.
// NOTE(review): "read-only" / "read-write" presumably describes how kernels
// may access the buffer -- confirm against the definitions.

// Creates a read-only buffer of `size_in_bytes` bytes in `context`.
absl::Status CreateReadOnlyBuffer(size_t size_in_bytes, CLContext* context,
                                  Buffer* result);

// Same as above, but additionally takes a `data` pointer.
// NOTE(review): presumably the initial contents, at least `size_in_bytes`
// bytes long -- confirm against the definition.
absl::Status CreateReadOnlyBuffer(size_t size_in_bytes, const void* data,
                                  CLContext* context, Buffer* result);

// Creates a read-write buffer of `size_in_bytes` bytes in `context`.
absl::Status CreateReadWriteBuffer(size_t size_in_bytes, CLContext* context,
                                   Buffer* result);
|
|
|
|
template <typename T>
|
|
absl::Status Buffer::WriteData(CLCommandQueue* queue,
|
|
const absl::Span<T> data) {
|
|
if (size_ != sizeof(T) * data.size()) {
|
|
return absl::InvalidArgumentError(
|
|
"absl::Span<T> data size is different from buffer allocated size.");
|
|
}
|
|
RETURN_IF_ERROR(queue->EnqueueWriteBuffer(buffer_, size_, data.data()));
|
|
return absl::OkStatus();
|
|
}
|
|
|
|
template <typename T>
|
|
absl::Status Buffer::ReadData(CLCommandQueue* queue,
|
|
std::vector<T>* result) const {
|
|
if (size_ % sizeof(T) != 0) {
|
|
return absl::UnknownError("Wrong element size(typename T is not correct?");
|
|
}
|
|
|
|
const int elements_count = size_ / sizeof(T);
|
|
result->resize(elements_count);
|
|
|
|
return queue->EnqueueReadBuffer(buffer_, size_, result->data());
|
|
}
|
|
|
|
} // namespace cl
|
|
} // namespace gpu
|
|
} // namespace tflite
|
|
|
|
#endif // TENSORFLOW_LITE_DELEGATES_GPU_CL_BUFFER_H_
|