* Add a new `PjRtBuffer::HostBufferSemantics` enum that describes the possible contracts between caller and runtime. * Change `FromHostBuffer(..., force_copy, ...)` to `FromHostBuffer(..., host_buffer_semantics, ...)`. We were seeing some data races between modifications to a NumPy array and JAX on CPU, due to unintended buffer aliasing. This change allows clients to control whether they want zero-copy behavior or not. PiperOrigin-RevId: 316672280 Change-Id: Ibee296305005e0aa306a2c0aacf4b35a3d6c3ac1
61 lines
2.4 KiB
C++
61 lines
2.4 KiB
C++
/* Copyright 2020 The TensorFlow Authors. All Rights Reserved.
|
|
|
|
Licensed under the Apache License, Version 2.0 (the "License");
|
|
you may not use this file except in compliance with the License.
|
|
You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
==============================================================================*/
|
|
|
|
#include "tensorflow/compiler/xla/pjrt/interpreter_device.h"
|
|
|
|
#include "absl/strings/str_cat.h"
|
|
#include "tensorflow/compiler/xla/client/client_library.h"
|
|
#include "tensorflow/compiler/xla/service/platform_util.h"
|
|
|
|
namespace xla {
|
|
|
|
// Name string for the interpreter backend. In this file it is handed to the
// `Device` base constructor and to the `PjRtClient` constructor.
static constexpr char kInterpreterPlatformName[] = "interpreter";
|
|
|
|
// Constructs an interpreter device with the given `id`.
//
// Ownership of `local_device_state` is moved into the `Device` base class.
// `kInterpreterPlatformName` is forwarded twice: once as the base
// constructor's third argument and once as its `device_kind`.
InterpreterDevice::InterpreterDevice(
    int id, std::unique_ptr<LocalDeviceState> local_device_state)
    : Device(id,
             std::move(local_device_state),
             kInterpreterPlatformName,
             /*device_kind=*/kInterpreterPlatformName) {}
|
|
|
|
// Builds a `PjRtClient` on top of the XLA "Interpreter" platform.
//
// The returned client owns a single `InterpreterDevice` (id 0) whose
// `LocalDeviceState` is created with `LocalDeviceState::kSynchronous`,
// `asynchronous=false` and `allow_event_reuse=false`.
//
// Returns a non-OK status when:
//   * the "Interpreter" platform cannot be obtained,
//   * the platform does not report exactly one visible device
//     (FailedPrecondition),
//   * the `LocalClient` cannot be obtained or created, or
//   * the stream executor for device ordinal 0 cannot be obtained.
StatusOr<std::shared_ptr<PjRtClient>> GetInterpreterClient() {
  TF_ASSIGN_OR_RETURN(se::Platform * platform,
                      PlatformUtil::GetPlatform("Interpreter"));
  if (platform->VisibleDeviceCount() != 1) {
    return FailedPrecondition(
        "Interpreter platform should have exactly one device.");
  }

  LocalClientOptions options;
  options.set_platform(platform);
  TF_ASSIGN_OR_RETURN(LocalClient * client,
                      ClientLibrary::GetOrCreateLocalClient(options));

  // Propagate a stream-executor lookup failure to the caller. This function
  // already returns StatusOr, so there is no reason to abort the process with
  // ValueOrDie() here.
  TF_ASSIGN_OR_RETURN(se::StreamExecutor * executor,
                      client->backend().stream_executor(0));
  auto device_state = absl::make_unique<LocalDeviceState>(
      executor, client, LocalDeviceState::kSynchronous, /*asynchronous=*/false,
      /*allow_event_reuse=*/false);

  // The client is handed exactly one device, with id 0.
  std::vector<std::unique_ptr<Device>> devices;
  devices.push_back(
      absl::make_unique<InterpreterDevice>(0, std::move(device_state)));

  return std::make_shared<PjRtClient>(
      kInterpreterPlatformName, client, std::move(devices), /*host_id=*/0,
      /*allocator=*/nullptr, /*host_memory_allocator=*/nullptr,
      /*should_stage_host_to_device_transfers=*/false,
      /*gpu_run_options=*/nullptr);
}
|
|
|
|
} // namespace xla
|