Better FullyConnected/ConvTransposed selection for Intel.

PiperOrigin-RevId: 316997745
Change-Id: I28befdd528917c3846ff6ae79b0f8427389dfc39
This commit is contained in:
Raman Sarokin 2020-06-17 17:18:45 -07:00 committed by TensorFlower Gardener
parent bae911298b
commit 1f05cc5973
4 changed files with 6 additions and 2 deletions

View File

@@ -269,7 +269,7 @@ ConvolutionTransposed3x3::ConvolutionTransposed3x3(
work_group_launch_order_(2, 0, 1) {
if (device.IsPowerVR()) {
weights_upload_type_ = WeightsUploadType::LOCAL_MEM_ASYNC;
-} else if (device.IsNvidia()) {
+} else if (device.IsNvidia() || device.IsIntel()) {
weights_upload_type_ = WeightsUploadType::LOCAL_MEM_BY_THREADS;
} else if (device.IsAMD()) {
weights_upload_type_ = WeightsUploadType::CONSTANT_MEM;

View File

@@ -270,7 +270,7 @@ ConvolutionTransposed4x4::ConvolutionTransposed4x4(
: GPUOperation(definition) {
if (device.IsPowerVR()) {
weights_upload_type_ = WeightsUploadType::LOCAL_MEM_ASYNC;
-} else if (device.IsNvidia()) {
+} else if (device.IsNvidia() || device.IsIntel()) {
weights_upload_type_ = WeightsUploadType::LOCAL_MEM_BY_THREADS;
} else if (device.IsAMD()) {
weights_upload_type_ = WeightsUploadType::CONSTANT_MEM;

View File

@@ -112,6 +112,7 @@ absl::Status SelectConvolutionTransposed(
case Vendor::POWERVR:
case Vendor::NVIDIA:
case Vendor::AMD:
+case Vendor::INTEL:
return SelectConvolutionTransposedPowerVR(attr, creation_context, op_def,
ptr);
case Vendor::MALI:

View File

@@ -109,6 +109,9 @@ absl::Status SelectFullyConnected(const FullyConnectedAttributes& attr,
return SelectFullyConnectedAdreno(attr, creation_context, op_def,
batch_size, ptr);
case Vendor::POWERVR:
+case Vendor::AMD:
+case Vendor::NVIDIA:
+case Vendor::INTEL:
return SelectFullyConnectedPowerVR(attr, creation_context, op_def,
batch_size, ptr);
case Vendor::MALI: