Better FullyConnected/ConvTransposed selection for Intel.
PiperOrigin-RevId: 316997745
Change-Id: I28befdd528917c3846ff6ae79b0f8427389dfc39
This commit is contained in:
parent
bae911298b
commit
1f05cc5973
@@ -269,7 +269,7 @@ ConvolutionTransposed3x3::ConvolutionTransposed3x3(
|
||||
work_group_launch_order_(2, 0, 1) {
|
||||
if (device.IsPowerVR()) {
|
||||
weights_upload_type_ = WeightsUploadType::LOCAL_MEM_ASYNC;
|
||||
- } else if (device.IsNvidia()) {
|
||||
+ } else if (device.IsNvidia() || device.IsIntel()) {
|
||||
weights_upload_type_ = WeightsUploadType::LOCAL_MEM_BY_THREADS;
|
||||
} else if (device.IsAMD()) {
|
||||
weights_upload_type_ = WeightsUploadType::CONSTANT_MEM;
|
||||
|
@@ -270,7 +270,7 @@ ConvolutionTransposed4x4::ConvolutionTransposed4x4(
|
||||
: GPUOperation(definition) {
|
||||
if (device.IsPowerVR()) {
|
||||
weights_upload_type_ = WeightsUploadType::LOCAL_MEM_ASYNC;
|
||||
- } else if (device.IsNvidia()) {
|
||||
+ } else if (device.IsNvidia() || device.IsIntel()) {
|
||||
weights_upload_type_ = WeightsUploadType::LOCAL_MEM_BY_THREADS;
|
||||
} else if (device.IsAMD()) {
|
||||
weights_upload_type_ = WeightsUploadType::CONSTANT_MEM;
|
||||
|
@@ -112,6 +112,7 @@ absl::Status SelectConvolutionTransposed(
|
||||
case Vendor::POWERVR:
|
||||
case Vendor::NVIDIA:
|
||||
case Vendor::AMD:
|
||||
+ case Vendor::INTEL:
|
||||
return SelectConvolutionTransposedPowerVR(attr, creation_context, op_def,
|
||||
ptr);
|
||||
case Vendor::MALI:
|
||||
|
@@ -109,6 +109,9 @@ absl::Status SelectFullyConnected(const FullyConnectedAttributes& attr,
|
||||
return SelectFullyConnectedAdreno(attr, creation_context, op_def,
|
||||
batch_size, ptr);
|
||||
case Vendor::POWERVR:
|
||||
+ case Vendor::AMD:
|
||||
+ case Vendor::NVIDIA:
|
||||
+ case Vendor::INTEL:
|
||||
return SelectFullyConnectedPowerVR(attr, creation_context, op_def,
|
||||
batch_size, ptr);
|
||||
case Vendor::MALI:
|
||||
|
Loading…
x
Reference in New Issue
Block a user