Merge pull request #43214 from nouiz:upstream-maxwell-test

PiperOrigin-RevId: 331800832
Change-Id: I9777ecb0d4d5777135eea92064b3c1dc264ec773
This commit is contained in:
TensorFlower Gardener 2020-09-15 10:46:48 -07:00
commit 9b6a1850d9

View File

@ -336,8 +336,17 @@ ENTRY %cluster {
TF_ASSERT_OK_AND_ASSIGN(std::unique_ptr<VerifiedHloModule> optimized_module,
ParseAndReturnVerifiedModule(hlo_text));
CompileAndOptionallyVerifyPtx(std::move(optimized_module),
R"(
const se::DeviceDescription& device_description =
backend().default_stream_executor()->GetDeviceDescription();
int cc_major = 0, cc_minor = 0;
device_description.cuda_compute_capability(&cc_major, &cc_minor);
string expected;
if (cc_major < 6) {
// We do not vectorize on GPUs older than Pascal (compute capability < 6.0).
expected = "CHECK-NOT: ld.global.nc.v2.f32";
} else {
expected = R"(
CHECK: ld.global.nc.v2.f32
CHECK: st.global.v2.f32
CHECK: st.global.v2.f32
@ -350,7 +359,9 @@ CHECK: st.global.v2.f32
CHECK: ld.global.nc.v2.f32
CHECK: st.global.v2.f32
CHECK: st.global.v2.f32
)");
)";
}
CompileAndOptionallyVerifyPtx(std::move(optimized_module), expected);
EXPECT_TRUE(RunAndCompare(hlo_text, ErrorSpec{1e-5, 1e-5}));
}