Merge pull request #43214 from nouiz:upstream-maxwell-test
PiperOrigin-RevId: 331800832 Change-Id: I9777ecb0d4d5777135eea92064b3c1dc264ec773
This commit is contained in:
commit
9b6a1850d9
@ -336,8 +336,17 @@ ENTRY %cluster {
|
||||
|
||||
TF_ASSERT_OK_AND_ASSIGN(std::unique_ptr<VerifiedHloModule> optimized_module,
|
||||
ParseAndReturnVerifiedModule(hlo_text));
|
||||
CompileAndOptionallyVerifyPtx(std::move(optimized_module),
|
||||
R"(
|
||||
const se::DeviceDescription& device_description =
|
||||
backend().default_stream_executor()->GetDeviceDescription();
|
||||
int cc_major = 0, cc_minor = 0;
|
||||
device_description.cuda_compute_capability(&cc_major, &cc_minor);
|
||||
|
||||
string expected;
|
||||
if (cc_major < 6) {
|
||||
// We do not vectorize for GPU before Pascal.
|
||||
expected = "CHECK-NOT: ld.global.nc.v2.f32";
|
||||
} else {
|
||||
expected = R"(
|
||||
CHECK: ld.global.nc.v2.f32
|
||||
CHECK: st.global.v2.f32
|
||||
CHECK: st.global.v2.f32
|
||||
@ -350,7 +359,9 @@ CHECK: st.global.v2.f32
|
||||
CHECK: ld.global.nc.v2.f32
|
||||
CHECK: st.global.v2.f32
|
||||
CHECK: st.global.v2.f32
|
||||
)");
|
||||
)";
|
||||
}
|
||||
CompileAndOptionallyVerifyPtx(std::move(optimized_module), expected);
|
||||
|
||||
EXPECT_TRUE(RunAndCompare(hlo_text, ErrorSpec{1e-5, 1e-5}));
|
||||
}
|
||||
|
Loading…
Reference in New Issue
Block a user