File tree Expand file tree Collapse file tree 1 file changed +2
-1
lines changed
torch/csrc/jit/codegen/cuda/test Expand file tree Collapse file tree 1 file changed +2
-1
lines changed Original file line number Diff line number Diff line change @@ -9636,7 +9636,6 @@ TEST_F(NVFuserTest, FusionPersistentNormLocalShared_CUDA) {
9636
9636
9637
9637
torch::jit::fuser::cuda::FusionExecutor fe;
9638
9638
fe.compileFusion(&fusion, aten_inputs);
9639
- fe.runFusion(aten_inputs, {cg_static_out, cg_dynamic_out});
9640
9639
9641
9640
auto properties = at::cuda::getDeviceProperties(0);
9642
9641
// Require 70KB of smem to run test
@@ -9645,6 +9644,8 @@ TEST_F(NVFuserTest, FusionPersistentNormLocalShared_CUDA) {
9645
9644
GTEST_SKIP() << "not enough shared memory space on device to run test";
9646
9645
}
9647
9646
9647
+ fe.runFusion(aten_inputs, {cg_static_out, cg_dynamic_out});
9648
+
9648
9649
auto at_mu = at::mean(aten_input.to(at::kDouble), -1).unsqueeze(1);
9649
9650
auto at_var = at::var(aten_input.to(at::kDouble), -1, false).unsqueeze(1);
9650
9651
auto at_rvar = at::rsqrt(at::add(at_var, kEps));
You can’t perform that action at this time.
0 commit comments