@@ -103,7 +103,7 @@ INSTANTIATE_TEST_SUITE_P(
103103    });
104104
105105using  ClusterReductionTestAutoScheduler = ClusterReductionTest;
106- TEST_P (ClusterReductionTestAutoScheduler, SoftmaxDtypeHiddenSize ) {
106+ TEST_P (ClusterReductionTestAutoScheduler, Softmax ) {
107107  auto  [hidden_size, dtype] = GetParam ();
108108  int  batch_size = scheduler_utils::safeDiv (deviceSMCount (), 8 );
109109  auto  fusion_ptr = std::make_unique<Fusion>();
@@ -112,9 +112,9 @@ TEST_P(ClusterReductionTestAutoScheduler, SoftmaxDtypeHiddenSize) {
112112  auto  tv0 = makeContigTensor (2 , dtype);
113113  fusion.addInput (tv0);
114114  auto  tv1 = maybeCastOp (DataType::Float, tv0);
115-      auto  tv2 = softmax (tv1, 1 );
116-      auto  tv3 = maybeCastOp (DataType::BFloat16, tv2);
117-      fusion.addOutput (tv3);
115+   auto  tv2 = softmax (tv1, 1 );
116+   auto  tv3 = maybeCastOp (DataType::BFloat16, tv2);
117+   fusion.addOutput (tv3);
118118  auto  unscheduled_fusion_copy = fusion;
119119
120120  auto  options =
@@ -129,7 +129,6 @@ TEST_P(ClusterReductionTestAutoScheduler, SoftmaxDtypeHiddenSize) {
129129  }
130130  testValidate (&unscheduled_fusion_copy, outputs, {t0});
131131}
132- 
133132INSTANTIATE_TEST_SUITE_P (
134133    ,
135134    ClusterReductionTestAutoScheduler,
0 commit comments