Skip to content

Commit 881822d

Browse files
committed
dbg
stack-info: PR: #1911, branch: shunting314/stack/30
1 parent 535386d commit 881822d

File tree

2 files changed

+11
-7
lines changed

2 files changed

+11
-7
lines changed

examples/distributed/fp8_matmul_reduce_scatter.py

Lines changed: 8 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -33,13 +33,16 @@
3333
max_mismatch_pct=1e-3,
3434
)
3535

36+
config = helion.Config(
37+
block_sizes=[64, 64, 32], # M, N, K
38+
num_warps=8,
39+
num_stages=3,
40+
)
41+
42+
# config = helion.Config(block_sizes=[64, 128, 128], indexing=['pointer', 'pointer', 'pointer', 'tensor_descriptor', 'pointer', 'pointer', 'pointer', 'pointer', 'tensor_descriptor', 'pointer', 'pointer', 'pointer', 'tensor_descriptor', 'pointer'], l2_groupings=[1], load_eviction_policies=['last', '', '', '', '', 'first', '', '', '', '', '', 'last'], loop_orders=[[0, 1]], num_sm_multiplier=2, num_stages=1, num_warps=8, pid_type='persistent_blocked', range_flattens=[None, None], range_multi_buffers=[True, None], range_unroll_factors=[3, 0], range_warp_specializes=[])
3643

3744
@helion.kernel(
38-
config=helion.Config(
39-
block_sizes=[64, 64, 32], # M, N, K
40-
num_warps=8,
41-
num_stages=3,
42-
),
45+
config=config,
4346
static_shapes=True,
4447
ignore_warnings=[helion.exc.TensorOperationInWrapper],
4548
autotune_baseline_accuracy_check_fn=functools.partial(

helion/autotuner/base_search.py

Lines changed: 3 additions & 2 deletions
Original file line number | Diff line number | Diff line change
@@ -635,8 +635,9 @@ def _validate_against_baseline(
635635
custom_check = self.settings.autotune_baseline_accuracy_check_fn
636636
if custom_check is not None:
637637
custom_check(output, self._baseline_output)
638-
if len(self._mutated_arg_indices) > 0:
639-
custom_check(args, self._baseline_post_args)
638+
if os.getenv("CHECK_INPUT_ACCURACY", "1") == "1":
639+
if len(self._mutated_arg_indices) > 0:
640+
custom_check(args, self._baseline_post_args)
640641
else:
641642
_assert_close(
642643
output,

0 commit comments

Comments
 (0)