Restruct sgl-kernel benchmark (#10861)
This commit is contained in:
@@ -41,7 +41,7 @@ def benchmark(num_tokens, impl):
|
||||
def runner():
|
||||
dsv3_fused_a_gemm(mat_a, mat_b)
|
||||
|
||||
ms, min_ms, max_ms = triton.testing.do_bench(runner, quantiles=quantiles)
|
||||
ms, min_ms, max_ms = triton.testing.do_bench_cudagraph(runner, quantiles=quantiles)
|
||||
|
||||
def tflops(t_ms):
|
||||
flops = 2 * M * K * N
|
||||
@@ -54,4 +54,4 @@ if __name__ == "__main__":
|
||||
parser = argparse.ArgumentParser()
|
||||
args = parser.parse_args()
|
||||
|
||||
benchmark.run(print_data=True, show_plots=True, save_path="bench_dsv3_gemm")
|
||||
benchmark.run(print_data=True)
|
||||
|
||||
Reference in New Issue
Block a user