diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json index d3677bebb..21924c7e7 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json @@ -143,4 +143,4 @@ "num_warps": 4, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json index 265768fb9..598993c61 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json @@ -215,4 +215,4 @@ "num_warps": 4, "num_stages": 4 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json index d3be23dfc..a7c626e9b 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json @@ -215,4 +215,4 @@ "num_warps": 4, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json index 589f5d39f..14bf13935 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json @@ -215,4 +215,4 @@ "num_warps": 4, "num_stages": 4 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json index 2c78bfaba..29972c5f3 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json @@ -215,4 +215,4 @@ "num_warps": 8, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_H100_80GB_HBM3.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_H100_80GB_HBM3.json index 4da841e74..082fba99b 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_H100_80GB_HBM3.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3072,device_name=NVIDIA_H100_80GB_HBM3.json @@ -215,4 +215,4 @@ "num_warps": 8, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json index 200356713..dbed86769 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json @@ -215,4 +215,4 @@ "num_warps": 4, "num_stages": 4 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json index e076615ee..b89336a26 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json @@ -215,4 +215,4 @@ "num_warps": 4, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json index ee896554b..39bc5b9e5 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json @@ -215,4 +215,4 @@ "num_warps": 4, "num_stages": 4 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json index 05aed8b1c..35d67f837 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=1,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json @@ -215,4 +215,4 @@ "num_warps": 4, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json index 51ad5b299..6443c5cd0 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=14336,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json @@ -143,4 +143,4 @@ "num_warps": 4, "num_stages": 4 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json index ee5119182..1fe9aad96 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=14336,device_name=NVIDIA_A100-SXM4-80GB.json @@ -143,4 +143,4 @@ "num_warps": 8, "num_stages": 4 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json index 68793c77b..9b48fe26d 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=1792,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json @@ -215,4 +215,4 @@ "num_warps": 4, "num_stages": 4 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json index 612910720..5ff4a1600 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=1792,device_name=NVIDIA_A100-SXM4-80GB.json @@ -215,4 +215,4 @@ "num_warps": 4, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3072,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3072,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json index 51d03d860..f1f626667 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3072,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3072,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json @@ -143,4 +143,4 @@ "num_warps": 4, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json index 26f9abd6b..6c809a096 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3072,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json @@ -143,4 +143,4 @@ "num_warps": 8, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3200,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3200,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json index cd0cdbea0..3a9e2ef0f 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3200,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3200,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json @@ -127,4 +127,4 @@ "num_warps": 4, "num_stages": 2 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3584,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3584,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json index 64be6e659..1bfd02a41 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3584,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3584,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json @@ -143,4 +143,4 @@ "num_warps": 4, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json index 0a6a6a73f..0bb90b7e4 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=3584,device_name=NVIDIA_A100-SXM4-80GB.json @@ -215,4 +215,4 @@ "num_warps": 4, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=6400,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=6400,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json index ba9041d00..033ba506d 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=6400,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=6400,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json @@ -127,4 +127,4 @@ "num_warps": 4, "num_stages": 4 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json index 7a7508aab..14723c576 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_A100-SXM4-80GB,dtype=int8_w8a16.json @@ -143,4 +143,4 @@ "num_warps": 4, "num_stages": 4 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json index dbf9a2dd6..9e9d27b1c 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_A100-SXM4-80GB.json @@ -143,4 +143,4 @@ "num_warps": 8, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json index bbb238604..6ac5ba746 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=7168,device_name=NVIDIA_H100_80GB_HBM3,dtype=int8_w8a16.json @@ -143,4 +143,4 @@ "num_warps": 8, "num_stages": 3 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=800,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=800,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json index 57055453a..c87ca0de8 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=800,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=16,N=800,device_name=NVIDIA_H100_80GB_HBM3,dtype=fp8_w8a8.json @@ -127,4 +127,4 @@ "num_warps": 8, "num_stages": 4 } -} \ No newline at end of file +} diff --git a/python/sglang/srt/layers/triton_fused_moe/configs/E=8,N=3584,device_name=NVIDIA_L40S.json b/python/sglang/srt/layers/triton_fused_moe/configs/E=8,N=3584,device_name=NVIDIA_L40S.json index d720deb4b..6499c8586 100644 --- a/python/sglang/srt/layers/triton_fused_moe/configs/E=8,N=3584,device_name=NVIDIA_L40S.json +++ b/python/sglang/srt/layers/triton_fused_moe/configs/E=8,N=3584,device_name=NVIDIA_L40S.json @@ -170,4 +170,4 @@ "num_ctas": 1, "num_stages": 2 } -} \ No newline at end of file +}