[Minor] move triton attention kernels into a separate folder (#1379)

This commit is contained in:
Lianmin Zheng
2024-09-10 15:15:08 -07:00
committed by GitHub
parent fbb4754cb8
commit 3a6e8b6d78
13 changed files with 24 additions and 15 deletions

View File

@@ -13,6 +13,8 @@ See the License for the specific language governing permissions and
limitations under the License.
"""
"""For constrained decoding."""
import json
from typing import Dict, Optional, Union