Spaces:
Running
on
Zero
Running
on
Zero
File size: 833 Bytes
43a7079 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 |
# Copyright (c) 2024 Microsoft
# Licensed under The MIT License [see LICENSE for details]
# flake8: noqa
from .minference_configuration import MInferenceConfig
from .models_patch import MInference
from .ops.block_sparse_flash_attention import block_sparse_attention
from .ops.pit_sparse_flash_attention_v2 import vertical_slash_sparse_attention
from .ops.streaming_kernel import streaming_forward
from .patch import (
minference_patch,
minference_patch_kv_cache_cpu,
minference_patch_with_snapkv,
patch_hf,
)
from .version import VERSION as __version__
# Public names of the package: this list controls what a star-import
# (`from <package> import *`) exposes. Every entry is bound by one of the
# imports at the top of this module.
# `__version__` is also bound at module level but is not listed here, so it is
# reachable as an attribute while being skipped by star-imports.
__all__ = [
    # Re-exported from .models_patch and .minference_configuration
    "MInference",
    "MInferenceConfig",
    # Re-exported from .patch
    "minference_patch",
    "minference_patch_kv_cache_cpu",
    "minference_patch_with_snapkv",
    "patch_hf",
    # Re-exported from the .ops subpackage
    "vertical_slash_sparse_attention",
    "block_sparse_attention",
    "streaming_forward",
]
|