mirror of
https://github.com/hpcaitech/ColossalAI.git
synced 2025-08-31 16:40:41 +00:00
[doc] updated inference readme (#5343)
This commit is contained in:
@@ -1,5 +1,7 @@
|
||||
from typing import Any
|
||||
|
||||
__all__ = ["CacheBlock"]
|
||||
|
||||
|
||||
class CacheBlock:
|
||||
"""A simplified version of logical cache block used for Paged Attention."""
|
||||
|
@@ -10,6 +10,8 @@ from colossalai.utils import get_current_device
|
||||
|
||||
from .block_cache import CacheBlock
|
||||
|
||||
__all__ = ["KVCacheManager"]
|
||||
|
||||
GIGABYTE = 1024**3
|
||||
|
||||
|
||||
|
Reference in New Issue
Block a user