File size: 612 Bytes
b786614
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
"""
proactive_cache — make any HuggingFace transformer O(n).

Main entry point:
    from proactive_cache import ProactiveCache
"""

from .core import ProactiveCache
from .eviction import score_tokens, prune_kv_cache
from .prototypes import build_prototypes, load_prototypes, save_prototypes
from .profiler import profile_model
from .press import ProactiveCachePress

__version__ = "0.1.0"
__author__ = "Khavin S"

__all__ = [
    "ProactiveCache",
    "ProactiveCachePress",
    "profile_model",
    "build_prototypes",
    "load_prototypes",
    "save_prototypes",
    "score_tokens",
    "prune_kv_cache",
]