|
377 | 377 | "StaticLayer", |
378 | 378 | "SlidingWindowLayer", |
379 | 379 | "ChunkedSlidingLayer", |
380 | | - "CacheProcessor", |
381 | | - "OffloadedCacheProcessor", |
382 | | - "QuantizedCacheProcessor", |
383 | | - "QuantoQuantizedCacheProcessor", |
384 | | - "HQQQuantizedCacheProcessor", |
| 380 | + "QuantoQuantizedLayer", |
| 381 | + "HQQQuantizedLayer", |
385 | 382 | "Cache", |
386 | 383 | "CacheConfig", |
387 | 384 | "DynamicCache", |
388 | 385 | "EncoderDecoderCache", |
389 | 386 | "HQQQuantizedCache", |
390 | | - "HQQQuantizedCacheProcessor", |
391 | 387 | "HybridCache", |
392 | 388 | "HybridChunkedCache", |
393 | 389 | "OffloadedCache", |
394 | 390 | "OffloadedStaticCache", |
395 | 391 | "QuantizedCache", |
396 | | - "QuantoQuantizedCacheProcessor", |
397 | 392 | "QuantizedCacheConfig", |
398 | 393 | "QuantoQuantizedCache", |
399 | 394 | "SinkCache", |
|
586 | 581 | # All modeling imports |
587 | 582 | from .cache_utils import Cache as Cache |
588 | 583 | from .cache_utils import CacheConfig as CacheConfig |
| 584 | + from .cache_utils import ChunkedSlidingLayer as ChunkedSlidingLayer |
589 | 585 | from .cache_utils import DynamicCache as DynamicCache |
| 586 | + from .cache_utils import DynamicLayer as DynamicLayer |
590 | 587 | from .cache_utils import EncoderDecoderCache as EncoderDecoderCache |
591 | 588 | from .cache_utils import HQQQuantizedCache as HQQQuantizedCache |
| 589 | + from .cache_utils import HQQQuantizedLayer as HQQQuantizedLayer |
592 | 590 | from .cache_utils import HybridCache as HybridCache |
593 | 591 | from .cache_utils import MambaCache as MambaCache |
594 | 592 | from .cache_utils import OffloadedCache as OffloadedCache |
595 | 593 | from .cache_utils import OffloadedStaticCache as OffloadedStaticCache |
596 | 594 | from .cache_utils import QuantizedCache as QuantizedCache |
597 | 595 | from .cache_utils import QuantizedCacheConfig as QuantizedCacheConfig |
598 | 596 | from .cache_utils import QuantoQuantizedCache as QuantoQuantizedCache |
| 597 | + from .cache_utils import QuantoQuantizedLayer as QuantoQuantizedLayer |
599 | 598 | from .cache_utils import SinkCache as SinkCache |
600 | 599 | from .cache_utils import SlidingWindowCache as SlidingWindowCache |
| 600 | + from .cache_utils import SlidingWindowLayer as SlidingWindowLayer |
601 | 601 | from .cache_utils import StaticCache as StaticCache |
| 602 | + from .cache_utils import StaticLayer as StaticLayer |
602 | 603 | from .configuration_utils import PretrainedConfig as PretrainedConfig |
603 | 604 | from .convert_slow_tokenizer import SLOW_TO_FAST_CONVERTERS as SLOW_TO_FAST_CONVERTERS |
604 | 605 | from .convert_slow_tokenizer import convert_slow_tokenizer as convert_slow_tokenizer |
|
0 commit comments