ColossalAI/examples/tutorial/opt/inference/cache.py

from collections import OrderedDict
from contextlib import contextmanager
from threading import Lock
from typing import Any, Dict, Hashable, List, Optional


class MissCacheError(Exception):
    """Raised by ``ListCache.get`` when a key is absent or its value list is not yet full."""


class ListCache:
    """Lock-guarded cache that maps each key to a bounded list of distinct values.

    Keys come in two flavours:

    * fixed keys, declared at construction time, are never evicted;
    * all other keys live in an LRU store holding at most ``cache_size`` keys.

    A key only counts as a hit once its value list holds ``list_size`` entries.
    """

    def __init__(self, cache_size: int, list_size: int, fixed_keys: Optional[List[Hashable]] = None) -> None:
        """Cache a list of values. The fixed keys won't be removed. For other keys, LRU is applied.
        When the value list is not full, a cache miss occurs. Otherwise, a cache hit occurs.
        Duplicate values, and values offered once the list is full, are ignored.

        Args:
            cache_size (int): Max number of keys kept in the LRU cache. When it is <= 0,
                non-fixed keys are never stored.
            list_size (int): Number of values a key must hold before ``get`` returns a hit.
            fixed_keys (List[Hashable], optional): The keys which won't be removed.
                Defaults to None, meaning no fixed keys.
        """
        self.cache_size = cache_size
        self.list_size = list_size
        self.cache: OrderedDict[Hashable, List[Any]] = OrderedDict()
        # A ``None`` default (instead of ``[]``) avoids sharing one mutable default between calls.
        self.fixed_cache: Dict[Hashable, List[Any]] = {key: [] for key in (fixed_keys or ())}
        self._lock = Lock()

    def _lookup(self, key: Hashable) -> Optional[List[Any]]:
        """Return the stored value list for ``key``, or None when the key is unknown.

        Fixed keys take precedence. Touching an LRU key marks it as most recently used.
        Must be called with the lock held.
        """
        if key in self.fixed_cache:
            return self.fixed_cache[key]
        if key in self.cache:
            self.cache.move_to_end(key)
            return self.cache[key]
        return None

    def get(self, key: Hashable) -> List[Any]:
        """Return the value list of ``key`` if it is full.

        Looking up a non-fixed key refreshes its LRU position even when the
        lookup ends up being a miss because the list is not full yet.

        Args:
            key (Hashable): Key to look up.

        Returns:
            List[Any]: The stored list itself (not a copy).

        Raises:
            MissCacheError: If the key is unknown or holds fewer than ``list_size`` values.
        """
        with self.lock():
            values = self._lookup(key)
            if values is not None and len(values) >= self.list_size:
                return values
        raise MissCacheError()

    def add(self, key: Hashable, value: Any) -> None:
        """Record ``value`` under ``key``.

        For a known key the value is appended only if the list is not full and
        does not already contain it. For an unknown key a new LRU entry is
        created, evicting the least recently used key when the LRU store is full.

        Args:
            key (Hashable): Key to store the value under.
            value (Any): Value to append to the key's list.
        """
        with self.lock():
            values = self._lookup(key)
            if values is not None:
                if len(values) < self.list_size and value not in values:
                    values.append(value)
                return
            if self.cache_size <= 0:
                # No LRU capacity: nothing can be stored, and there is nothing to evict
                # (popitem on an empty OrderedDict would raise KeyError).
                return
            if len(self.cache) >= self.cache_size:
                self.cache.popitem(last=False)
            self.cache[key] = [value]

    @contextmanager
    def lock(self):
        """Context manager that holds the cache's internal lock for the ``with`` body.

        The underlying ``threading.Lock`` is not reentrant, so ``get``/``add``
        must not be called while this context is held by the same thread.
        """
        # ``with`` releases only a lock that was actually acquired.
        with self._lock:
            yield
[tutorial] edited hands-on practices (#1899) * Add handson to ColossalAI. * Change names of handsons and edit sequence parallel example. * Edit wrong folder name * resolve conflict * delete readme 2022-11-11 09:08:17 +00:00			`from collections import OrderedDict`
			`from contextlib import contextmanager`
[misc] update pre-commit and run all files (#4752) * [misc] update pre-commit * [misc] run pre-commit * [misc] remove useless configuration files * [misc] ignore cuda for clang-format 2023-09-19 06:20:26 +00:00			`from threading import Lock`
			`from typing import Any, Dict, Hashable, List`
[tutorial] edited hands-on practices (#1899) * Add handson to ColossalAI. * Change names of handsons and edit sequence parallel example. * Edit wrong folder name * resolve conflict * delete readme 2022-11-11 09:08:17 +00:00

			`class MissCacheError(Exception):`
			`pass`


			`class ListCache:`
			`def __init__(self, cache_size: int, list_size: int, fixed_keys: List[Hashable] = []) -> None:`
			`"""Cache a list of values. The fixed keys won't be removed. For other keys, LRU is applied.`
			`When the value list is not full, a cache miss occurs. Otherwise, a cache hit occurs. Redundant values will be removed.`

			`Args:`
			`cache_size (int): Max size for LRU cache.`
			`list_size (int): Value list size.`
			`fixed_keys (List[Hashable], optional): The keys which won't be removed. Defaults to [].`
			`"""`
			`self.cache_size = cache_size`
			`self.list_size = list_size`
			`self.cache: OrderedDict[Hashable, List[Any]] = OrderedDict()`
			`self.fixed_cache: Dict[Hashable, List[Any]] = {}`
			`for key in fixed_keys:`
			`self.fixed_cache[key] = []`
			`self._lock = Lock()`

			`def get(self, key: Hashable) -> List[Any]:`
			`with self.lock():`
			`if key in self.fixed_cache:`
			`l = self.fixed_cache[key]`
			`if len(l) >= self.list_size:`
			`return l`
			`elif key in self.cache:`
			`self.cache.move_to_end(key)`
			`l = self.cache[key]`
			`if len(l) >= self.list_size:`
			`return l`
			`raise MissCacheError()`

			`def add(self, key: Hashable, value: Any) -> None:`
			`with self.lock():`
			`if key in self.fixed_cache:`
			`l = self.fixed_cache[key]`
			`if len(l) < self.list_size and value not in l:`
			`l.append(value)`
			`elif key in self.cache:`
			`self.cache.move_to_end(key)`
			`l = self.cache[key]`
			`if len(l) < self.list_size and value not in l:`
			`l.append(value)`
			`else:`
			`if len(self.cache) >= self.cache_size:`
			`self.cache.popitem(last=False)`
			`self.cache[key] = [value]`

			`@contextmanager`
			`def lock(self):`
			`try:`
			`self._lock.acquire()`
			`yield`
			`finally:`
			`self._lock.release()`