Coverage for cuda/core/utils/_program_cache/_in_memory.py

3# SPDX-License-Identifier: Apache-2.0

5"""In-memory bytes-in / bytes-out program cache."""

7from __future__ import annotations (empty)

9import collections (empty)

10import threading (empty)

12from cuda.core._module import ObjectCode (empty)

14from ._abc import ProgramCacheResource, _as_key_bytes, _extract_bytes (empty)

class InMemoryProgramCache(ProgramCacheResource):
    """Process-local program cache that evicts least-recently-used entries.

    Intended for single-process workflows that compile kernels once and
    then look them up repeatedly without touching the disk. Nothing is
    persisted: entries disappear when the process exits. Use
    :class:`FileStreamProgramCache` when the cache must survive across
    runs.

    The interface is bytes-in / bytes-out, like
    :class:`FileStreamProgramCache`. ``__setitem__`` takes ``bytes``,
    ``bytearray``, ``memoryview``, or any :class:`~cuda.core.ObjectCode`
    (including path-backed ones -- the file is read at write time, so the
    stored entry is the binary content rather than a path), and
    ``__getitem__`` always hands back ``bytes``.

    Parameters
    ----------
    max_size_bytes:
        Optional upper bound on the combined size of all stored payloads.
        Whenever a write pushes the total above this bound, entries are
        evicted in LRU order until the total fits again. ``None`` disables
        the bound. Only a size bound is offered, mirroring
        :class:`FileStreamProgramCache`.

    Notes
    -----
    A successful :meth:`__getitem__` refreshes the entry's recency, and a
    write always places the entry in the most-recent position. ``get`` is
    the recommended lookup because the cache deliberately omits
    ``__contains__`` (the ``if key in cache: ...`` idiom is racy across
    processes; see :class:`ProgramCacheResource`).

    Thread safety: every method reads and mutates the cache state while
    holding a :class:`threading.RLock`, so one instance can be shared
    between threads without external locking.
    """

    def __init__(
        self,
        *,
        max_size_bytes: int | None = None,
    ) -> None:
        """Create an empty cache.

        Raises
        ------
        ValueError
            If ``max_size_bytes`` is given but is zero or negative.
        """
        if max_size_bytes is not None:
            if max_size_bytes <= 0:
                raise ValueError("max_size_bytes must be positive or None (0 would evict every write)")
        self._max_size_bytes = max_size_bytes
        # Running sum of the sizes recorded in ``_entries``.
        self._total_bytes = 0
        # Iteration order doubles as recency order: the front of the
        # mapping is the coldest entry, the back is the hottest. Values are
        # ``(payload, size)`` pairs so eviction never has to call ``len``.
        self._entries: collections.OrderedDict[bytes, tuple[bytes, int]] = collections.OrderedDict()
        # An RLock (rather than a plain Lock) lets a method that already
        # holds the lock call another lock-taking method safely.
        self._lock = threading.RLock()

    def __getitem__(self, key: object) -> bytes:
        """Return the payload stored under ``key`` and mark it most recent.

        Raises
        ------
        KeyError
            If ``key`` is not present; the error carries the caller's
            original key rather than its normalised bytes form.
        """
        raw_key = _as_key_bytes(key)
        with self._lock:
            try:
                payload = self._entries[raw_key][0]
            except KeyError:
                raise KeyError(key) from None
            else:
                # A hit counts as a use, so the entry moves to the hot end
                # and eviction keeps targeting genuinely idle entries.
                self._entries.move_to_end(raw_key)
            return payload

    def __setitem__(self, key: object, value: bytes | bytearray | memoryview | ObjectCode) -> None:
        """Store ``value`` under ``key``, replacing any previous entry.

        The entry lands in the most-recent position, after which the size
        cap (if any) is enforced.
        """
        payload = _extract_bytes(value)
        payload_size = len(payload)
        raw_key = _as_key_bytes(key)
        with self._lock:
            # Removing a previous entry first both releases its bytes from
            # the running total and ensures the re-insert goes to the back.
            _stale_payload, stale_size = self._entries.pop(raw_key, (None, 0))
            self._total_bytes += payload_size - stale_size
            self._entries[raw_key] = (payload, payload_size)
            self._evict_to_caps()

    def __delitem__(self, key: object) -> None:
        """Remove the entry stored under ``key``.

        Raises
        ------
        KeyError
            If ``key`` is not present; the error carries the caller's
            original key.
        """
        raw_key = _as_key_bytes(key)
        with self._lock:
            try:
                removed = self._entries.pop(raw_key)
            except KeyError:
                raise KeyError(key) from None
            self._total_bytes -= removed[1]

    def __len__(self) -> int:
        """Return the number of entries currently held."""
        with self._lock:
            entry_count = len(self._entries)
        return entry_count

    def clear(self) -> None:
        """Drop every entry and reset the size accounting to zero."""
        with self._lock:
            self._total_bytes = 0
            self._entries.clear()

    # -- eviction ------------------------------------------------------------

    def _evict_to_caps(self) -> None:
        """Drop the coldest entries until the total fits under the size cap.

        Invoked by ``__setitem__`` once the new entry is in place. Entries
        are removed from the front of the ordered mapping, i.e. least
        recently used first. An entry that is larger than
        ``max_size_bytes`` on its own is evicted as well -- mirroring
        :class:`FileStreamProgramCache` (a write that cannot fit does not
        survive its own size-cap pass).
        """
        limit = self._max_size_bytes
        if limit is not None:
            while self._entries and self._total_bytes > limit:
                _evicted_key, evicted_entry = self._entries.popitem(last=False)
                self._total_bytes -= evicted_entry[1]

Coverage for cuda / core / utils / _program_cache / _in_memory.py: 100.00%

54 statements