refactor: Flatten @site_cache's internal representation (#28939)

This makes maxsize deterministic while estimating memory costs of using this function. E.g. If I want to cache site config and I'd prefer to keep 16 recent site configs in memory, there's no way to handle this. Site specific maxsize means if I have 1000 sites on bench I'll have 1000 keys in cache. This change makes behaviour similar to lru_cache which is how I thought it workerd TBH.
2024-12-27 21:20:07 +05:30 · 2024-12-27 21:20:07 +05:30 · 28453f59f8
commit 28453f59f8
parent 416919e880
1 changed files with 13 additions and 11 deletions
--- a/frappe/utils/caching.py
+++ b/frappe/utils/caching.py
@ -4,14 +4,15 @@
 import time
 from collections import defaultdict
 from collections.abc import Callable
+from contextlib import suppress
 from functools import wraps

 import frappe

-_SITE_CACHE = defaultdict(lambda: defaultdict(dict))
+_SITE_CACHE = defaultdict(dict)


-def __generate_request_cache_key(args: tuple, kwargs: dict):
+def __generate_request_cache_key(args: tuple, kwargs: dict) -> int:
 	"""Generate a key for the cache."""
 	if not kwargs:
 		return hash(args)
@ -121,31 +122,32 @@ def site_cache(ttl: int | None = None, maxsize: int | None = None) -> Callable:
 			if not site:
 				return func(*args, **kwargs)

-			func_call_key = __generate_request_cache_key(args, kwargs)
+			arguments_key = f"{site}::{__generate_request_cache_key(args, kwargs)}"

 			if hasattr(func, "ttl") and time.monotonic() >= func.expiration:
 				func.clear_cache()
 				func.expiration = time.monotonic() + func.ttl

 			# NOTE: Important things to consider from thread safety POV:
-			#   1. Other thread can issue clear_cache and delete entire func_key dictionary.
+			#   1. Other thread can issue clear_cache and delete entire dictionary.
 			#   2. Other thread can pop the exact elemement we are reading if maxsize is hit.

 			# NOTE: Keep a local reference to dictionary of interest so it doesn't get swapped
-			site_specific_cache = _SITE_CACHE[func_key][site]
+			function_cache = _SITE_CACHE[func_key]

 			try:
-				return site_specific_cache[func_call_key]
-			except KeyError:
-				# NOTE: This is just a cache miss
+				return function_cache[arguments_key]
+			except (KeyError, RuntimeError):
+				# NOTE: This is just a cache miss or dictionary was modified while reading it
 				pass

-			if hasattr(func, "maxsize") and len(site_specific_cache) >= func.maxsize:
+			if hasattr(func, "maxsize") and len(function_cache) >= func.maxsize:
 				# Note: This implements FIFO eviction policy
-				site_specific_cache.pop(next(iter(site_specific_cache)), None)
+				with suppress(RuntimeError):
+					function_cache.pop(next(iter(function_cache)), None)

 			result = func(*args, **kwargs)
-			site_specific_cache[func_call_key] = result
+			function_cache[arguments_key] = result

 			return result