NVIDIA
diff --git a/cuda_core/cuda/core/utils.py b/cuda_core/cuda/core/utils.py
Lines changed: 0 additions & 8 deletions
diff --git a/cuda_core/cuda/core/utils/__init__.py b/cuda_core/cuda/core/utils/__init__.py
Lines changed: 45 additions & 0 deletions
@@ -0,0 +1,45 @@
+# SPDX-FileCopyrightText: Copyright (c) 2024-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
+#
+# SPDX-License-Identifier: Apache-2.0
+
+from cuda.core._memoryview import (
+    StridedMemoryView,
+    args_viewable_as_strided_memory,
+)
+
+# Lazily expose the program-cache APIs so ``from cuda.core.utils import
+# StridedMemoryView`` stays lightweight -- the cache backends pull in driver,
+# NVRTC, and module-load machinery that memoryview-only consumers do not need.
+# The laziness guarantee is for explicit imports only: ``from cuda.core.utils
+# import *`` walks ``__all__`` and therefore resolves every lazy attribute,
+# which eagerly pulls ``_program_cache`` in. Star-imports are discouraged
+# anyway, so treat that as expected.
+_LAZY_CACHE_ATTRS = (  # names the module-level ``__getattr__`` resolves on first access
+    "FileStreamProgramCache",
+    "InMemoryProgramCache",
+    "ProgramCacheResource",
+    "SQLiteProgramCache",
+    "make_program_cache_key",
+)
+
+__all__ = [  # eagerly imported memoryview names first, then every lazy cache name
+    "StridedMemoryView",
+    "args_viewable_as_strided_memory",
+    *_LAZY_CACHE_ATTRS,
+]
+
+
+def __getattr__(name):
+    """PEP 562 hook: import a lazy cache attribute on first access, then cache it."""
+    if name not in _LAZY_CACHE_ATTRS:
+        raise AttributeError(f"module 'cuda.core.utils' has no attribute {name!r}")
+    from cuda.core.utils import _program_cache  # deferred until a lazy name is requested
+    resolved = getattr(_program_cache, name)
+    globals()[name] = resolved  # later lookups find it in the module dict and skip this hook
+    return resolved
+
+
+def __dir__():
+    """Return sorted module globals merged with ``__all__`` (unresolved lazy names included)."""
+    names = {*globals(), *__all__}
+    return sorted(names)