Coverage for cuda/core/_memoryview.pyx: 62.99% (708 statements)

# SPDX-FileCopyrightText: Copyright (c) 2024-2026 NVIDIA CORPORATION & AFFILIATES. All rights reserved.
#
# SPDX-License-Identifier: Apache-2.0

from __future__ import annotations

from ._dlpack cimport *
from ._dlpack import classify_dl_device
from libc.stdint cimport intptr_t
from cuda.core._layout cimport _StridedLayout, get_strides_ptr
from cuda.core._stream import Stream

import ctypes
import functools
import sys
import warnings

import numpy

from cuda.bindings cimport cydriver
from cuda.core._resource_handles cimport (
    EventHandle,
    create_event_handle_noctx,
    as_cu,
)

from cuda.core._utils.cuda_utils import handle_return, driver
from cuda.core._utils.cuda_utils cimport HANDLE_RETURN

from cuda.core._memory import Buffer

# ---------------------------------------------------------------------------
# Lazy tensor bridge (avoids loading _tensor_bridge.so until torch is used)
# ---------------------------------------------------------------------------

cdef object _tensor_bridge = None
# Cache: type(obj) -> True/False for the torch tensor check.
# Once a type is seen, we never re-check.
cdef dict _torch_type_cache = {}
# Tri-state: None = not checked, True/False = result of version check
cdef object _torch_version_ok = None

cdef inline bint _torch_version_check():
    """Return True if 2.3 <= torch <= 2.11 (known AOTI ABI range). Memoized.

    Lower bound: AOTI functions we use were introduced in PyTorch 2.3.
    Upper bound: the ``pyobj_to_aten_handle`` trick relies on the
    THPVariable struct layout (PyObject_HEAD followed by at::Tensor cdata)
    and the identity ``AtenTensorHandle == at::Tensor*``. Both are
    undocumented internals that could change in a future PyTorch version.
    We cap at the latest version we have tested against; unknown versions
    fall back to the standard DLPack/CAI paths. Bump the upper bound
    after verifying a new PyTorch release.
    """
    global _torch_version_ok
    if _torch_version_ok is not None:
        return <bint>_torch_version_ok
    torch = sys.modules.get("torch")
    if torch is None:
        _torch_version_ok = False
        return False
    try:
        major, minor = int(torch.__version__.split(".")[0]), \
            int(torch.__version__.split(".")[1])
        _torch_version_ok = (2, 3) <= (major, minor) <= (2, 11)
    except (ValueError, IndexError):
        _torch_version_ok = False
    return <bint>_torch_version_ok

cdef inline bint _is_torch_tensor(object obj):
    cdef type tp = type(obj)
    cdef object cached = _torch_type_cache.get(tp)
    if cached is not None:
        return <bint>cached
    cdef str mod = tp.__module__ or ""
    cdef bint result = mod.startswith("torch") and hasattr(obj, "data_ptr") \
        and _torch_version_check()
    _torch_type_cache[tp] = result
    return result

cdef object _get_tensor_bridge():
    """Bootstrap AOTI symbols, then import _tensor_bridge on first use."""
    global _tensor_bridge
    if _tensor_bridge is not None:
        return _tensor_bridge
    torch_C = sys.modules.get("torch._C")
    if torch_C is None:
        raise RuntimeError(
            "torch._C is not loaded; cannot initialise the tensor bridge. "
            "Make sure PyTorch is imported before passing a torch.Tensor.")
    ctypes.CDLL(torch_C.__file__, mode=ctypes.RTLD_GLOBAL)
    from cuda.core import _tensor_bridge as tb
    _tensor_bridge = tb
    return _tensor_bridge


try:
    from ml_dtypes import bfloat16
except ImportError:
    bfloat16 = None

# TODO(leofang): support NumPy structured dtypes

cdef extern from "Python.h":
    ctypedef struct PyTypeObject:
        void* tp_dict
    void PyType_Modified(PyTypeObject*)


cdef DLPackExchangeAPI _SMV_DLPACK_EXCHANGE_API
cdef bint _SMV_DLPACK_EXCHANGE_API_INITED = False
_SMV_DLPACK_EXCHANGE_API_CAPSULE = cpython.PyCapsule_New(
    <void*>&_SMV_DLPACK_EXCHANGE_API,
    b"dlpack_exchange_api",
    NULL,
)

cdef class StridedMemoryView:
    """A class holding metadata of a strided dense array/tensor.

    A :obj:`StridedMemoryView` instance can be created in three ways:

    1. Using the :obj:`args_viewable_as_strided_memory` decorator (recommended)
    2. Explicit construction relying on DLPack or CUDA Array Interface, see below.
    3. From a :obj:`~_memory.Buffer` plus shape and strides tuples (see the
       :meth:`from_buffer` classmethod)

    ``StridedMemoryView(obj, stream_ptr)`` can be used to create a view from
    objects supporting either DLPack (up to v1.0) or CUDA Array Interface
    (CAI) v3. When wrapping an arbitrary object it will try the DLPack protocol
    first, then the CAI protocol. A :obj:`BufferError` is raised if neither is
    supported.

    Both protocols take a consumer stream: for DLPack, it is passed to
    ``obj.__dlpack__()`` as-is (except for :obj:`None`, see below); for CAI, a
    stream order is established between the consumer stream and the
    producer stream (from ``obj.__cuda_array_interface__["stream"]``), as if
    ``cudaStreamWaitEvent`` were called by this method.

    To opt out of the stream ordering operation in either DLPack or CAI,
    please pass ``stream_ptr=-1``. Note that this deviates (on purpose)
    from the semantics of ``obj.__dlpack__(stream=None, ...)`` since ``cuda.core``
    does not encourage using the (legacy) default/null stream, but is
    consistent with the CAI's semantics. For DLPack, ``stream=-1`` will be
    internally passed to ``obj.__dlpack__()`` instead.

    Parameters
    ----------
    obj : Any
        Any object that supports either DLPack (up to v1.0) or CUDA Array
        Interface (v3).
    stream_ptr : int
        The pointer address (as Python `int`) to the **consumer** stream.
        Stream ordering will be properly established unless ``-1`` is passed.

    Attributes
    ----------
    ptr : int
        Pointer to the tensor buffer (as a Python `int`).
    device_id : int
        The device ID for where the tensor is located. It is -1 for CPU tensors
        (meaning the data is only accessible from the host).
    is_device_accessible : bool
        Whether the tensor data can be accessed on the GPU.
    readonly : bool
        Whether the tensor data is read-only and must not be modified in place.
    exporting_obj : Any
        A reference to the original tensor object that is being viewed.
        If the view is created with :meth:`from_buffer`,
        it will be the Buffer instance passed to the method.

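    Examples
    --------
    A minimal sketch of the recommended classmethod path (this assumes CuPy is
    installed; any DLPack- or CAI-capable producer works the same way):

    .. code-block:: python

        import cupy as cp

        arr = cp.arange(100, dtype=cp.float32)
        stream = cp.cuda.Stream()
        # DLPack is tried first, then the CUDA Array Interface.
        view = StridedMemoryView.from_any_interface(arr, stream.ptr)
        assert view.is_device_accessible
        assert view.shape == (100,)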
    """
    def __init__(self, obj: object = None, stream_ptr: int | None = None) -> None:
        cdef str clsname = self.__class__.__name__
        if obj is not None:
            # populate self's attributes
            if check_has_dlpack(obj):
                warnings.warn(
                    f"Constructing a {clsname} directly from a DLPack-supporting object is deprecated; "
                    "Use `StridedMemoryView.from_dlpack` or `StridedMemoryView.from_any_interface` instead.",
                    DeprecationWarning,
                    stacklevel=2,
                )
                view_as_dlpack(obj, stream_ptr, self)
            else:
                warnings.warn(
                    f"Constructing a {clsname} directly from a CUDA-array-interface-supporting object is deprecated; "
                    "Use `StridedMemoryView.from_cuda_array_interface` or `StridedMemoryView.from_any_interface` instead.",
                    DeprecationWarning,
                    stacklevel=2,
                )
                view_as_cai(obj, stream_ptr, self)
        else:
            warnings.warn(
                f"Constructing an empty {clsname} is deprecated; "
                "use one of the classmethods `from_dlpack`, `from_cuda_array_interface` or `from_any_interface` "
                "to construct a StridedMemoryView from an object",
                DeprecationWarning,
                stacklevel=2,
            )

    @classmethod
    def from_dlpack(cls, obj: object, stream_ptr: int | None = None) -> StridedMemoryView:
        """Create a view from an object supporting the `DLPack <https://dmlc.github.io/dlpack/latest/>`_ protocol.

        Parameters
        ----------
        obj : object
            An object implementing the `DLPack <https://dmlc.github.io/dlpack/latest/>`_ protocol
            (via ``__dlpack__``).
        stream_ptr : int, optional
            Stream pointer for synchronization. If ``None``, no synchronization is performed.

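        Examples
        --------
        An illustrative sketch using PyTorch as the producer (assumes PyTorch
        with CUDA support is installed; any DLPack-capable library works):

        .. code-block:: python

            import torch

            t = torch.arange(10, device="cuda", dtype=torch.float32)
            s = torch.cuda.current_stream()
            view = StridedMemoryView.from_dlpack(t, s.cuda_stream)
            assert view.is_device_accessible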
        """
        cdef StridedMemoryView buf = StridedMemoryView.__new__(cls)
        if _is_torch_tensor(obj):
            _get_tensor_bridge().view_as_torch_tensor(obj, stream_ptr, buf)
            return buf
        view_as_dlpack(obj, stream_ptr, buf)
        return buf

    @classmethod
    def from_cuda_array_interface(cls, obj: object, stream_ptr: int | None = None) -> StridedMemoryView:
        """Create a view from an object supporting the `__cuda_array_interface__ <https://numba.readthedocs.io/en/stable/cuda/cuda_array_interface.html>`_ protocol.

        Parameters
        ----------
        obj : object
            An object implementing the `__cuda_array_interface__ <https://numba.readthedocs.io/en/stable/cuda/cuda_array_interface.html>`_ protocol.
        stream_ptr : int, optional
            Stream pointer for synchronization. If ``None``, no synchronization is performed.

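        Examples
        --------
        A minimal sketch (assumes CuPy is installed; CuPy arrays expose the
        CUDA Array Interface):

        .. code-block:: python

            import cupy as cp

            arr = cp.ones((2, 3), dtype=cp.float64)
            stream = cp.cuda.Stream()
            view = StridedMemoryView.from_cuda_array_interface(arr, stream.ptr)
            assert view.shape == (2, 3)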
        """
        cdef StridedMemoryView buf = StridedMemoryView.__new__(cls)
        if _is_torch_tensor(obj):
            _get_tensor_bridge().view_as_torch_tensor(obj, stream_ptr, buf)
            return buf
        view_as_cai(obj, stream_ptr, buf)
        return buf

    @classmethod
    def from_array_interface(cls, obj: object) -> StridedMemoryView:
        """Create a view from an object supporting the `__array_interface__ <https://numpy.org/doc/stable/reference/arrays.interface.html>`_ protocol.

        Parameters
        ----------
        obj : object
            An object implementing the `__array_interface__ <https://numpy.org/doc/stable/reference/arrays.interface.html>`_ protocol (e.g., a numpy array).

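        Examples
        --------
        An illustrative sketch viewing a host NumPy array (a CUDA context is
        assumed to be current, since the current device ID is still queried):

        .. code-block:: python

            import numpy as np

            arr = np.zeros((4, 4), dtype=np.float64)
            view = StridedMemoryView.from_array_interface(arr)
            assert not view.is_device_accessible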
        """
        cdef StridedMemoryView buf = StridedMemoryView.__new__(cls)
        if _is_torch_tensor(obj):
            _get_tensor_bridge().view_as_torch_tensor(obj, None, buf)
            return buf
        view_as_array_interface(obj, buf)
        return buf

    @classmethod
    def from_any_interface(cls, obj: object, stream_ptr: int | None = None) -> StridedMemoryView:
        """Create a view by automatically selecting the best available protocol.

        Tries `DLPack <https://dmlc.github.io/dlpack/latest/>`_ first, then falls back to
        `__cuda_array_interface__ <https://numba.readthedocs.io/en/stable/cuda/cuda_array_interface.html>`_.
        ``torch.Tensor`` objects are transparently handled via a fast AOTI path
        regardless of which protocol is selected.

        Parameters
        ----------
        obj : object
            An object implementing `DLPack <https://dmlc.github.io/dlpack/latest/>`_ or
            `__cuda_array_interface__ <https://numba.readthedocs.io/en/stable/cuda/cuda_array_interface.html>`_.
        stream_ptr : int, optional
            Stream pointer for synchronization. If ``None``, no synchronization is performed.

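        Examples
        --------
        A minimal sketch that accepts both device and host arrays (assumes
        CuPy and NumPy are installed):

        .. code-block:: python

            import cupy as cp
            import numpy as np

            d_arr = cp.ones(8, dtype=cp.float32)
            h_arr = np.ones(8, dtype=np.float32)
            stream = cp.cuda.Stream()
            d_view = StridedMemoryView.from_any_interface(d_arr, stream.ptr)
            # -1 opts out of stream ordering (see the class docstring).
            h_view = StridedMemoryView.from_any_interface(h_arr, -1)
            assert d_view.is_device_accessible
            assert not h_view.is_device_accessible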
        """
        if check_has_dlpack(obj):
            return cls.from_dlpack(obj, stream_ptr)
        return cls.from_cuda_array_interface(obj, stream_ptr)

    @classmethod
    def from_buffer(
        cls,
        buffer : Buffer,
        shape : tuple[int, ...],
        strides : tuple[int, ...] | None = None,
        *,
        itemsize : int | None = None,
        dtype : numpy.dtype | None = None,
        is_readonly : bool = False
    ) -> StridedMemoryView:
        """
        Creates a :obj:`StridedMemoryView` instance from a :obj:`~_memory.Buffer` and shape and strides tuples.
        The Buffer can be either an allocation coming from a :obj:`MemoryResource` or an external allocation
        wrapped in a :obj:`~_memory.Buffer` object with ``Buffer.from_handle(ptr, size, owner=...)``.

        .. caution::
            When creating a :obj:`StridedMemoryView` from a :obj:`~_memory.Buffer`,
            no synchronization is performed. It is the user's responsibility to ensure
            the data in ``buffer`` is properly synchronized when consuming the view.

        Parameters
        ----------
        buffer : :obj:`~_memory.Buffer`
            The buffer to create the view from.
        shape : :obj:`tuple`
            The shape of the view, i.e. the number of elements along each dimension.
        strides : :obj:`tuple`, optional
            The strides of the view, in element counts (not bytes).
        itemsize : int, optional
            The size in bytes of each element. Either ``itemsize`` or ``dtype``
            must be specified.
        dtype : :obj:`numpy.dtype`, optional
            Optional dtype.
            If specified, the dtype's itemsize must match the layout's itemsize.
        is_readonly : bool, optional
            Whether to mark the view as readonly.

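        Examples
        --------
        A minimal sketch (``buf`` is assumed to be an existing
        :obj:`~_memory.Buffer` holding at least 24 ``float32`` elements, e.g.
        one returned by a memory resource or created with
        ``Buffer.from_handle(ptr, size, owner=...)``):

        .. code-block:: python

            import numpy as np

            # View 24 float32 elements in `buf` as a 4 x 6 array.
            view = StridedMemoryView.from_buffer(
                buf, shape=(4, 6), dtype=np.dtype(np.float32))
            assert view.shape == (4, 6)
            assert view.dtype == np.float32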
        """
        cdef StridedMemoryView view = StridedMemoryView.__new__(cls)
        if itemsize is None and dtype is None:
            raise ValueError("Either itemsize or dtype must be specified")
        if itemsize is not None and dtype is not None and itemsize != dtype.itemsize:
            raise ValueError(
                f"itemsize ({itemsize}) does not match dtype.itemsize ({dtype.itemsize})"
            )
        # (itemsize is None XOR dtype is None) OR they are equal
        view_buffer_strided(
            view,
            buffer,
            _StridedLayout(shape=shape, strides=strides, itemsize=getattr(dtype, "itemsize", itemsize)),
            dtype,
            is_readonly,
        )
        return view

    def __dealloc__(self):
        if self.dl_tensor == NULL:
            return

        if cpython.PyCapsule_IsValid(
                self.metadata, DLPACK_VERSIONED_TENSOR_USED_NAME):
            data = cpython.PyCapsule_GetPointer(
                self.metadata, DLPACK_VERSIONED_TENSOR_USED_NAME)
            dlm_tensor_ver = <DLManagedTensorVersioned*>data
            dlm_tensor_ver.deleter(dlm_tensor_ver)
        elif cpython.PyCapsule_IsValid(
                self.metadata, DLPACK_TENSOR_USED_NAME):
            data = cpython.PyCapsule_GetPointer(
                self.metadata, DLPACK_TENSOR_USED_NAME)
            dlm_tensor = <DLManagedTensor*>data
            dlm_tensor.deleter(dlm_tensor)

    def view(
        self, layout : _StridedLayout | None = None, dtype : numpy.dtype | None = None
    ) -> StridedMemoryView:
        """
        Creates a new view with adjusted layout and dtype.
        Same as calling :meth:`from_buffer` with the current buffer.

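        Examples
        --------
        An illustrative sketch (``u8_view`` is assumed to be an existing
        :obj:`StridedMemoryView` over ``uint8`` data; the new dtype must have
        the same itemsize as the current layout):

        .. code-block:: python

            import numpy as np

            # Reinterpret the same bytes as int8 without copying.
            i8_view = u8_view.view(dtype=np.dtype(np.int8))
            assert i8_view.dtype == np.int8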
        """
        cdef StridedMemoryView view = StridedMemoryView.__new__(self.__class__)
        if layout is None and dtype is None:
            return self
        if layout is None:
            layout = self.get_layout()
        if dtype is None:
            dtype = self.get_dtype()
        view_buffer_strided(view, self.get_buffer(), layout, dtype, self.readonly)
        return view

    def as_tensor_map(
        self,
        box_dim=None,
        *,
        options=None,
        element_strides=None,
        data_type=None,
        interleave=None,
        swizzle=None,
        l2_promotion=None,
        oob_fill=None,
    ):
        """Create a tiled :obj:`TensorMapDescriptor` from this view.

        This is the public entry point for creating tiled tensor map
        descriptors in ``cuda.core``. Pass either ``box_dim`` and the
        individual keyword arguments directly, or provide bundled tiled
        options via ``options=``.
        """
        from cuda.core._tensor_map import TensorMapDescriptor

        kwargs = {}
        if options is not None:
            kwargs["options"] = options
        if element_strides is not None:
            kwargs["element_strides"] = element_strides
        if data_type is not None:
            kwargs["data_type"] = data_type
        if interleave is not None:
            kwargs["interleave"] = interleave
        if swizzle is not None:
            kwargs["swizzle"] = swizzle
        if l2_promotion is not None:
            kwargs["l2_promotion"] = l2_promotion
        if oob_fill is not None:
            kwargs["oob_fill"] = oob_fill
        return TensorMapDescriptor._from_tiled(self, box_dim, **kwargs)

    def copy_from(
        self, other : StridedMemoryView, stream : Stream,
        allocator = None,
        blocking : bool | None = None,
    ):
        """
        Copies the data from the other view into this view.

        The copy can be performed between the following memory spaces:
        host-to-device, device-to-host, device-to-device (on the same device).

        Parameters
        ----------
        other : StridedMemoryView
            The view to copy data from.
        stream : Stream | None, optional
            The stream to schedule the copy on.
        allocator : MemoryResource | None, optional
            If temporary buffers are needed, the specified memory resources
            will be used to allocate the memory. If not specified, default
            resources will be used.
        blocking : bool | None, optional
            Whether the call should block until the copy is complete.
            * ``True``: the ``stream`` is synchronized with the host at the end of the call,
              blocking until the copy is complete.
            * ``False``: if possible, the call returns immediately once the copy is scheduled.
              However, in some cases of host-to-device or device-to-host copies, the call may
              still synchronize with the host if necessary.
            * ``None`` (default):
              * for device-to-device, it defaults to ``False`` (non-blocking),
              * for host-to-device or device-to-host, it defaults to ``True`` (blocking).
        """
        raise NotImplementedError("Sorry, not supported: copy_from")

    def copy_to(
        self, other : StridedMemoryView, stream : Stream | None = None,
        allocator = None,
        blocking : bool | None = None,
    ):
        """
        Copies the data from this view into the ``other`` view.

        For details, see :meth:`copy_from`.
        """
        raise NotImplementedError("Sorry, not supported: copy_to")

    def __dlpack__(
        self,
        *,
        stream: int | None = None,
        max_version: tuple[int, int] | None = None,
        dl_device: tuple[int, int] | None = None,
        copy: bool | None = None,
    ):
        # Similar to Buffer.__dlpack__: no implicit synchronization is performed.
        if dl_device is not None:
            raise BufferError("Sorry, not supported: dl_device other than None")
        if copy is True:
            raise BufferError("Sorry, not supported: copy=True")

        cdef bint versioned
        if max_version is None:
            versioned = False
        else:
            if not isinstance(max_version, tuple) or len(max_version) != 2:
                raise BufferError(f"Expected max_version tuple[int, int], got {max_version}")
            versioned = max_version >= (1, 0)

        # NOTE: stream is accepted for protocol compatibility but not used.
        cdef object capsule = _smv_make_py_capsule(self, versioned)
        return capsule

    def __dlpack_device__(self) -> tuple[int, int]:
        cdef _DLDeviceType device_type
        cdef int32_t device_id
        _smv_get_dl_device(self, &device_type, &device_id)
        return (<int>device_type, int(device_id))

    @property
    def _layout(self) -> _StridedLayout:
        """
        The layout of the tensor. For StridedMemoryView created from DLPack or CAI,
        the layout is inferred from the tensor object's metadata.
        """
        return self.get_layout()

    @property
    def size(self) -> int:
        return self.get_layout().get_volume()

    @property
    def shape(self) -> tuple[int, ...]:
        """
        Shape of the tensor.
        """
        return self.get_layout().get_shape_tuple()

    @property
    def strides(self) -> tuple[int, ...] | None:
        """
        Strides of the tensor (in **counts**, not bytes).
        """
        return self.get_layout().get_strides_tuple()

    @property
    def dtype(self) -> numpy.dtype | None:
        """
        Data type of the tensor.

        Supports standard NumPy dtypes as well as narrow data types (e.g., ``bfloat16``)
        when the optional `ml_dtypes <https://github.com/jax-ml/ml_dtypes>`_ package is
        installed. If ``ml_dtypes`` is not available and such a tensor is encountered,
        a :obj:`NotImplementedError` will be raised.
        """
        return self.get_dtype()

    def __repr__(self):
        return (f"StridedMemoryView(ptr={self.ptr},\n"
                + f"                  shape={self.shape},\n"
                + f"                  strides={self.strides},\n"
                + f"                  itemsize={self._layout.itemsize},\n"
                + f"                  dtype={get_simple_repr(self.dtype)},\n"
                + f"                  device_id={self.device_id},\n"
                + f"                  is_device_accessible={self.is_device_accessible},\n"
                + f"                  readonly={self.readonly},\n"
                + f"                  exporting_obj={get_simple_repr(self.exporting_obj)})")

    cdef inline _StridedLayout get_layout(self):
        if self._layout is None:
            if self.dl_tensor:
                self._layout = layout_from_dlpack(self.dl_tensor)
            elif self.metadata is not None:
                self._layout = layout_from_cai(self.metadata)
            else:
                raise ValueError("Cannot infer layout from the exporting object")
        return self._layout

    cdef inline object get_buffer(self):
        """
        Returns a Buffer instance with the underlying data.
        If the SMV was created from a Buffer, it will return the same Buffer instance.
        Otherwise, it will create a new instance with owner set to the exporting object.
        """
        if self._buffer is None:
            if isinstance(self.exporting_obj, Buffer):
                self._buffer = self.exporting_obj
            else:
                self._buffer = Buffer.from_handle(self.ptr, 0, owner=self.exporting_obj)
        return self._buffer

    cdef inline object get_dtype(self):
        if self._dtype is None:
            if self.dl_tensor != NULL:
                self._dtype = dtype_dlpack_to_numpy(&self.dl_tensor.dtype)
            elif isinstance(self.metadata, int):
                # AOTI dtype code stored by the torch tensor bridge
                self._dtype = _get_tensor_bridge().resolve_aoti_dtype(
                    self.metadata)
            elif self.metadata is not None:
                self._dtype = _typestr2dtype(self.metadata["typestr"])
        return self._dtype


cdef void _smv_pycapsule_deleter(object capsule) noexcept:
    cdef DLManagedTensor* dlm_tensor
    cdef DLManagedTensorVersioned* dlm_tensor_ver
    # Do not invoke the deleter on a used capsule.
    if cpython.PyCapsule_IsValid(capsule, DLPACK_TENSOR_UNUSED_NAME):
        dlm_tensor = <DLManagedTensor*>(
            cpython.PyCapsule_GetPointer(capsule, DLPACK_TENSOR_UNUSED_NAME)
        )
        if dlm_tensor.deleter:
            dlm_tensor.deleter(dlm_tensor)
    elif cpython.PyCapsule_IsValid(capsule, DLPACK_VERSIONED_TENSOR_UNUSED_NAME):
        dlm_tensor_ver = <DLManagedTensorVersioned*>(
            cpython.PyCapsule_GetPointer(capsule, DLPACK_VERSIONED_TENSOR_UNUSED_NAME)
        )
        if dlm_tensor_ver.deleter:
            dlm_tensor_ver.deleter(dlm_tensor_ver)


cdef inline void _smv_release_export_resources(void* manager_ctx, int64_t* shape_ptr) noexcept with gil:
    if shape_ptr:
        stdlib.free(shape_ptr)
    if manager_ctx:
        cpython.Py_DECREF(<object>manager_ctx)


cdef void _smv_deleter(DLManagedTensor* tensor) noexcept with gil:
    if tensor:
        _smv_release_export_resources(tensor.manager_ctx, tensor.dl_tensor.shape)
        tensor.manager_ctx = NULL
        stdlib.free(tensor)


cdef void _smv_versioned_deleter(DLManagedTensorVersioned* tensor) noexcept with gil:
    if tensor:
        _smv_release_export_resources(tensor.manager_ctx, tensor.dl_tensor.shape)
        tensor.manager_ctx = NULL
        stdlib.free(tensor)


cdef inline DLManagedTensorVersioned* _smv_allocate_dlm_tensor_versioned() except? NULL:
    cdef DLManagedTensorVersioned* dlm_tensor_ver = NULL
    dlm_tensor_ver = <DLManagedTensorVersioned*>stdlib.malloc(sizeof(DLManagedTensorVersioned))
    if dlm_tensor_ver == NULL:
        raise MemoryError()
    dlm_tensor_ver.dl_tensor.shape = NULL
    dlm_tensor_ver.manager_ctx = NULL
    return dlm_tensor_ver


cdef inline DLManagedTensor* _smv_allocate_dlm_tensor() except? NULL:
    cdef DLManagedTensor* dlm_tensor = NULL
    dlm_tensor = <DLManagedTensor*>stdlib.malloc(sizeof(DLManagedTensor))
    if dlm_tensor == NULL:
        raise MemoryError()
    dlm_tensor.dl_tensor.shape = NULL
    dlm_tensor.manager_ctx = NULL
    return dlm_tensor


cdef inline int _smv_dtype_numpy_to_dlpack(object dtype_obj, DLDataType* out_dtype) except -1:
    cdef object np_dtype = numpy.dtype(dtype_obj)
    if np_dtype.fields is not None:
        raise BufferError("Structured dtypes are not supported for DLPack export")
    if not np_dtype.isnative and np_dtype.byteorder not in ("=", "|"):
        raise BufferError("Non-native-endian dtypes are not supported for DLPack export")

    cdef str kind = np_dtype.kind
    cdef int bits = np_dtype.itemsize * 8
    cdef uint8_t code
    if kind == "b":
        if bits != 8:
            raise BufferError(f"Unsupported bool dtype itemsize: {np_dtype.itemsize}")
        code = <uint8_t>kDLBool
    elif kind == "i":
        if bits not in (8, 16, 32, 64):
            raise BufferError(f"Unsupported signed integer dtype: {np_dtype}")
        code = <uint8_t>kDLInt
    elif kind == "u":
        if bits not in (8, 16, 32, 64):
            raise BufferError(f"Unsupported unsigned integer dtype: {np_dtype}")
        code = <uint8_t>kDLUInt
    elif kind == "f":
        if bits not in (16, 32, 64):
            raise BufferError(f"Unsupported floating dtype: {np_dtype}")
        code = <uint8_t>kDLFloat
    elif kind == "c":
        if bits not in (64, 128):
            raise BufferError(f"Unsupported complex dtype: {np_dtype}")
        code = <uint8_t>kDLComplex
    else:
        raise BufferError(f"Unsupported dtype for DLPack export: {np_dtype}")

    out_dtype.code = code
    out_dtype.bits = <uint8_t>bits
    out_dtype.lanes = <uint16_t>1
    return 0


cdef inline int _smv_get_dl_device(
    StridedMemoryView view,
    _DLDeviceType* out_device_type,
    int32_t* out_device_id,
) except -1:
    cdef _DLDeviceType device_type
    cdef int32_t device_id
    cdef object buf
    if view.dl_tensor != NULL:
        device_type = view.dl_tensor.device.device_type
        if device_type == _kDLCUDA:
            device_id = view.dl_tensor.device.device_id
        else:
            # CPU, CUDAHost, and CUDAManaged use device_id=0 in DLPack.
            device_id = 0
    elif view.is_device_accessible:
        buf = view.get_buffer()
        dev_type, dev_id = classify_dl_device(buf)
        device_type = <_DLDeviceType>dev_type
        device_id = <int32_t>dev_id
    else:
        device_type = _kDLCPU
        device_id = 0

    out_device_type[0] = device_type
    out_device_id[0] = device_id
    return 0


cdef inline int _smv_setup_dl_tensor_common(
    DLTensor* dl_tensor,
    StridedMemoryView view,
    _StridedLayout layout,
) except -1:
    cdef object dtype_obj = view.get_dtype()
    if dtype_obj is None:
        raise BufferError(
            "Cannot export StridedMemoryView via DLPack without dtype information; "
            "create the view with dtype specified."
        )
    _smv_dtype_numpy_to_dlpack(dtype_obj, &dl_tensor.dtype)
    _smv_get_dl_device(view, &dl_tensor.device.device_type, &dl_tensor.device.device_id)

    cdef int ndim = layout.base.ndim
    dl_tensor.ndim = ndim
    if layout.get_volume() == 0:
        dl_tensor.data = NULL
    else:
        dl_tensor.data = <void*><intptr_t>view.ptr
    dl_tensor.byte_offset = 0
    return 0


cdef inline int _smv_setup_dl_tensor(DLTensor* dl_tensor, StridedMemoryView view) except -1:
    cdef _StridedLayout layout = view.get_layout()
    _smv_setup_dl_tensor_common(dl_tensor, view, layout)

    cdef int i
    cdef int64_t* shape_strides = NULL
    cdef int64_t* strides_src = NULL
    cdef int ndim = dl_tensor.ndim
    if ndim == 0:
        dl_tensor.shape = NULL
        dl_tensor.strides = NULL
    else:
        # DLPack v1.2+ requires non-NULL strides for ndim != 0.
        shape_strides = <int64_t*>stdlib.malloc(sizeof(int64_t) * 2 * ndim)
        if shape_strides == NULL:
            raise MemoryError()
        try:
            strides_src = get_strides_ptr(layout.base)
            for i in range(ndim):
                shape_strides[i] = layout.base.shape[i]
                shape_strides[i + ndim] = strides_src[i]
        except Exception:
            stdlib.free(shape_strides)
            raise
        dl_tensor.shape = shape_strides
        dl_tensor.strides = shape_strides + ndim
    return 0


cdef inline int _smv_setup_dltensor_borrowed(DLTensor* dl_tensor, StridedMemoryView view) except -1:
    cdef _StridedLayout layout = view.get_layout()
    _smv_setup_dl_tensor_common(dl_tensor, view, layout)

    if dl_tensor.ndim == 0:
        dl_tensor.shape = NULL
        dl_tensor.strides = NULL
    else:
        dl_tensor.shape = layout.base.shape
        # For temporary/non-owning exchange we provide explicit strides.
        dl_tensor.strides = get_strides_ptr(layout.base)
    return 0


cdef inline int _smv_fill_managed_tensor_versioned(
    DLManagedTensorVersioned* dlm_tensor_ver,
    StridedMemoryView view,
) except -1:
    cpython.Py_INCREF(view)
    dlm_tensor_ver.manager_ctx = <void*>view
    dlm_tensor_ver.deleter = _smv_versioned_deleter
    dlm_tensor_ver.version.major = DLPACK_MAJOR_VERSION
    dlm_tensor_ver.version.minor = DLPACK_MINOR_VERSION
    dlm_tensor_ver.flags = DLPACK_FLAG_BITMASK_READ_ONLY if view.readonly else 0
    _smv_setup_dl_tensor(&dlm_tensor_ver.dl_tensor, view)
    return 0


cdef inline int _smv_fill_managed_tensor(
    DLManagedTensor* dlm_tensor,
    StridedMemoryView view,
) except -1:
    cpython.Py_INCREF(view)
    dlm_tensor.manager_ctx = <void*>view
    dlm_tensor.deleter = _smv_deleter
    _smv_setup_dl_tensor(&dlm_tensor.dl_tensor, view)
    return 0


cdef object _smv_make_py_capsule(StridedMemoryView view, bint versioned):
    cdef DLManagedTensor* dlm_tensor = NULL
    cdef DLManagedTensorVersioned* dlm_tensor_ver = NULL
    cdef object capsule = None
    cdef void* tensor_ptr = NULL
    cdef const char* capsule_name
    try:
        if versioned:
            dlm_tensor_ver = _smv_allocate_dlm_tensor_versioned()
            _smv_fill_managed_tensor_versioned(dlm_tensor_ver, view)
            tensor_ptr = <void*>dlm_tensor_ver
            capsule_name = DLPACK_VERSIONED_TENSOR_UNUSED_NAME
        else:
            dlm_tensor = _smv_allocate_dlm_tensor()
            _smv_fill_managed_tensor(dlm_tensor, view)
            tensor_ptr = <void*>dlm_tensor
            capsule_name = DLPACK_TENSOR_UNUSED_NAME
        capsule = cpython.PyCapsule_New(tensor_ptr, capsule_name, _smv_pycapsule_deleter)
    except Exception:
        if capsule is None:
            _smv_deleter(dlm_tensor)
            _smv_versioned_deleter(dlm_tensor_ver)
        raise
    return capsule


cdef inline StridedMemoryView _smv_from_dlpack_capsule(object capsule, object exporting_obj):
    cdef void* data = NULL
    cdef DLTensor* dl_tensor = NULL
    cdef DLManagedTensorVersioned* dlm_tensor_ver = NULL
    cdef DLManagedTensor* dlm_tensor = NULL
    cdef bint is_readonly = False
    cdef const char* used_name = NULL
    if cpython.PyCapsule_IsValid(capsule, DLPACK_VERSIONED_TENSOR_UNUSED_NAME):
        data = cpython.PyCapsule_GetPointer(capsule, DLPACK_VERSIONED_TENSOR_UNUSED_NAME)
        dlm_tensor_ver = <DLManagedTensorVersioned*>data
        dl_tensor = &dlm_tensor_ver.dl_tensor
        is_readonly = bool((dlm_tensor_ver.flags & DLPACK_FLAG_BITMASK_READ_ONLY) != 0)
        used_name = DLPACK_VERSIONED_TENSOR_USED_NAME
    elif cpython.PyCapsule_IsValid(capsule, DLPACK_TENSOR_UNUSED_NAME):
        data = cpython.PyCapsule_GetPointer(capsule, DLPACK_TENSOR_UNUSED_NAME)
        dlm_tensor = <DLManagedTensor*>data
        dl_tensor = &dlm_tensor.dl_tensor
        is_readonly = False
        used_name = DLPACK_TENSOR_USED_NAME
    else:
        raise BufferError("Invalid DLPack capsule")

    cpython.PyCapsule_SetName(capsule, used_name)

    cdef StridedMemoryView view = StridedMemoryView.__new__(StridedMemoryView)
    view.dl_tensor = dl_tensor
    view.metadata = capsule
    view.ptr = <intptr_t>(dl_tensor.data) + <intptr_t>(dl_tensor.byte_offset)
    view.readonly = is_readonly
    view.exporting_obj = exporting_obj
    if dl_tensor.device.device_type == _kDLCPU:
        view.device_id = -1
        view.is_device_accessible = False
    elif dl_tensor.device.device_type in (_kDLCUDA, _kDLCUDAHost, _kDLCUDAManaged):
        view.device_id = dl_tensor.device.device_id
        view.is_device_accessible = True
    else:
        raise BufferError("device not supported")
    return view


cdef int _smv_managed_tensor_allocator(
    DLTensor* prototype,
    DLManagedTensorVersioned** out,
    void* error_ctx,
    void (*SetError)(void* error_ctx, const char* kind, const char* message) noexcept,
) noexcept with gil:
    if out != NULL:
        out[0] = NULL
    if SetError != NULL:
        SetError(error_ctx, b"NotImplementedError", b"managed_tensor_allocator is not supported by StridedMemoryView")
    cpython.PyErr_SetString(NotImplementedError, b"managed_tensor_allocator is not supported by StridedMemoryView")
    return -1


cdef int _smv_managed_tensor_from_py_object_no_sync(
    void* py_object,
    DLManagedTensorVersioned** out,
) noexcept with gil:
    cdef DLManagedTensorVersioned* dlm_tensor_ver = NULL
    if out == NULL:
        cpython.PyErr_SetString(RuntimeError, b"out cannot be NULL")
        return -1
    out[0] = NULL
    cdef object obj = <object>py_object
    if not isinstance(obj, StridedMemoryView):
        cpython.PyErr_SetString(TypeError, b"py_object must be a StridedMemoryView")
        return -1
    try:
        dlm_tensor_ver = _smv_allocate_dlm_tensor_versioned()
        _smv_fill_managed_tensor_versioned(dlm_tensor_ver, <StridedMemoryView>obj)
    except Exception:
        _smv_versioned_deleter(dlm_tensor_ver)
        return -1
    out[0] = dlm_tensor_ver
    return 0


cdef int _smv_managed_tensor_to_py_object_no_sync(
    DLManagedTensorVersioned* tensor,
    void** out_py_object,
) noexcept with gil:
    cdef object capsule
    cdef object py_view
    if out_py_object == NULL:
        cpython.PyErr_SetString(RuntimeError, b"out_py_object cannot be NULL")
        return -1
    out_py_object[0] = NULL
    if tensor == NULL:
        cpython.PyErr_SetString(RuntimeError, b"tensor cannot be NULL")
        return -1
    try:
        capsule = cpython.PyCapsule_New(
            <void*>tensor,
            DLPACK_VERSIONED_TENSOR_UNUSED_NAME,
            _smv_pycapsule_deleter,
        )
        py_view = _smv_from_dlpack_capsule(capsule, capsule)
        cpython.Py_INCREF(py_view)
        out_py_object[0] = <void*>py_view
    except Exception:
        return -1
    return 0


cdef int _smv_dltensor_from_py_object_no_sync(
    void* py_object,
    DLTensor* out,
) noexcept with gil:
    if out == NULL:
        cpython.PyErr_SetString(RuntimeError, b"out cannot be NULL")
        return -1
    cdef object obj = <object>py_object
    if not isinstance(obj, StridedMemoryView):
        cpython.PyErr_SetString(TypeError, b"py_object must be a StridedMemoryView")
        return -1
    try:
        _smv_setup_dltensor_borrowed(out, <StridedMemoryView>obj)
    except Exception:
        return -1
    return 0


cdef int _smv_current_work_stream(
    _DLDeviceType device_type,
    int32_t device_id,
    void** out_current_stream,
) noexcept with gil:
    if out_current_stream == NULL:
        cpython.PyErr_SetString(RuntimeError, b"out_current_stream cannot be NULL")
        return -1
    # cuda.core has no global/current stream state today.
    out_current_stream[0] = NULL
    return 0


cdef void _init_smv_dlpack_exchange_api():
    global _SMV_DLPACK_EXCHANGE_API_INITED
    if _SMV_DLPACK_EXCHANGE_API_INITED:
        return
    _SMV_DLPACK_EXCHANGE_API.header.version.major = DLPACK_MAJOR_VERSION
    _SMV_DLPACK_EXCHANGE_API.header.version.minor = DLPACK_MINOR_VERSION
    _SMV_DLPACK_EXCHANGE_API.header.prev_api = NULL
    _SMV_DLPACK_EXCHANGE_API.managed_tensor_allocator = _smv_managed_tensor_allocator
    _SMV_DLPACK_EXCHANGE_API.managed_tensor_from_py_object_no_sync = _smv_managed_tensor_from_py_object_no_sync
    _SMV_DLPACK_EXCHANGE_API.managed_tensor_to_py_object_no_sync = _smv_managed_tensor_to_py_object_no_sync
    _SMV_DLPACK_EXCHANGE_API.dltensor_from_py_object_no_sync = _smv_dltensor_from_py_object_no_sync
    _SMV_DLPACK_EXCHANGE_API.current_work_stream = _smv_current_work_stream
    _SMV_DLPACK_EXCHANGE_API_INITED = True


_init_smv_dlpack_exchange_api()
# cdef classes are immutable types in Cython 3, so inject these attributes
# directly into the type dict.
(<dict>(<PyTypeObject*>StridedMemoryView).tp_dict)["__dlpack_c_exchange_api__"] = _SMV_DLPACK_EXCHANGE_API_CAPSULE
(<dict>(<PyTypeObject*>StridedMemoryView).tp_dict)["__c_dlpack_exchange_api__"] = _SMV_DLPACK_EXCHANGE_API_CAPSULE
PyType_Modified(<PyTypeObject*>StridedMemoryView)


cdef str get_simple_repr(obj):
    # TODO: better handling in np.dtype objects
    cdef object obj_class
    cdef str obj_repr
    if isinstance(obj, type):
        obj_class = obj
    else:
        obj_class = obj.__class__
    if obj_class.__module__ in (None, "builtins"):
        obj_repr = obj_class.__name__
    else:
        obj_repr = f"{obj_class.__module__}.{obj_class.__name__}"
    return obj_repr


cdef bint check_has_dlpack(obj) except*:
    cdef bint has_dlpack
    if hasattr(obj, "__dlpack__") and hasattr(obj, "__dlpack_device__"):
        has_dlpack = True
    elif hasattr(obj, "__cuda_array_interface__"):
        has_dlpack = False
    else:
        raise RuntimeError(
            "the input object does not support any data exchange protocol")
    return has_dlpack


cdef class _StridedMemoryViewProxy:
    cdef readonly:
        object obj
        bint has_dlpack

    def __init__(self, obj):
        self.obj = obj
        self.has_dlpack = check_has_dlpack(obj)

    cpdef StridedMemoryView view(self, stream_ptr=None):
        if self.has_dlpack:
            return StridedMemoryView.from_dlpack(self.obj, stream_ptr)
        else:
            return StridedMemoryView.from_cuda_array_interface(self.obj, stream_ptr)


cdef StridedMemoryView view_as_dlpack(obj, stream_ptr, view=None):
    cdef int dldevice, device_id
    cdef bint is_device_accessible, is_readonly
    is_device_accessible = False
    dldevice, device_id = obj.__dlpack_device__()
    if dldevice == _kDLCPU:
        assert device_id == 0
        device_id = -1
        if stream_ptr is None:
            raise BufferError("stream=None is ambiguous with view()")
        elif stream_ptr == -1:
            stream_ptr = None
    elif dldevice == _kDLCUDA:
        assert device_id >= 0
        is_device_accessible = True
        # no need to check other stream values, it's a pass-through
        if stream_ptr is None:
            raise BufferError("stream=None is ambiguous with view()")
    elif dldevice in (_kDLCUDAHost, _kDLCUDAManaged):
        is_device_accessible = True
        # just do a pass-through without any checks, as pinned/managed memory can be
        # accessed on both host and device
    else:
        raise BufferError("device not supported")

    cdef object capsule
    try:
        capsule = obj.__dlpack__(
            stream=int(stream_ptr) if stream_ptr else None,
            max_version=(DLPACK_MAJOR_VERSION, DLPACK_MINOR_VERSION))
    except TypeError:
        capsule = obj.__dlpack__(
            stream=int(stream_ptr) if stream_ptr else None)

    cdef void* data = NULL
    cdef DLTensor* dl_tensor
    cdef DLManagedTensorVersioned* dlm_tensor_ver
    cdef DLManagedTensor* dlm_tensor
    cdef const char *used_name
    if cpython.PyCapsule_IsValid(
            capsule, DLPACK_VERSIONED_TENSOR_UNUSED_NAME):
        data = cpython.PyCapsule_GetPointer(
            capsule, DLPACK_VERSIONED_TENSOR_UNUSED_NAME)
        dlm_tensor_ver = <DLManagedTensorVersioned*>data
        dl_tensor = &dlm_tensor_ver.dl_tensor
        is_readonly = bool((dlm_tensor_ver.flags & DLPACK_FLAG_BITMASK_READ_ONLY) != 0)
        used_name = DLPACK_VERSIONED_TENSOR_USED_NAME
    elif cpython.PyCapsule_IsValid(
            capsule, DLPACK_TENSOR_UNUSED_NAME):
        data = cpython.PyCapsule_GetPointer(
            capsule, DLPACK_TENSOR_UNUSED_NAME)
        dlm_tensor = <DLManagedTensor*>data
        dl_tensor = &dlm_tensor.dl_tensor
        is_readonly = False
        used_name = DLPACK_TENSOR_USED_NAME
    else:
        assert False

    cpython.PyCapsule_SetName(capsule, used_name)

    cdef StridedMemoryView buf = StridedMemoryView() if view is None else view
    buf.dl_tensor = dl_tensor
    buf.metadata = capsule
    buf.ptr = <intptr_t>(dl_tensor.data)
    buf.device_id = device_id
    buf.is_device_accessible = is_device_accessible
    buf.readonly = is_readonly
    buf.exporting_obj = obj

    return buf


@functools.lru_cache
def _typestr2dtype(str typestr):
    return numpy.dtype(typestr)


@functools.lru_cache
def _typestr2itemsize(str typestr):
    return _typestr2dtype(typestr).itemsize


cdef object dtype_dlpack_to_numpy(DLDataType* dtype):
    cdef int bits = dtype.bits
    if dtype.lanes != 1:
        # TODO: return a NumPy structured dtype?
        raise NotImplementedError(
            f'vector dtypes (lanes={dtype.lanes}) are not supported')
    if dtype.code == kDLUInt:
        if bits == 8:
            np_dtype = numpy.uint8
        elif bits == 16:
            np_dtype = numpy.uint16
        elif bits == 32:
            np_dtype = numpy.uint32
        elif bits == 64:
            np_dtype = numpy.uint64
        else:
            raise TypeError('uint{} is not supported.'.format(bits))
    elif dtype.code == kDLInt:
        if bits == 8:
            np_dtype = numpy.int8
        elif bits == 16:
            np_dtype = numpy.int16
        elif bits == 32:
            np_dtype = numpy.int32
        elif bits == 64:
            np_dtype = numpy.int64
        else:
            raise TypeError('int{} is not supported.'.format(bits))
    elif dtype.code == kDLFloat:
        if bits == 16:
            np_dtype = numpy.float16
        elif bits == 32:
            np_dtype = numpy.float32
        elif bits == 64:
            np_dtype = numpy.float64
        else:
            raise TypeError('float{} is not supported.'.format(bits))
    elif dtype.code == kDLComplex:
        # TODO(leofang): support complex32
        if bits == 64:
            np_dtype = numpy.complex64
        elif bits == 128:
            np_dtype = numpy.complex128
        else:
            raise TypeError('complex{} is not supported.'.format(bits))
    elif dtype.code == kDLBool:
        if bits == 8:
            np_dtype = numpy.bool_
        else:
            raise TypeError(f'{bits}-bit bool is not supported')
    elif dtype.code == kDLBfloat:
        if bfloat16 is not None:
            np_dtype = numpy.dtype("bfloat16")
        else:
            raise NotImplementedError(
                'Support for bfloat16 within cuda-core requires `ml_dtypes` '
                'to be installed.'
            )
    else:
        raise TypeError('Unsupported dtype. dtype code: {}'.format(dtype.code))

    # We want the dtype object not just the type object
    return numpy.dtype(np_dtype)


cpdef StridedMemoryView view_as_cai(obj, stream_ptr, view=None):
    cdef dict cai_data = obj.__cuda_array_interface__
    if cai_data["version"] < 3:
        raise BufferError("only CUDA Array Interface v3 or above is supported")
    if cai_data.get("mask") is not None:
        raise BufferError("mask is not supported")
    if stream_ptr is None:
        raise BufferError("stream=None is ambiguous with view()")

    cdef StridedMemoryView buf = StridedMemoryView() if view is None else view
    buf.exporting_obj = obj
    buf.metadata = cai_data
    buf.dl_tensor = NULL
    # Validate shape/strides/typestr eagerly so constructor paths fail fast.
    buf.get_layout()
    buf.ptr, buf.readonly = cai_data["data"]
    buf.is_device_accessible = True
    if buf.ptr != 0:
        buf.device_id = handle_return(
            driver.cuPointerGetAttribute(
                driver.CUpointer_attribute.CU_POINTER_ATTRIBUTE_DEVICE_ORDINAL,
                buf.ptr))
    else:
        buf.device_id = handle_return(driver.cuCtxGetDevice())

    cdef intptr_t producer_s, consumer_s
    cdef EventHandle h_event
    stream_ptr = int(stream_ptr)
    if stream_ptr != -1:
        stream = cai_data.get("stream")
        if stream is not None:
            producer_s = <intptr_t>(stream)
            consumer_s = <intptr_t>(stream_ptr)
            assert producer_s > 0
            # establish stream order
            if producer_s != consumer_s:
                with nogil:
                    h_event = create_event_handle_noctx(cydriver.CUevent_flags.CU_EVENT_DISABLE_TIMING)
                    HANDLE_RETURN(cydriver.cuEventRecord(
                        as_cu(h_event), <cydriver.CUstream>producer_s))
                    HANDLE_RETURN(cydriver.cuStreamWaitEvent(
                        <cydriver.CUstream>consumer_s, as_cu(h_event), 0))
        elif _is_torch_tensor(obj):
            # PyTorch's __cuda_array_interface__ reports version 2 and
            # omits the "stream" field, so the standard CAI sync path
            # above is a no-op for torch tensors. This is unsafe: the
            # consumer has no guarantee that the producer's work is
            # visible. We fix this by querying PyTorch's current CUDA
            # stream via the AOTI stable C ABI and performing the same
            # event-based stream ordering.
            _get_tensor_bridge().sync_torch_stream(
                buf.device_id, <intptr_t>(stream_ptr))

    return buf


cpdef StridedMemoryView view_as_array_interface(obj, view=None):
    cdef dict data = obj.__array_interface__
    if data["version"] < 3:
        raise BufferError("only NumPy Array Interface v3 or above is supported")
    if data.get("mask") is not None:
        raise BufferError("mask is not supported")

    cdef StridedMemoryView buf = StridedMemoryView() if view is None else view
    buf.exporting_obj = obj
    buf.metadata = data
    buf.dl_tensor = NULL
    # Validate shape/strides/typestr eagerly so constructor paths fail fast.
    buf.get_layout()
    buf.ptr, buf.readonly = data["data"]
    buf.is_device_accessible = False
    buf.device_id = handle_return(driver.cuCtxGetDevice())
    return buf


def args_viewable_as_strided_memory(tuple arg_indices):
    """
    Decorator to create proxy objects to :obj:`StridedMemoryView` for the
    specified positional arguments.

    This allows array/tensor attributes to be accessed inside the function
    implementation, while keeping the function body array-library-agnostic (if
    desired).

    Inside the decorated function, the specified arguments become instances
    of an (undocumented) proxy type, regardless of their original source. A
    :obj:`StridedMemoryView` instance can be obtained by passing the (consumer)
    stream pointer (as a Python `int`) to the proxy's ``view()`` method. For
    example:

    .. code-block:: python

        @args_viewable_as_strided_memory((1,))
        def my_func(arg0, arg1, arg2, stream: Stream):
            # arg1 can be any object supporting DLPack or CUDA Array Interface
            view = arg1.view(stream.handle)
            assert isinstance(view, StridedMemoryView)
            ...

    Parameters
    ----------
    arg_indices : tuple
        The indices of the target positional arguments.
    """
    def wrapped_func_with_indices(func):
        @functools.wraps(func)
        def wrapped_func(*args, **kwargs):
            args = list(args)
            cdef int idx
            for idx in arg_indices:
                args[idx] = _StridedMemoryViewProxy(args[idx])
            return func(*args, **kwargs)
        return wrapped_func
    return wrapped_func_with_indices


cdef inline _StridedLayout layout_from_dlpack(DLTensor* dl_tensor):
    cdef _StridedLayout layout = _StridedLayout.__new__(_StridedLayout)
    cdef int nbits = dl_tensor.dtype.bits * dl_tensor.dtype.lanes
    cdef int itemsize = nbits >> 3
    if (itemsize << 3) != nbits:
        raise ValueError("dl_tensor.dtype.bits must be a multiple of 8")
    layout.init_from_ptr(dl_tensor.ndim, dl_tensor.shape, dl_tensor.strides, itemsize)
    return layout


cdef _StridedLayout layout_from_cai(object metadata):
    cdef _StridedLayout layout = _StridedLayout.__new__(_StridedLayout)
    cdef object shape = metadata["shape"]
    cdef object strides = metadata.get("strides")
    cdef int itemsize = _typestr2itemsize(metadata["typestr"])
    layout.init_from_tuple(shape, strides, itemsize, True)
    return layout


cdef inline intptr_t get_data_ptr(object buffer, _StridedLayout layout) except? 0:
    return <intptr_t>(int(buffer.handle)) + layout.get_slice_offset_in_bytes()


cdef inline int view_buffer_strided(
    StridedMemoryView view,
    object buffer,
    _StridedLayout layout,
    object dtype,
    bint is_readonly,
) except -1:
    if dtype is not None:
        dtype = numpy.dtype(dtype)
        if dtype.itemsize != layout.itemsize:
            raise ValueError(
                f"The dtype's itemsize ({dtype.itemsize}) does not match the layout's "
                f"itemsize ({layout.itemsize})."
            )
    # Check that the layout's offset range [min_offset, max_offset] fits
    # within the [0, buffer.size - 1] range.
    # The required_size_in_bytes check fails if min_offset < 0.
    # NB. For external memory, both positive and negative offsets can be valid,
    # but for a proper check we'd need to know both size and data offset,
    # while neither is reported by the packages.
    cdef bint is_allocated = buffer.memory_resource is not None
    if is_allocated and buffer.size < layout.get_required_size_in_bytes():
        raise ValueError(
            f"Buffer size is too small for the layout. "
            f"Expected at least {layout.get_required_size_in_bytes()} bytes, "
            f"got {buffer.size} bytes."
        )
    # set the public attributes
    view.ptr = get_data_ptr(buffer, layout)
    view.device_id = buffer.device_id
    view.is_device_accessible = buffer.is_device_accessible
    view.readonly = is_readonly
    view.exporting_obj = view._buffer = buffer
    # no dlpack/cai metadata
    view.dl_tensor = NULL
    view.metadata = None
    # we get the layout from the caller
    view._layout = layout
    view._dtype = dtype
    return 0