#include #ifdef _MSC_VER #include #endif #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include #include template <> void THPPointer::free() { if (ptr) { c10::raw::intrusive_ptr::decref(ptr); } } PyTypeObject* THPStorageClass = nullptr; PyObject* THPStorage_NewWithStorage( PyTypeObject* type, c10::Storage _storage, c10::impl::PyInterpreterStatus status, bool allow_preexisting_pyobj) { TORCH_CHECK( PyType_IsSubtype(type, &THPStorageType), "Creating a Storage subclass from a class that does not inherit from ", "Storage is not possible. Make sure your class inherits from Storage."); auto maybe_pyobj = _storage.unsafeGetStorageImpl()->pyobj_slot()->check_pyobj( getPyInterpreter(), /*ignore_hermetic_tls=*/false); if (maybe_pyobj.has_value() && maybe_pyobj.value()) { TORCH_CHECK( allow_preexisting_pyobj, "Creating a new Storage subclass ", type->tp_name, " but the raw Storage object is already associated to a python object ", "of type ", maybe_pyobj.value()->ob_type->tp_name); PyObject* obj = *maybe_pyobj; PyTypeObject* obj_type = Py_TYPE(obj); TORCH_CHECK( obj_type == type || PyType_IsSubtype(obj_type, type), "Creating a new Storage subclass ", type->tp_name, " but the raw Storage object is already associated to a python object ", "of type ", maybe_pyobj.value()->ob_type->tp_name, " which is not a subclass of the " "requested type"); return THPStorage_Wrap(std::move(_storage)); } PyObject* obj = type->tp_alloc(type, 0); TORCH_CHECK(obj, "Failed to allocate a ", type->tp_name, " object"); auto s = (THPStorage*)obj; new (&s->cdata) c10::MaybeOwned(); s->cdata = c10::MaybeOwned::owned(std::move(_storage)); if (!c10::impl::HermeticPyObjectTLS::get_state()) { s->is_hermetic = false; const auto& storage = THPStorage_Unpack(s); storage.unsafeGetStorageImpl()->pyobj_slot()->init_pyobj( getPyInterpreter(), obj, status); } else { s->is_hermetic = true; } return obj; } // Wraps the c10::Storage with a storage PyObject PyObject* THPStorage_Wrap(c10::Storage storage) { c10::StorageImpl* storage_impl = storage.unsafeGetStorageImpl(); if (c10::impl::HermeticPyObjectTLS::get_state()) { return THPStorage_NewWithStorage( THPStorageClass, std::move(storage), c10::impl::PyInterpreterStatus::DEFINITELY_UNINITIALIZED); } c10::impl::PyObjectSlot* pyobj_slot = storage_impl->pyobj_slot(); // If the StorageImpl has a PyObject that is managed by a different // interpreter than the current one, create a new StorageImpl that points to // the same data and then create the Python storage from that. // NOTE: This is only supposed to happen in MultiPy if (pyobj_slot->has_pyobj_nonhermetic() && !pyobj_slot->check_interpreter(getPyInterpreter())) { return THPStorage_NewWithStorage( THPStorageClass, c10::newStorageImplFromRefcountedDataPtr(storage), c10::impl::PyInterpreterStatus::DEFINITELY_UNINITIALIZED); } std::optional maybe_pyobj = pyobj_slot->check_pyobj( getPyInterpreter(), /*ignore_hermetic_tls=*/false); c10::impl::PyInterpreterStatus status = c10::impl::PyInterpreterStatus::TAGGED_BY_US; if (maybe_pyobj.has_value()) { auto obj = *maybe_pyobj; if (obj) { TORCH_CHECK( THPStorage_Check(obj), "Expected a storage type, but got ", Py_TYPE(obj)->tp_name); if (pyobj_slot->owns_pyobj()) { pyobj_slot->set_owns_pyobj(false); reinterpret_cast(obj)->cdata = c10::MaybeOwned::owned(std::move(storage)); return obj; } else { Py_INCREF(obj); return obj; } } status = c10::impl::PyInterpreterStatus::TAGGED_BY_US; } else { if (storage.use_count() <= 1) { status = c10::impl::PyInterpreterStatus::DEFINITELY_UNINITIALIZED; } else { status = c10::impl::PyInterpreterStatus::MAYBE_UNINITIALIZED; } } return THPStorage_NewWithStorage(THPStorageClass, std::move(storage), status); } static bool THPStorage_isPreservable(THPStorage* self) { if (self->cdata.unsafeIsBorrowed()) { return false; } auto const& storage = THPStorage_Unpack(self); if (self->is_hermetic) { return false; } if (storage.unsafeGetStorageImpl()->pyobj_slot()->check_pyobj( getPyInterpreter(), /*ignore_hermetic_tls=*/true) != std::make_optional((PyObject*)self)) { return false; } if (storage.use_count() <= 1) { return false; } return true; } static bool THPStorage_tryPreserve(THPStorage* self) { if (!THPStorage_isPreservable(self)) { return false; } const auto& storage = THPStorage_Unpack(self); c10::StorageImpl* storage_impl = storage.unsafeGetStorageImpl(); auto maybe_pyobj = storage_impl->pyobj_slot()->check_pyobj( getPyInterpreter(), /*ignore_hermetic_tls=*/true); // NOTE: It is possible to just set the PyObjectSlot here, but the point is // that we should have already set PyObjectSlot when the storage PyObject was // created. TORCH_INTERNAL_ASSERT( maybe_pyobj.has_value(), "Trying to preserve a Python storage whose PyObjectSlot does not have a PyObject"); PyObject* pyobj = *maybe_pyobj; TORCH_CHECK( THPStorage_Check(pyobj), "Expected a storage type, but got ", Py_TYPE(pyobj)->tp_name); TORCH_INTERNAL_ASSERT( (void*)pyobj == (void*)self, "Python storage and the PyObject in the internal PyObjectSlot are not at the same address"); TORCH_INTERNAL_ASSERT(!storage_impl->pyobj_slot()->owns_pyobj()); storage_impl->pyobj_slot()->set_owns_pyobj(true); Py_INCREF(self); self->cdata = c10::MaybeOwned::borrowed(storage); return true; } static void THPStorage_subclass_dealloc(PyObject* self) { THPStorage* _self = (THPStorage*)self; if (THPStorage_tryPreserve(_self)) { return; } // Some subclass of StorageBase could be GC-tracked objects even // though the base class is not auto* type = Py_TYPE(self); if (PyType_HasFeature(type, Py_TPFLAGS_HAVE_GC) != 0) { PyObject_GC_UnTrack(self); } bool has_finalizer = type->tp_finalize || type->tp_del; if (type->tp_finalize) { PyObject_GC_Track(self); if (PyObject_CallFinalizerFromDealloc(self) < 0) { // The finalizer has resurrected the PyObject and there is a new Python // reference to it, so we can just stop deallocating. Read about // resurrection from `__del__` here: // https://docs.python.org/3/reference/datamodel.html#object.__del__ return; } PyObject_GC_UnTrack(self); } // base test is unnecessary as THPStorae does not set this if (type->tp_weaklistoffset) { PyObject_ClearWeakRefs(self); } if (type->tp_del) { PyObject_GC_Track(self); type->tp_del(self); if (Py_REFCNT(self) > 0) { // Resurrected (see above comment about resurrection from `__del__`) return; } PyObject_GC_UnTrack(self); } if (has_finalizer) { /* New weakrefs could be created during the finalizer call. If this occurs, clear them out without calling their finalizers since they might rely on part of the object being finalized that has already been destroyed. */ if (type->tp_weaklistoffset) { /* Modeled after GET_WEAKREFS_LISTPTR() */ PyWeakReference** list = (PyWeakReference**)PyObject_GET_WEAKREFS_LISTPTR(self); while (*list) _PyWeakref_ClearRef(*list); } } // Clear slots { PyTypeObject* base = type; while (base != &THPStorageType) { if (Py_SIZE(base)) { clear_slots(base, self); } base = base->tp_base; TORCH_INTERNAL_ASSERT(base); } } // Clear __dict__ if (C10_LIKELY(type->tp_dictoffset)) { PyObject** dictptr = _PyObject_GetDictPtr(self); if (dictptr != nullptr) { PyObject* dict = *dictptr; if (dict != nullptr) { Py_DECREF(dict); *dictptr = nullptr; } } } TORCH_INTERNAL_ASSERT(Py_TYPE(self) == type); _self->cdata.~MaybeOwned(); Py_TYPE(_self)->tp_free(self); TORCH_INTERNAL_ASSERT(type->tp_flags & Py_TPFLAGS_HEAPTYPE); Py_DECREF(type); } static PyObject* THPStorage_pynew( PyTypeObject* type, PyObject* args, PyObject* kwargs) { HANDLE_TH_ERRORS TORCH_CHECK( type != &THPStorageType, "Cannot directly construct StorageBase; subclass it and then construct that"); static torch::PythonArgParser parser({ THPStorageStr "(*, int64_t allocator=None, Device device=None)", THPStorageStr "(int64_t size, *, int64_t allocator=None, Device device=None)", THPStorageStr "(PyObject* sequence, *, int64_t allocator=None, Device device=None)", }); torch::ParsedArgs<3> parsed_args; auto r = parser.parse(args, kwargs, parsed_args); int allocator_arg_idx = 0; int device_arg_idx = 1; if (r.idx > 0) { allocator_arg_idx = 1; device_arg_idx = 2; } std::optional allocator_opt = r.toInt64Optional(allocator_arg_idx); std::optional device_opt = r.deviceOptional(device_arg_idx); TORCH_CHECK( !allocator_opt.has_value() || !device_opt.has_value(), THPStorageStr, "(): only one or neither of 'allocator' or 'device' can ", "be given, but not both"); PyObject* self = nullptr; c10::Allocator* allocator = nullptr; at::OptionalDeviceGuard device_guard; if (allocator_opt.has_value()) { // NOLINTNEXTLINE(performance-no-int-to-ptr) allocator = reinterpret_cast(allocator_opt.value()); } else if (device_opt.has_value()) { at::Device device = device_opt.value(); torch::utils::maybe_initialize_device(device); switch (device.type()) { case at::kCPU: allocator = c10::GetDefaultCPUAllocator(); break; #ifdef USE_CUDA case at::kCUDA: allocator = c10::cuda::CUDACachingAllocator::get(); break; #endif #ifdef USE_MPS case at::kMPS: allocator = at::mps::GetMPSAllocator(); break; #endif case at::DeviceType::XPU: case at::DeviceType::HPU: case at::DeviceType::Meta: case at::DeviceType::PrivateUse1: case at::DeviceType::MAIA: allocator = c10::GetAllocator(device.type()); break; default: // NOLINTEND(bugprone-branch-clone) TORCH_CHECK( false, THPStorageStr, "(): Storage device not recognized: ", device.type()); } device_guard.reset_device(device); } else { allocator = c10::GetDefaultCPUAllocator(); } // torch.Storage(*, ...) if (r.idx == 0) { self = THPStorage_NewWithStorage( type, make_storage_impl( c10::StorageImpl::use_byte_size_t(), 0, at::DataPtr(), allocator, /*resizable=*/true, device_opt), c10::impl::PyInterpreterStatus::DEFINITELY_UNINITIALIZED); // torch.Storage(size, *, ...) } else if (r.idx == 1) { int64_t size = r.toInt64(0); self = THPStorage_NewWithStorage( type, make_storage_impl( c10::StorageImpl::use_byte_size_t(), size, at::DataPtr(), allocator, /*resizable=*/true, device_opt), c10::impl::PyInterpreterStatus::DEFINITELY_UNINITIALIZED); // torch.Storage(sequence, *, ...) } else if (r.idx == 2) { PyObject* sequence = r.pyobject(0); Py_ssize_t length = PySequence_Length(sequence); TORCH_CHECK( PySequence_Check(sequence), THPStorageStr, "(): Expected a sequence type, but got ", THPUtils_typename(sequence)); TORCH_CHECK( length >= 0, THPStorageStr, "(): Could not obtain the length of sequence of type ", THPUtils_typename(sequence)); self = THPStorage_NewWithStorage( type, make_storage_impl( c10::StorageImpl::use_byte_size_t(), length, at::DataPtr(), allocator, /*resizable=*/true, device_opt), c10::impl::PyInterpreterStatus::DEFINITELY_UNINITIALIZED); THPObjectPtr item; try { const auto& storage = THPStorage_Unpack(self); for (Py_ssize_t i = 0; i < length; i++) { item = PySequence_GetItem(sequence, i); uint8_t value = THPByteUtils_unpackReal(item.get()); if (allocator == c10::GetDefaultCPUAllocator()) { static_cast(storage.mutable_data())[i] = value; } else { // TODO: this might be slow - consider batched updates? storage_set(storage, i, value); } } } catch (const std::exception& e) { TORCH_CHECK( THPStorageStr "(): tried to construct a storage from a sequence (", THPUtils_typename(sequence), "), ", "but one of the items was of type ", THPUtils_typename(item.get()), " instead of int"); return nullptr; } } return self; Py_RETURN_NONE; END_HANDLE_TH_ERRORS } static Py_ssize_t THPStorage_length(THPStorage* self) { HANDLE_TH_ERRORS THPStorage_assertNotNull(self); return static_cast(THPStorage_Unpack(self).nbytes()); END_HANDLE_TH_ERRORS_RET(-1) } static PyObject* THPStorage_get(THPStorage* self, PyObject* index) { HANDLE_TH_ERRORS THPStorage_assertNotNull(self); const auto& storage = THPStorage_Unpack(self); int64_t len = static_cast(storage.nbytes()); /* Integer index */ if (THPUtils_checkLong(index)) { int64_t nindex = THPUtils_unpackLong(index); if (nindex < 0) nindex += len; if (nindex < 0 || nindex >= len) { PyErr_SetString( PyExc_IndexError, fmt::format( "index {} out of range for storage of size {}", nindex, len)); return nullptr; } uint8_t value = storage_get(storage, nindex); return THPByteUtils_newReal(value); /* Slice index */ } else if (PySlice_Check(index)) { // NOLINTNEXTLINE(cppcoreguidelines-init-variables) Py_ssize_t start, stop, slicelength, step; if (PySlice_Unpack(index, &start, &stop, &step) < 0) { return nullptr; } slicelength = PySlice_AdjustIndices(len, &start, &stop, step); if (step != 1) { TORCH_CHECK( "Trying to slice with a step of ", step, ", but only a step of " "1 is supported"); return nullptr; } const auto& storage = THPStorage_Unpack(self); auto data = static_cast(storage.mutable_data()); at::StorageImpl* old_storage_impl = storage.unsafeGetStorageImpl(); c10::raw::intrusive_ptr::incref(old_storage_impl); std::optional device_opt = old_storage_impl->device(); auto new_storage_impl = make_storage_impl( c10::StorageImpl::use_byte_size_t(), #ifdef THQUANTIZED slicelength * sizeof(quantized_t), #else slicelength, #endif at::DataPtr( static_cast(data + start), old_storage_impl, [](void* s) { c10::raw::intrusive_ptr::decref(static_cast(s)); }, old_storage_impl->device()), old_storage_impl->allocator(), /* resizable */ false, device_opt); PyObject* _ret = THPStorage_NewWithStorage( Py_TYPE(self), std::move(new_storage_impl), c10::impl::PyInterpreterStatus::DEFINITELY_UNINITIALIZED); return _ret; } PyErr_Format( PyExc_TypeError, "can't index a " THPStorageStr " with %s", THPUtils_typename(index)); return nullptr; END_HANDLE_TH_ERRORS } static int THPStorage_set(THPStorage* self, PyObject* index, PyObject* value) { HANDLE_TH_ERRORS THPStorage_assertNotNull(self); if (!THPByteUtils_checkReal(value)) { TORCH_CHECK( "can only set storage content with a int types, but got ", THPUtils_typename(value), " instead"); return -1; } uint8_t rvalue = THPByteUtils_unpackReal(value); const auto& storage = THPStorage_Unpack(self); if (THPUtils_checkLong(index)) { int64_t nindex = THPUtils_unpackLong(index); storage_set(storage, nindex, rvalue); return 0; } else if (PySlice_Check(index)) { // NOLINTNEXTLINE(cppcoreguidelines-init-variables) Py_ssize_t start, stop, step; Py_ssize_t len = static_cast(storage.nbytes()); if (PySlice_Unpack(index, &start, &stop, &step) < 0) { return -1; } PySlice_AdjustIndices(len, &start, &stop, step); if (step != 1) { TORCH_CHECK( "Trying to slice with a step of ", step, ", but only a step of " "1 is supported"); return 0; } // TODO: check the bounds only once // TODO: fill? for (; start < stop; start++) storage_set(storage, start, rvalue); return 0; } TORCH_CHECK( "can't index a " THPStorageStr " with ", THPUtils_typename(index)); return -1; END_HANDLE_TH_ERRORS_RET(-1) } static PyMappingMethods THPStorage_mappingmethods = { (lenfunc)THPStorage_length, (binaryfunc)THPStorage_get, (objobjargproc)THPStorage_set}; struct THPStorageMeta { PyHeapTypeObject base; }; int THPStorageMetaType_init(PyObject* cls, PyObject* args, PyObject* kwargs); PyTypeObject THPStorageMetaType = { PyVarObject_HEAD_INIT( DEFERRED_ADDRESS(&PyType_Type), 0) "torch._C._StorageMeta", /* tp_name */ sizeof(THPStorageMeta), /* tp_basicsize */ 0, /* tp_itemsize */ nullptr, /* tp_dealloc */ 0, /* tp_vectorcall_offset */ nullptr, /* tp_getattr */ nullptr, /* tp_setattr */ nullptr, /* tp_reserved */ nullptr, /* tp_repr */ nullptr, /* tp_as_number */ nullptr, /* tp_as_sequence */ nullptr, /* tp_as_mapping */ nullptr, /* tp_hash */ nullptr, /* tp_call */ nullptr, /* tp_str */ nullptr, /* tp_getattro */ nullptr, /* tp_setattro */ nullptr, /* tp_as_buffer */ // NOLINTNEXTLINE(misc-redundant-expression) Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE, /* tp_flags */ nullptr, /* tp_doc */ nullptr, /* tp_traverse */ nullptr, /* tp_clear */ nullptr, /* tp_richcompare */ 0, /* tp_weaklistoffset */ nullptr, /* tp_iter */ nullptr, /* tp_iternext */ nullptr, /* tp_methods */ nullptr, /* tp_members */ nullptr, /* tp_getset */ DEFERRED_ADDRESS(&PyType_Type), /* tp_base */ nullptr, /* tp_dict */ nullptr, /* tp_descr_get */ nullptr, /* tp_descr_set */ 0, /* tp_dictoffset */ THPStorageMetaType_init, /* tp_init */ nullptr, /* tp_alloc */ nullptr, /* tp_new */ }; // TODO: implement equality PyTypeObject THPStorageType = { PyVarObject_HEAD_INIT( &THPStorageMetaType, 0) "torch._C.StorageBase", /* tp_name */ sizeof(THPStorage), /* tp_basicsize */ 0, /* tp_itemsize */ nullptr, /* tp_dealloc */ 0, /* tp_vectorcall_offset */ nullptr, /* tp_getattr */ nullptr, /* tp_setattr */ nullptr, /* tp_reserved */ nullptr, /* tp_repr */ nullptr, /* tp_as_number */ nullptr, /* tp_as_sequence */ &THPStorage_mappingmethods, /* tp_as_mapping */ nullptr, /* tp_hash */ nullptr, /* tp_call */ nullptr, /* tp_str */ nullptr, /* tp_getattro */ nullptr, /* tp_setattro */ nullptr, /* tp_as_buffer */ // NOLINTNEXTLINE(misc-redundant-expression) Py_TPFLAGS_DEFAULT | Py_TPFLAGS_BASETYPE, /* tp_flags */ nullptr, /* tp_doc */ nullptr, /* tp_traverse */ nullptr, /* tp_clear */ nullptr, /* tp_richcompare */ 0, /* tp_weaklistoffset */ nullptr, /* tp_iter */ nullptr, /* tp_iternext */ nullptr, /* will be assigned in init */ /* tp_methods */ nullptr, /* will be assigned in init */ /* tp_members */ nullptr, /* tp_getset */ nullptr, /* tp_base */ nullptr, /* tp_dict */ nullptr, /* tp_descr_get */ nullptr, /* tp_descr_set */ 0, /* tp_dictoffset */ nullptr, /* tp_init */ nullptr, /* tp_alloc */ THPStorage_pynew, /* tp_new */ }; int THPStorageMetaType_init(PyObject* cls, PyObject* args, PyObject* kwargs) { if (PyType_Type.tp_init(cls, args, kwargs) < 0) { return -1; } ((PyTypeObject*)cls)->tp_dealloc = (destructor)THPStorage_subclass_dealloc; return 0; } static PyObject* THPStorage_device(THPStorage* self, void* unused) { HANDLE_TH_ERRORS THPStorage_assertNotNull(self); return THPDevice_New(THPStorage_Unpack(self).device()); END_HANDLE_TH_ERRORS } PyObject* THPStorage_get_cdata(THPStorage* self, void* unused) { HANDLE_TH_ERRORS return PyLong_FromVoidPtr(THPStorage_Unpack(self).unsafeGetStorageImpl()); END_HANDLE_TH_ERRORS } typedef PyObject* (*getter)(PyObject*, void*); // NOLINTNEXTLINE(cppcoreguidelines-avoid-c-arrays,modernize-avoid-c-arrays,cppcoreguidelines-avoid-non-const-global-variables) static struct PyGetSetDef THPStorage_properties[] = { {"device", (getter)THPStorage_device, nullptr, nullptr, nullptr}, {"_cdata", (getter)THPStorage_get_cdata, nullptr, nullptr, nullptr}, {nullptr}}; bool THPStorage_init(PyObject* module) { static std::vector methods; THPUtils_addPyMethodDefs(methods, THPStorage_getMethods()); THPUtils_addPyMethodDefs(methods, THPStorage_getSharingMethods()); THPStorageMetaType.tp_base = &PyType_Type; if (PyType_Ready(&THPStorageMetaType) < 0) return false; Py_INCREF(&THPStorageMetaType); PyModule_AddObject(module, "_StorageMeta", (PyObject*)&THPStorageMetaType); THPStorageType.tp_methods = methods.data(); THPStorageType.tp_getset = THPStorage_properties; if (PyType_Ready(&THPStorageType) < 0) return false; Py_INCREF(&THPStorageType); PyModule_AddObject(module, "StorageBase", (PyObject*)&THPStorageType); return true; } void THPStorage_postInit(PyObject* module) { THPStorageClass = (PyTypeObject*)PyObject_GetAttrString(module, "UntypedStorage"); if (!THPStorageClass) throw python_error(); } void THPStorage_assertNotNull(THPStorage* storage) { TORCH_CHECK( THPStorage_Unpack(storage).unsafeGetStorageImpl(), "Got a null Storage"); } void THPStorage_assertNotNull(PyObject* obj) { THPStorage_assertNotNull((THPStorage*)obj); }