Track base class pointers of instances

This commits adds base class pointers of offset base classes (i.e. due
to multiple inheritance) to `registered_instances` so that if such a
pointer is returned we properly recognize it as an existing instance.

Without this, returning a base class pointer will cast to the existing
instance if the pointer happens to coincide with the instance pointer,
but constructs a new instance (quite possibly with a segfault, if
ownership is applied) for unequal base class pointers due to multiple
inheritance.
This commit is contained in:
Jason Rhinelander 2017-04-21 19:01:30 -04:00
parent 14e70650fe
commit 1f8a100d38
5 changed files with 102 additions and 21 deletions

View File

@ -24,6 +24,7 @@ inline PyTypeObject *make_default_metaclass();
/// Additional type information which does not fit into the PyTypeObject /// Additional type information which does not fit into the PyTypeObject
struct type_info { struct type_info {
PyTypeObject *type; PyTypeObject *type;
const std::type_info *cpptype;
size_t type_size; size_t type_size;
void *(*operator_new)(size_t); void *(*operator_new)(size_t);
void (*init_holder)(PyObject *, const void *); void (*init_holder)(PyObject *, const void *);
@ -35,9 +36,11 @@ struct type_info {
void *get_buffer_data = nullptr; void *get_buffer_data = nullptr;
/** A simple type never occurs as a (direct or indirect) parent /** A simple type never occurs as a (direct or indirect) parent
* of a class that makes use of multiple inheritance */ * of a class that makes use of multiple inheritance */
bool simple_type = true; bool simple_type : 1;
/* True if there is no multiple inheritance in this type's inheritance tree */
bool simple_ancestors : 1;
/* for base vs derived holder_type checks */ /* for base vs derived holder_type checks */
bool default_holder = true; bool default_holder : 1;
}; };
PYBIND11_NOINLINE inline internals &get_internals() { PYBIND11_NOINLINE inline internals &get_internals() {
@ -197,7 +200,7 @@ inline PyThreadState *get_thread_state_unchecked() {
// Forward declarations // Forward declarations
inline void keep_alive_impl(handle nurse, handle patient); inline void keep_alive_impl(handle nurse, handle patient);
inline void register_instance(void *self); inline void register_instance(void *self, const type_info *tinfo);
inline PyObject *make_new_instance(PyTypeObject *type, bool allocate_value = true); inline PyObject *make_new_instance(PyTypeObject *type, bool allocate_value = true);
class type_caster_generic { class type_caster_generic {
@ -338,7 +341,7 @@ public:
throw cast_error("unhandled return_value_policy: should not happen!"); throw cast_error("unhandled return_value_policy: should not happen!");
} }
register_instance(wrapper); register_instance(wrapper, tinfo);
tinfo->init_holder(inst.ptr(), existing_holder); tinfo->init_holder(inst.ptr(), existing_holder);
return inst.release(); return inst.release();

View File

@ -185,18 +185,35 @@ inline PyTypeObject* make_default_metaclass() {
return type; return type;
} }
inline void register_instance(void *self) { /// For multiple inheritance types we need to recursively register/deregister base pointers for any
auto *inst = (instance_essentials<void> *) self; /// base classes with pointers that are difference from the instance value pointer so that we can
get_internals().registered_instances.emplace(inst->value, self); /// correctly recognize an offset base class pointer. This calls a function with any offset base ptrs.
inline void traverse_offset_bases(void *valueptr, const detail::type_info *tinfo, void *self,
bool (*f)(void * /*parentptr*/, void * /*self*/)) {
for (handle h : reinterpret_borrow<tuple>(tinfo->type->tp_bases)) {
if (auto parent_tinfo = get_type_info((PyTypeObject *) h.ptr())) {
for (auto &c : parent_tinfo->implicit_casts) {
if (c.first == tinfo->cpptype) {
auto *parentptr = c.second(valueptr);
if (parentptr != valueptr)
f(parentptr, self);
traverse_offset_bases(parentptr, parent_tinfo, self, f);
break;
}
}
}
}
} }
inline bool deregister_instance(void *self) { inline bool register_instance_impl(void *ptr, void *self) {
auto *inst = (instance_essentials<void> *) self; get_internals().registered_instances.emplace(ptr, self);
auto type = Py_TYPE(inst); return true; // unused, but gives the same signature as the deregister func
}
inline bool deregister_instance_impl(void *ptr, void *self) {
auto &registered_instances = get_internals().registered_instances; auto &registered_instances = get_internals().registered_instances;
auto range = registered_instances.equal_range(inst->value); auto range = registered_instances.equal_range(ptr);
for (auto it = range.first; it != range.second; ++it) { for (auto it = range.first; it != range.second; ++it) {
if (type == Py_TYPE(it->second)) { if (Py_TYPE(self) == Py_TYPE(it->second)) {
registered_instances.erase(it); registered_instances.erase(it);
return true; return true;
} }
@ -204,6 +221,21 @@ inline bool deregister_instance(void *self) {
return false; return false;
} }
inline void register_instance(void *self, const type_info *tinfo) {
auto *inst = (instance_essentials<void> *) self;
register_instance_impl(inst->value, self);
if (!tinfo->simple_ancestors)
traverse_offset_bases(inst->value, tinfo, self, register_instance_impl);
}
inline bool deregister_instance(void *self, const detail::type_info *tinfo) {
auto *inst = (instance_essentials<void> *) self;
bool ret = deregister_instance_impl(inst->value, self);
if (!tinfo->simple_ancestors)
traverse_offset_bases(inst->value, tinfo, self, deregister_instance_impl);
return ret;
}
/// Creates a new instance which, by default, includes allocation (but not construction of) the /// Creates a new instance which, by default, includes allocation (but not construction of) the
/// wrapped C++ instance. If allocating value, the instance is registered; otherwise /// wrapped C++ instance. If allocating value, the instance is registered; otherwise
/// register_instance will need to be called once the value has been assigned. /// register_instance will need to be called once the value has been assigned.
@ -215,7 +247,7 @@ inline PyObject *make_new_instance(PyTypeObject *type, bool allocate_value /*= t
instance->holder_constructed = false; instance->holder_constructed = false;
if (allocate_value) { if (allocate_value) {
instance->value = tinfo->operator_new(tinfo->type_size); instance->value = tinfo->operator_new(tinfo->type_size);
register_instance(self); register_instance(self, tinfo);
} else { } else {
instance->value = nullptr; instance->value = nullptr;
} }
@ -248,12 +280,15 @@ extern "C" inline int pybind11_object_init(PyObject *self, PyObject *, PyObject
inline void clear_instance(PyObject *self) { inline void clear_instance(PyObject *self) {
auto instance = (instance_essentials<void> *) self; auto instance = (instance_essentials<void> *) self;
bool has_value = instance->value; bool has_value = instance->value;
type_info *tinfo = nullptr;
if (has_value || instance->holder_constructed) { if (has_value || instance->holder_constructed) {
auto type = Py_TYPE(self); auto type = Py_TYPE(self);
get_type_info(type)->dealloc(self); tinfo = get_type_info(type);
tinfo->dealloc(self);
} }
if (has_value) { if (has_value) {
if (!deregister_instance(self)) if (!tinfo) tinfo = get_type_info(Py_TYPE(self));
if (!deregister_instance(self, tinfo))
pybind11_fail("pybind11_object_dealloc(): Tried to deallocate unregistered instance!"); pybind11_fail("pybind11_object_dealloc(): Tried to deallocate unregistered instance!");
if (instance->weakrefs) if (instance->weakrefs)

View File

@ -813,10 +813,13 @@ protected:
/* Register supplemental type information in C++ dict */ /* Register supplemental type information in C++ dict */
auto *tinfo = new detail::type_info(); auto *tinfo = new detail::type_info();
tinfo->type = (PyTypeObject *) m_ptr; tinfo->type = (PyTypeObject *) m_ptr;
tinfo->cpptype = rec.type;
tinfo->type_size = rec.type_size; tinfo->type_size = rec.type_size;
tinfo->operator_new = rec.operator_new; tinfo->operator_new = rec.operator_new;
tinfo->init_holder = rec.init_holder; tinfo->init_holder = rec.init_holder;
tinfo->dealloc = rec.dealloc; tinfo->dealloc = rec.dealloc;
tinfo->simple_type = true;
tinfo->simple_ancestors = true;
auto &internals = get_internals(); auto &internals = get_internals();
auto tindex = std::type_index(*rec.type); auto tindex = std::type_index(*rec.type);
@ -825,8 +828,14 @@ protected:
internals.registered_types_cpp[tindex] = tinfo; internals.registered_types_cpp[tindex] = tinfo;
internals.registered_types_py[m_ptr] = tinfo; internals.registered_types_py[m_ptr] = tinfo;
if (rec.bases.size() > 1 || rec.multiple_inheritance) if (rec.bases.size() > 1 || rec.multiple_inheritance) {
mark_parents_nonsimple(tinfo->type); mark_parents_nonsimple(tinfo->type);
tinfo->simple_ancestors = false;
}
else if (rec.bases.size() == 1) {
auto parent_tinfo = get_type_info((PyTypeObject *) rec.bases[0].ptr());
tinfo->simple_ancestors = parent_tinfo->simple_ancestors;
}
} }
/// Helper function which tags all parents of a type using mult. inheritance /// Helper function which tags all parents of a type using mult. inheritance

View File

@ -107,8 +107,16 @@ test_initializer multiple_inheritance_casting([](py::module &m) {
py::class_<I801C, I801B1, I801B2, std::shared_ptr<I801C>>(m, "I801C").def(py::init<>()); py::class_<I801C, I801B1, I801B2, std::shared_ptr<I801C>>(m, "I801C").def(py::init<>());
py::class_<I801D, I801C, std::shared_ptr<I801D>>(m, "I801D").def(py::init<>()); py::class_<I801D, I801C, std::shared_ptr<I801D>>(m, "I801D").def(py::init<>());
// When returned a base class pointer to a derived instance, we cannot assume that the // Two separate issues here: first, we want to recognize a pointer to a base type as being a
// pointer is `reinterpret_cast`able to the derived pointer because the base class // known instance even when the pointer value is unequal (i.e. due to a non-first
// multiple-inheritance base class):
m.def("i801b1_c", [](I801C *c) { return static_cast<I801B1 *>(c); });
m.def("i801b2_c", [](I801C *c) { return static_cast<I801B2 *>(c); });
m.def("i801b1_d", [](I801D *d) { return static_cast<I801B1 *>(d); });
m.def("i801b2_d", [](I801D *d) { return static_cast<I801B2 *>(d); });
// Second, when returned a base class pointer to a derived instance, we cannot assume that the
// pointer is `reinterpret_cast`able to the derived pointer because, like above, the base class
// pointer could be offset. // pointer could be offset.
m.def("i801c_b1", []() -> I801B1 * { return new I801C(); }); m.def("i801c_b1", []() -> I801B1 * { return new I801C(); });
m.def("i801c_b2", []() -> I801B2 * { return new I801C(); }); m.def("i801c_b2", []() -> I801B2 * { return new I801C(); });

View File

@ -112,6 +112,32 @@ def test_mi_dynamic_attributes():
assert d.dynamic == 1 assert d.dynamic == 1
def test_mi_unaligned_base():
"""Returning an offset (non-first MI) base class pointer should recognize the instance"""
from pybind11_tests import I801C, I801D, i801b1_c, i801b2_c, i801b1_d, i801b2_d
n_inst = ConstructorStats.detail_reg_inst()
c = I801C()
d = I801D()
# + 4 below because we have the two instances, and each instance has offset base I801B2
assert ConstructorStats.detail_reg_inst() == n_inst + 4
b1c = i801b1_c(c)
assert b1c is c
b2c = i801b2_c(c)
assert b2c is c
b1d = i801b1_d(d)
assert b1d is d
b2d = i801b2_d(d)
assert b2d is d
assert ConstructorStats.detail_reg_inst() == n_inst + 4 # no extra instances
del c, b1c, b2c
assert ConstructorStats.detail_reg_inst() == n_inst + 2
del d, b1d, b2d
assert ConstructorStats.detail_reg_inst() == n_inst
def test_mi_base_return(): def test_mi_base_return():
"""Tests returning an offset (non-first MI) base class pointer to a derived instance""" """Tests returning an offset (non-first MI) base class pointer to a derived instance"""
from pybind11_tests import (I801B2, I801C, I801D, i801c_b1, i801c_b2, i801d_b1, i801d_b2, from pybind11_tests import (I801B2, I801C, I801D, i801c_b1, i801c_b2, i801d_b1, i801d_b2,
@ -129,7 +155,7 @@ def test_mi_base_return():
assert d1.a == 1 assert d1.a == 1
assert d1.b == 2 assert d1.b == 2
assert ConstructorStats.detail_reg_inst() == n_inst + 2 assert ConstructorStats.detail_reg_inst() == n_inst + 4
c2 = i801c_b2() c2 = i801c_b2()
assert type(c2) is I801C assert type(c2) is I801C
@ -141,10 +167,10 @@ def test_mi_base_return():
assert d2.a == 1 assert d2.a == 1
assert d2.b == 2 assert d2.b == 2
assert ConstructorStats.detail_reg_inst() == n_inst + 4 assert ConstructorStats.detail_reg_inst() == n_inst + 8
del c2 del c2
assert ConstructorStats.detail_reg_inst() == n_inst + 3 assert ConstructorStats.detail_reg_inst() == n_inst + 6
del c1, d1, d2 del c1, d1, d2
assert ConstructorStats.detail_reg_inst() == n_inst assert ConstructorStats.detail_reg_inst() == n_inst