-
-
Notifications
You must be signed in to change notification settings - Fork 32k
gh-92888: Fix memoryview bad __index__
use after free
#92946
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from 10 commits
73ffb29
3581de7
43c66d6
18b921f
2f3c04f
a250b02
c818990
42a706c
b650764
47bd91f
6890713
d3edf74
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -545,6 +545,104 @@ def test_pickle(self): | |
with self.assertRaises(TypeError): | ||
pickle.dumps(m, proto) | ||
|
||
def test_use_released_memory(self): | ||
size = 128 | ||
def release(): | ||
m.release() | ||
nonlocal ba | ||
ba = bytearray(size) | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. That's useless, no? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. No, we need it for tests below that tests indexing into There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. We allocate a bytearray of the same size as the bytearray just released in memoryview in hope that it will be allocated at the same memory. It helps to check that we do nor read/write a freed memory. |
||
class MyIndex: | ||
def __index__(self): | ||
release() | ||
return 4 | ||
class MyFloat: | ||
def __float__(self): | ||
release() | ||
return 4.25 | ||
class MyBool: | ||
def __bool__(self): | ||
release() | ||
return True | ||
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)) | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. In my PR, I tried to make the code more generic to test more cases: https://github.com/python/cpython/pull/93127/files#diff-d41c6bb40a1e03fea5a20d15c4077413e0ddde65651147922b625b03a66a2f16R399:
|
||
with self.assertRaises(ValueError): | ||
m[MyIndex()] | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. This test is very long. Can you try to factorize similar code and use loop with subTest(), and put pack operations in one test method and unpack in another test method? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Then we will need to duplicate the definitions of internal classes. The tested code is so different, that it is difficult to use a loop. And I think that the result will be more complicated. |
||
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)) | ||
self.assertEqual(list(m[:MyIndex()]), [255] * 4) | ||
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)) | ||
self.assertEqual(list(m[MyIndex():8]), [255] * 4) | ||
|
||
Fidget-Spinner marked this conversation as resolved.
Show resolved
Hide resolved
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)).cast('B', (64, 2)) | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[MyIndex(), 0] | ||
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)).cast('B', (2, 64)) | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[0, MyIndex()] | ||
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)) | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[MyIndex()] = 42 | ||
self.assertEqual(ba[:8], b'\0'*8) | ||
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)) | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[:MyIndex()] = b'spam' | ||
self.assertEqual(ba[:8], b'\0'*8) | ||
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)) | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[MyIndex():8] = b'spam' | ||
self.assertEqual(ba[:8], b'\0'*8) | ||
|
||
Fidget-Spinner marked this conversation as resolved.
Show resolved
Hide resolved
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)).cast('B', (64, 2)) | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[MyIndex(), 0] = 42 | ||
self.assertEqual(ba[8:16], b'\0'*8) | ||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)).cast('B', (2, 64)) | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[0, MyIndex()] = 42 | ||
self.assertEqual(ba[:8], b'\0'*8) | ||
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)) | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[0] = MyIndex() | ||
self.assertEqual(ba[:8], b'\0'*8) | ||
|
||
for fmt in 'bhilqnBHILQN': | ||
with self.subTest(fmt=fmt): | ||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)).cast(fmt) | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[0] = MyIndex() | ||
self.assertEqual(ba[:8], b'\0'*8) | ||
|
||
for fmt in 'fd': | ||
with self.subTest(fmt=fmt): | ||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)).cast(fmt) | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[0] = MyFloat() | ||
self.assertEqual(ba[:8], b'\0'*8) | ||
|
||
ba = None | ||
m = memoryview(bytearray(b'\xff'*size)).cast('?') | ||
with self.assertRaisesRegex(ValueError, "operation forbidden"): | ||
m[0] = MyBool() | ||
self.assertEqual(ba[:8], b'\0'*8) | ||
|
||
if __name__ == "__main__": | ||
unittest.main() |
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,2 @@ | ||
Fix ``memoryview`` use after free when accessing the backing buffer in certain cases. | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. I propose to mention more explicitly that the protection is about released views:
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Not always an exception is raised. The bug was in reading or wring the freed memory. Now it is prevented -- you either get an exception or free the memory after reading. @Fidget-Spinner's description is more correct. I am going to address such inconsistency in a separate issue. |
||
|
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -381,8 +381,9 @@ copy_rec(const Py_ssize_t *shape, Py_ssize_t ndim, Py_ssize_t itemsize, | |
|
||
/* Faster copying of one-dimensional arrays. */ | ||
static int | ||
copy_single(const Py_buffer *dest, const Py_buffer *src) | ||
copy_single(PyMemoryViewObject *self, const Py_buffer *dest, const Py_buffer *src) | ||
{ | ||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Can you move the check after the equiv_structure() test? There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Would not access to Py_buffer of the released object cause reading after free? |
||
char *mem = NULL; | ||
|
||
assert(dest->ndim == 1); | ||
|
@@ -1677,7 +1678,7 @@ pylong_as_zu(PyObject *item) | |
module syntax. This function is very sensitive to small changes. With this | ||
layout gcc automatically generates a fast jump table. */ | ||
static inline PyObject * | ||
unpack_single(const char *ptr, const char *fmt) | ||
unpack_single(PyMemoryViewObject *self, const char *ptr, const char *fmt) | ||
{ | ||
unsigned long long llu; | ||
unsigned long lu; | ||
|
@@ -1689,6 +1690,8 @@ unpack_single(const char *ptr, const char *fmt) | |
unsigned char uc; | ||
void *p; | ||
|
||
CHECK_RELEASED(self); /* See gh-92888 for why we need this here */ | ||
Fidget-Spinner marked this conversation as resolved.
Show resolved
Hide resolved
|
||
|
||
switch (fmt[0]) { | ||
|
||
/* signed integers and fast path for 'B' */ | ||
|
@@ -1767,7 +1770,7 @@ unpack_single(const char *ptr, const char *fmt) | |
/* Pack a single item. 'fmt' can be any native format character in | ||
struct module syntax. */ | ||
static int | ||
pack_single(char *ptr, PyObject *item, const char *fmt) | ||
pack_single(PyMemoryViewObject *self, char *ptr, PyObject *item, const char *fmt) | ||
{ | ||
unsigned long long llu; | ||
unsigned long lu; | ||
|
@@ -1778,12 +1781,15 @@ pack_single(char *ptr, PyObject *item, const char *fmt) | |
double d; | ||
void *p; | ||
|
||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
Fidget-Spinner marked this conversation as resolved.
Show resolved
Hide resolved
|
||
|
||
switch (fmt[0]) { | ||
/* signed integers */ | ||
case 'b': case 'h': case 'i': case 'l': | ||
ld = pylong_as_ld(item); | ||
if (ld == -1 && PyErr_Occurred()) | ||
goto err_occurred; | ||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
switch (fmt[0]) { | ||
case 'b': | ||
if (ld < SCHAR_MIN || ld > SCHAR_MAX) goto err_range; | ||
|
@@ -1804,6 +1810,7 @@ pack_single(char *ptr, PyObject *item, const char *fmt) | |
lu = pylong_as_lu(item); | ||
if (lu == (unsigned long)-1 && PyErr_Occurred()) | ||
goto err_occurred; | ||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
switch (fmt[0]) { | ||
case 'B': | ||
if (lu > UCHAR_MAX) goto err_range; | ||
|
@@ -1824,12 +1831,14 @@ pack_single(char *ptr, PyObject *item, const char *fmt) | |
lld = pylong_as_lld(item); | ||
if (lld == -1 && PyErr_Occurred()) | ||
goto err_occurred; | ||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
PACK_SINGLE(ptr, lld, long long); | ||
break; | ||
case 'Q': | ||
llu = pylong_as_llu(item); | ||
if (llu == (unsigned long long)-1 && PyErr_Occurred()) | ||
goto err_occurred; | ||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
PACK_SINGLE(ptr, llu, unsigned long long); | ||
break; | ||
|
||
|
@@ -1838,12 +1847,14 @@ pack_single(char *ptr, PyObject *item, const char *fmt) | |
zd = pylong_as_zd(item); | ||
if (zd == -1 && PyErr_Occurred()) | ||
goto err_occurred; | ||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
PACK_SINGLE(ptr, zd, Py_ssize_t); | ||
break; | ||
case 'N': | ||
zu = pylong_as_zu(item); | ||
if (zu == (size_t)-1 && PyErr_Occurred()) | ||
goto err_occurred; | ||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
PACK_SINGLE(ptr, zu, size_t); | ||
break; | ||
|
||
|
@@ -1852,6 +1863,7 @@ pack_single(char *ptr, PyObject *item, const char *fmt) | |
d = PyFloat_AsDouble(item); | ||
if (d == -1.0 && PyErr_Occurred()) | ||
goto err_occurred; | ||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
if (fmt[0] == 'f') { | ||
PACK_SINGLE(ptr, d, float); | ||
} | ||
|
@@ -1865,6 +1877,7 @@ pack_single(char *ptr, PyObject *item, const char *fmt) | |
ld = PyObject_IsTrue(item); | ||
if (ld < 0) | ||
return -1; /* preserve original error */ | ||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
PACK_SINGLE(ptr, ld, _Bool); | ||
break; | ||
|
||
|
@@ -1882,6 +1895,7 @@ pack_single(char *ptr, PyObject *item, const char *fmt) | |
p = PyLong_AsVoidPtr(item); | ||
if (p == NULL && PyErr_Occurred()) | ||
goto err_occurred; | ||
CHECK_RELEASED_INT(self); /* See gh-92888 for why we need this here */ | ||
PACK_SINGLE(ptr, p, void *); | ||
break; | ||
|
||
|
@@ -2048,7 +2062,7 @@ adjust_fmt(const Py_buffer *view) | |
|
||
/* Base case for multi-dimensional unpacking. Assumption: ndim == 1. */ | ||
static PyObject * | ||
tolist_base(const char *ptr, const Py_ssize_t *shape, | ||
tolist_base(PyMemoryViewObject *self, const char *ptr, const Py_ssize_t *shape, | ||
const Py_ssize_t *strides, const Py_ssize_t *suboffsets, | ||
const char *fmt) | ||
{ | ||
|
@@ -2061,7 +2075,7 @@ tolist_base(const char *ptr, const Py_ssize_t *shape, | |
|
||
for (i = 0; i < shape[0]; ptr+=strides[0], i++) { | ||
const char *xptr = ADJUST_PTR(ptr, suboffsets, 0); | ||
item = unpack_single(xptr, fmt); | ||
item = unpack_single(self, xptr, fmt); | ||
if (item == NULL) { | ||
Py_DECREF(lst); | ||
return NULL; | ||
|
@@ -2075,7 +2089,7 @@ tolist_base(const char *ptr, const Py_ssize_t *shape, | |
/* Unpack a multi-dimensional array into a nested list. | ||
Assumption: ndim >= 1. */ | ||
static PyObject * | ||
tolist_rec(const char *ptr, Py_ssize_t ndim, const Py_ssize_t *shape, | ||
tolist_rec(PyMemoryViewObject *self, const char *ptr, Py_ssize_t ndim, const Py_ssize_t *shape, | ||
const Py_ssize_t *strides, const Py_ssize_t *suboffsets, | ||
const char *fmt) | ||
{ | ||
|
@@ -2087,15 +2101,15 @@ tolist_rec(const char *ptr, Py_ssize_t ndim, const Py_ssize_t *shape, | |
assert(strides != NULL); | ||
|
||
if (ndim == 1) | ||
return tolist_base(ptr, shape, strides, suboffsets, fmt); | ||
return tolist_base(self, ptr, shape, strides, suboffsets, fmt); | ||
|
||
lst = PyList_New(shape[0]); | ||
if (lst == NULL) | ||
return NULL; | ||
|
||
for (i = 0; i < shape[0]; ptr+=strides[0], i++) { | ||
const char *xptr = ADJUST_PTR(ptr, suboffsets, 0); | ||
item = tolist_rec(xptr, ndim-1, shape+1, | ||
item = tolist_rec(self, xptr, ndim-1, shape+1, | ||
strides+1, suboffsets ? suboffsets+1 : NULL, | ||
fmt); | ||
if (item == NULL) { | ||
|
@@ -2129,15 +2143,15 @@ memoryview_tolist_impl(PyMemoryViewObject *self) | |
if (fmt == NULL) | ||
return NULL; | ||
if (view->ndim == 0) { | ||
return unpack_single(view->buf, fmt); | ||
return unpack_single(self, view->buf, fmt); | ||
} | ||
else if (view->ndim == 1) { | ||
return tolist_base(view->buf, view->shape, | ||
return tolist_base(self, view->buf, view->shape, | ||
view->strides, view->suboffsets, | ||
fmt); | ||
} | ||
else { | ||
return tolist_rec(view->buf, view->ndim, view->shape, | ||
return tolist_rec(self, view->buf, view->ndim, view->shape, | ||
view->strides, view->suboffsets, | ||
fmt); | ||
} | ||
|
@@ -2345,7 +2359,7 @@ memory_item(PyMemoryViewObject *self, Py_ssize_t index) | |
char *ptr = ptr_from_index(view, index); | ||
if (ptr == NULL) | ||
return NULL; | ||
return unpack_single(ptr, fmt); | ||
return unpack_single(self, ptr, fmt); | ||
} | ||
|
||
PyErr_SetString(PyExc_NotImplementedError, | ||
|
@@ -2376,7 +2390,7 @@ memory_item_multi(PyMemoryViewObject *self, PyObject *tup) | |
ptr = ptr_from_tuple(view, tup); | ||
if (ptr == NULL) | ||
return NULL; | ||
return unpack_single(ptr, fmt); | ||
return unpack_single(self, ptr, fmt); | ||
} | ||
|
||
static inline int | ||
|
@@ -2463,7 +2477,7 @@ memory_subscript(PyMemoryViewObject *self, PyObject *key) | |
const char *fmt = adjust_fmt(view); | ||
if (fmt == NULL) | ||
return NULL; | ||
return unpack_single(view->buf, fmt); | ||
return unpack_single(self, view->buf, fmt); | ||
} | ||
else if (key == Py_Ellipsis) { | ||
Py_INCREF(self); | ||
|
@@ -2538,7 +2552,7 @@ memory_ass_sub(PyMemoryViewObject *self, PyObject *key, PyObject *value) | |
if (key == Py_Ellipsis || | ||
(PyTuple_Check(key) && PyTuple_GET_SIZE(key)==0)) { | ||
ptr = (char *)view->buf; | ||
return pack_single(ptr, value, fmt); | ||
return pack_single(self, ptr, value, fmt); | ||
} | ||
else { | ||
PyErr_SetString(PyExc_TypeError, | ||
|
@@ -2560,7 +2574,7 @@ memory_ass_sub(PyMemoryViewObject *self, PyObject *key, PyObject *value) | |
ptr = ptr_from_index(view, index); | ||
if (ptr == NULL) | ||
return -1; | ||
return pack_single(ptr, value, fmt); | ||
return pack_single(self, ptr, value, fmt); | ||
} | ||
/* one-dimensional: fast path */ | ||
if (PySlice_Check(key) && view->ndim == 1) { | ||
|
@@ -2583,7 +2597,7 @@ memory_ass_sub(PyMemoryViewObject *self, PyObject *key, PyObject *value) | |
goto end_block; | ||
dest.len = dest.shape[0] * dest.itemsize; | ||
|
||
ret = copy_single(&dest, &src); | ||
ret = copy_single(self, &dest, &src); | ||
|
||
end_block: | ||
PyBuffer_Release(&src); | ||
|
@@ -2599,7 +2613,7 @@ memory_ass_sub(PyMemoryViewObject *self, PyObject *key, PyObject *value) | |
ptr = ptr_from_tuple(view, key); | ||
if (ptr == NULL) | ||
return -1; | ||
return pack_single(ptr, value, fmt); | ||
return pack_single(self, ptr, value, fmt); | ||
} | ||
if (PySlice_Check(key) || is_multislice(key)) { | ||
/* Call memory_subscript() to produce a sliced lvalue, then copy | ||
|
@@ -3200,7 +3214,7 @@ memoryiter_next(memoryiterobject *it) | |
if (ptr == NULL) { | ||
return NULL; | ||
} | ||
return unpack_single(ptr, it->it_fmt); | ||
return unpack_single(seq, ptr, it->it_fmt); | ||
} | ||
|
||
it->it_seq = NULL; | ||
|
Uh oh!
There was an error while loading. Please reload this page.