diff options
author | Raymond Hettinger <rhettinger@users.noreply.github.com> | 2019-08-29 16:02:58 (GMT) |
---|---|---|
committer | GitHub <noreply@github.com> | 2019-08-29 16:02:58 (GMT) |
commit | 88ea166dadb8aeb34541a0a464662dea222629e5 (patch) | |
tree | b9645a7bc80d97fb831ad252d467ff649f29b435 | |
parent | 4901fe274bc82b95dc89bcb3de8802a3dfedab32 (diff) | |
download | cpython-88ea166dadb8aeb34541a0a464662dea222629e5.zip cpython-88ea166dadb8aeb34541a0a464662dea222629e5.tar.gz cpython-88ea166dadb8aeb34541a0a464662dea222629e5.tar.bz2 |
bpo-8425: Fast path for set inplace difference when the second set is large (GH-15590)
-rw-r--r-- | Misc/NEWS.d/next/Core and Builtins/2019-08-29-01-55-38.bpo-8425.FTq4A8.rst | 3 | ||||
-rw-r--r-- | Objects/setobject.c | 18 |
2 files changed, 20 insertions, 1 deletions
diff --git a/Misc/NEWS.d/next/Core and Builtins/2019-08-29-01-55-38.bpo-8425.FTq4A8.rst b/Misc/NEWS.d/next/Core and Builtins/2019-08-29-01-55-38.bpo-8425.FTq4A8.rst new file mode 100644 index 0000000..8e5ec0b --- /dev/null +++ b/Misc/NEWS.d/next/Core and Builtins/2019-08-29-01-55-38.bpo-8425.FTq4A8.rst @@ -0,0 +1,3 @@ +Optimize set difference_update for the case when the other set is much +larger than the base set. (Suggested by Evgeny Kapun with code contributed +by Michele Orrù). diff --git a/Objects/setobject.c b/Objects/setobject.c index 56858db..fafc2fa 100644 --- a/Objects/setobject.c +++ b/Objects/setobject.c @@ -1463,9 +1463,25 @@ set_difference_update_internal(PySetObject *so, PyObject *other) setentry *entry; Py_ssize_t pos = 0; + /* Optimization: When the other set is more than 8 times + larger than the base set, replace the other set with + intersection of the two sets. + */ + if ((PySet_GET_SIZE(other) >> 3) > PySet_GET_SIZE(so)) { + other = set_intersection(so, other); + if (other == NULL) + return -1; + } else { + Py_INCREF(other); + } + while (set_next((PySetObject *)other, &pos, &entry)) - if (set_discard_entry(so, entry->key, entry->hash) < 0) + if (set_discard_entry(so, entry->key, entry->hash) < 0) { + Py_DECREF(other); return -1; + } + + Py_DECREF(other); } else { PyObject *key, *it; it = PyObject_GetIter(other); |