-
-
Notifications
You must be signed in to change notification settings - Fork 181
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Support recursive and empty closure cells (#443)
* Fix #229 * .get still fails when index is unhashable * Cells are not allowed to change before 3.7 * Uncomment test cases if Python > 3.7 * Add more complex test case * Spooky edits at a distance * Wrap in exec to prevent syntax errors in Python 2 * Fix testcase * Test impossible in Py2 * Small correction * Correct the correction * Add Python 2 support * Turn feature on for Python 2 * Prefer function over object when possible * Add changes from review * Turn off test_circular_reference for Python 2 * Reformat and support empty cells * Solve some more versioning issues * Add shim that chooses the correct function at unpickling * Avoid pickling dill._dill * Small correction * This is why dill._dill would try to pickle * Add shim for reference cells * Copy functions for sentinel * Recursive function cells * Turn on test case for Python 3 only * Cell manipulation on PyPy 2.7 * Not possible in PyPy 2.7 * Correctly remove test case * Fix coverage * PyPy 2.7 Attempt 3 * Fix small issue * Clean up _create_cell * Empty cells in PyPy2 * Only two _create_cell functions * Fixes from review * Was probably not a good idea They can probably implement it better for their own use-case or it can be added later. * Split part of Shim into GetAttrShim * Strange issue with exec in PyPy3.6 * Better _shims.py * Rename cell_stack back to postproc It is more flexible and allows for future plans in going to cPickle. * Add _CELL_EMPTY to Python 3 in case it makes cPickle implementation easier * Add postproc_list to _save_with_postproc * Recursive functions and warnings * Better warning messages * Remove words "perfectly" and "would"
- Loading branch information
1 parent
9f3c64c
commit 0392e14
Showing
8 changed files
with
672 additions
and
138 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Large diffs are not rendered by default.
Oops, something went wrong.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,266 @@ | ||
#!/usr/bin/env python | ||
# | ||
# Author: Mike McKerns (mmckerns @caltech and @uqfoundation) | ||
# Author: Anirudh Vegesana ([email protected]) | ||
# Copyright (c) 2021 The Uncertainty Quantification Foundation. | ||
# License: 3-clause BSD. The full license text is available at: | ||
# - https://github.com/uqfoundation/dill/blob/master/LICENSE | ||
""" | ||
Provides shims for compatibility between versions of dill and Python. | ||
Compatibility shims should be provided in this file. Here are two simple example | ||
use cases. | ||
Deprecation of constructor function: | ||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ||
Assume that we were transitioning _import_module in _dill.py to | ||
the builtin function importlib.import_module when present. | ||
@move_to(_dill) | ||
def _import_module(import_name): | ||
... # code already in _dill.py | ||
_import_module = Getattr(importlib, 'import_module', Getattr(_dill, '_import_module', None)) | ||
The code will attempt to find import_module in the importlib module. If not | ||
present, it will use the _import_module function in _dill. | ||
Emulate new Python behavior in older Python versions: | ||
~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ | ||
CellType.cell_contents behaves differently in Python 3.6 and 3.7. It is | ||
read-only in Python 3.6 and writable and deletable in 3.7. | ||
if _dill.OLD37 and _dill.HAS_CTYPES and ...: | ||
@move_to(_dill) | ||
def _setattr(object, name, value): | ||
if type(object) is _dill.CellType and name == 'cell_contents': | ||
_PyCell_Set.argtypes = (ctypes.py_object, ctypes.py_object) | ||
_PyCell_Set(object, value) | ||
else: | ||
setattr(object, name, value) | ||
... # more cases below | ||
_setattr = Getattr(_dill, '_setattr', setattr) | ||
_dill._setattr will be used when present to emulate Python 3.7 functionality in | ||
older versions of Python while defaulting to the standard setattr in 3.7+. | ||
See this PR for the discussion that led to this system: | ||
https://github.com/uqfoundation/dill/pull/443 | ||
""" | ||
|
||
import inspect, sys | ||
|
||
# Look up the already-imported dill._dill module in sys.modules rather than
# importing it here; this raises KeyError if dill._dill has not been loaded yet.
# NOTE(review): presumably done to avoid a circular import -- confirm.
_dill = sys.modules['dill._dill']
|
||
|
||
class Reduce(object):
    """
    Reduce objects are wrappers used for compatibility enforcement during
    unpickle-time. They should only be used in calls to pickler.save and
    other Reduce objects. They are only evaluated within unpickler.load.

    Pickling a Reduce object makes the two implementations equivalent:

        pickler.save(Reduce(*reduction))

        pickler.save_reduce(*reduction, obj=reduction)
    """
    __slots__ = ['reduction']

    def __new__(cls, *reduction, **kwargs):
        """
        Args:
            *reduction: a tuple that matches the format given here:
              https://docs.python.org/3/library/pickle.html#object.__reduce__
            is_callable: a bool to indicate that the object created by
              unpickling `reduction` is callable. If true, the current Reduce
              is allowed to be used as the function in further save_reduce calls
              or Reduce objects.

        Raises:
            TypeError: if a keyword argument other than `is_callable` is given.
        """
        # **kwargs emulates a keyword-only argument, which pleases Py2. Can be
        # removed later.
        is_callable = kwargs.pop('is_callable', False)
        if kwargs:
            # Reject misspelled options instead of silently building a
            # non-callable Reduce.
            raise TypeError(
                'Reduce() got unexpected keyword argument(s): %s'
                % ', '.join(sorted(kwargs))
            )
        if is_callable:
            self = object.__new__(_CallableReduce)
        else:
            self = object.__new__(Reduce)
        self.reduction = reduction
        return self

    def __repr__(self):
        return 'Reduce%s' % (self.reduction,)

    # Copying returns the very same object; no new Reduce is created.
    def __copy__(self):
        return self # pragma: no cover

    def __deepcopy__(self, memo):
        return self # pragma: no cover

    def __reduce__(self):
        # The wrapped tuple is handed to the pickler as this object's own
        # reduction, so unpickling yields the reduction's result rather than
        # a Reduce instance.
        return self.reduction

    def __reduce_ex__(self, protocol):
        # The same reduction is used for every pickle protocol.
        return self.__reduce__()
|
||
class _CallableReduce(Reduce):
    # Callable flavour of Reduce. It lets pickler.save_reduce accept a Reduce
    # that stands in for a function as if it were a meaningful function itself.
    def __call__(self, *args, **kwargs):
        # Rebuild the wrapped object from the first two items of the reduction
        # (constructor and its argument tuple), then forward the call to it.
        reduced = self.__reduce__()
        rebuilt = reduced[0](*reduced[1])
        return rebuilt(*args, **kwargs)
|
||
# Temporary module-level name for the "no default supplied" marker; it is
# attached to Getattr below and then removed from the module namespace.
__NO_DEFAULT = _dill.Sentinel('Getattr.NO_DEFAULT')


def Getattr(object, name, default=__NO_DEFAULT):
    """
    Build a Reduce object standing for a deferred getattr call. When it is
    unpickled, attribute 'name' of 'object' is looked up and its value is the
    result. If the attribute is missing, the default value is returned when
    one was supplied.

    Each Getattr call below is equivalent to the Reduce call in the same
    position of the second group:

        Getattr(collections, 'OrderedDict')
        Getattr(collections, 'spam', None)
        Getattr(*args)

        Reduce(getattr, (collections, 'OrderedDict'))
        Reduce(getattr, (collections, 'spam', None))
        Reduce(getattr, args)

    During unpickling, the first two produce collections.OrderedDict and None
    respectively: the first attribute exists, while the second does not, so
    the default given as the third argument is used.
    """
    # Only forward a default to getattr when the caller actually gave one.
    getattr_args = (
        (object, name) if default is Getattr.NO_DEFAULT
        else (object, name, default)
    )
    return Reduce(getattr, getattr_args, is_callable=callable(default))


Getattr.NO_DEFAULT = __NO_DEFAULT
del __NO_DEFAULT
|
||
def move_to(module, name=None):
    """
    Return a decorator that installs the decorated function into `module`.

    The function is stored in the module's namespace under `name` (or under
    its own __name__ when `name` is None), its __module__ is set to the
    module's name, and the function itself is returned unchanged.
    """
    def decorator(func):
        target_name = func.__name__ if name is None else name
        module.__dict__[target_name] = func
        func.__module__ = module.__name__
        return func
    return decorator
|
||
###################### | ||
## Compatibility Shims are defined below | ||
###################### | ||
|
||
# Reduce object that evaluates getattr(_dill, '_CELL_EMPTY', None) when
# unpickled: the _CELL_EMPTY attribute of _dill, or None if _dill has none.
_CELL_EMPTY = Getattr(_dill, '_CELL_EMPTY', None)
|
||
# CellType.cell_contents is read-only before Python 3.7. On those versions,
# install _setattr/_delattr replacements into _dill that can also assign to or
# empty a cell, and otherwise fall back to the builtin setattr/delattr.
if _dill.OLD37:
    if _dill.HAS_CTYPES and hasattr(_dill.ctypes, 'pythonapi') and hasattr(_dill.ctypes.pythonapi, 'PyCell_Set'):
        # CPython
        ctypes = _dill.ctypes

        _PyCell_Set = ctypes.pythonapi.PyCell_Set

        @move_to(_dill)
        def _setattr(object, name, value):
            if type(object) is _dill.CellType and name == 'cell_contents':
                # Write the cell through the C API; both arguments are passed
                # as Python objects.
                _PyCell_Set.argtypes = (ctypes.py_object, ctypes.py_object)
                _PyCell_Set(object, value)
            else:
                setattr(object, name, value)

        @move_to(_dill)
        def _delattr(object, name):
            if type(object) is _dill.CellType and name == 'cell_contents':
                # Declaring the value as c_void_p lets None be passed as a
                # NULL pointer, which empties the cell.
                _PyCell_Set.argtypes = (ctypes.py_object, ctypes.c_void_p)
                _PyCell_Set(object, None)
            else:
                delattr(object, name)

    # General Python (not CPython) up to 3.6 is in a weird case, where it is
    # possible to pickle recursive cells, but we can't assign directly to the
    # cell.
    elif _dill.PY3:
        # Use nonlocal variables to reassign the cell value.
        # https://stackoverflow.com/a/59276835
        # The functions are built with exec because the nonlocal keyword is a
        # syntax error in Python 2, which also has to be able to parse this
        # file.
        __nonlocal = ('nonlocal cell',)
        exec('''def _setattr(cell, name, value):
            if type(cell) is _dill.CellType and name == 'cell_contents':
                def cell_setter(value):
                    %s
                    cell = value # pylint: disable=unused-variable
                func = _dill.FunctionType(cell_setter.__code__, globals(), "", None, (cell,)) # same as cell_setter, but with cell being the cell's contents
                func(value)
            else:
                setattr(cell, name, value)''' % __nonlocal)
        move_to(_dill)(_setattr)

        # Reading cell_contents first detects a cell that is already empty, in
        # which case there is nothing to delete. Only ValueError (the error an
        # empty cell raises) is treated as "empty"; a bare except would also
        # hide KeyboardInterrupt and unrelated failures.
        exec('''def _delattr(cell, name):
            if type(cell) is _dill.CellType and name == 'cell_contents':
                try:
                    cell.cell_contents
                except ValueError:
                    return
                def cell_deleter():
                    %s
                    del cell # pylint: disable=unused-variable
                func = _dill.FunctionType(cell_deleter.__code__, globals(), "", None, (cell,)) # same as cell_deleter, but with cell being the cell's contents
                func()
            else:
                delattr(cell, name)''' % __nonlocal)
        move_to(_dill)(_delattr)

    else:
        # Likely PyPy 2.7. Simulate the nonlocal keyword with bytecode
        # manipulation.

        # The following function is based on 'cell_set' from 'cloudpickle'
        # https://github.com/cloudpipe/cloudpickle/blob/5d89947288a18029672596a4d719093cc6d5a412/cloudpickle/cloudpickle.py#L393-L482
        # Copyright (c) 2012, Regents of the University of California.
        # Copyright (c) 2009 `PiCloud, Inc. <http://www.picloud.com>`_.
        # License: https://github.com/cloudpipe/cloudpickle/blob/master/LICENSE
        @move_to(_dill)
        def _setattr(cell, name, value):
            if type(cell) is _dill.CellType and name == 'cell_contents':
                # Bind the template code to the target cell as its closure, so
                # that the assignment inside the template writes to that cell.
                _cell_set = _dill.FunctionType(
                    _cell_set_template_code, {}, '_cell_set', (), (cell,),)
                _cell_set(value)
            else:
                setattr(cell, name, value)

        def _cell_set_factory(value):
            # The unused lambda references `cell`, which makes `cell` a cell
            # variable of this function.
            lambda: cell
            cell = value

        co = _cell_set_factory.__code__

        # Copy of the factory's code object with its cell variables moved to
        # the free-variable slot, so the cell is supplied by the caller's
        # closure instead of being created locally.
        _cell_set_template_code = _dill.CodeType(
            co.co_argcount,
            co.co_nlocals,
            co.co_stacksize,
            co.co_flags,
            co.co_code,
            co.co_consts,
            co.co_names,
            co.co_varnames,
            co.co_filename,
            co.co_name,
            co.co_firstlineno,
            co.co_lnotab,
            co.co_cellvars,  # co_freevars is initialized with co_cellvars
            (),  # co_cellvars is made empty
        )

        del co

        @move_to(_dill)
        def _delattr(cell, name):
            if type(cell) is _dill.CellType and name == 'cell_contents':
                # Deleting a cell's contents is not implemented on this
                # branch; the request is silently ignored.
                pass
            else:
                delattr(cell, name)
|
||
# Rebind the module-level names to Reduce objects that are resolved at
# unpickling time: use _dill._setattr / _dill._delattr when _dill defines them,
# otherwise fall back to the builtin setattr / delattr.
_setattr = Getattr(_dill, '_setattr', setattr)
_delattr = Getattr(_dill, '_delattr', delattr)
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Oops, something went wrong.