|
@@ -3,62 +3,148 @@
|
|
|
Custom Django Model Fields.
|
|
|
|
|
|
"""
|
|
|
-from django.db import models
|
|
|
-from django.conf import settings
|
|
|
-from celery.serialization import pickle
|
|
|
|
|
|
+from copy import deepcopy
|
|
|
+from base64 import b64encode, b64decode
|
|
|
+from zlib import compress, decompress
|
|
|
+try:
|
|
|
+ from cPickle import loads, dumps
|
|
|
+except ImportError:
|
|
|
+ from pickle import loads, dumps
|
|
|
+
|
|
|
+from django.db import models
|
|
|
+from django.utils.encoding import force_unicode
|
|
|
|
|
|
class PickledObject(str):
|
|
|
- """A subclass of string so it can be told whether a string is
|
|
|
- a pickled object or not (if the object is an instance of this class
|
|
|
- then it must [well, should] be a pickled one)."""
|
|
|
+ """
|
|
|
+ A subclass of string so it can be told whether a string is a pickled
|
|
|
+ object or not (if the object is an instance of this class then it must
|
|
|
+ [well, should] be a pickled one).
|
|
|
+
|
|
|
+ Only really useful for passing pre-encoded values to ``default``
|
|
|
+ with ``dbsafe_encode``, not that doing so is necessary. If you
|
|
|
+ remove PickledObject and its references, you won't be able to pass
|
|
|
+ in pre-encoded values anymore, but you can always just pass in the
|
|
|
+ python objects themselves.
|
|
|
+
|
|
|
+ """
|
|
|
pass
|
|
|
|
|
|
+def dbsafe_encode(value, compress_object=False):
|
|
|
+ """
|
|
|
+ We use deepcopy() here to avoid a problem with cPickle, where dumps
|
|
|
+ can generate different character streams for same lookup value if
|
|
|
+ they are referenced differently.
|
|
|
+
|
|
|
+ The reason this is important is because we do all of our lookups as
|
|
|
+ simple string matches, thus the character streams must be the same
|
|
|
+ for the lookups to work properly. See tests.py for more information.
|
|
|
+ """
|
|
|
+ if not compress_object:
|
|
|
+ value = b64encode(dumps(deepcopy(value)))
|
|
|
+ else:
|
|
|
+ value = b64encode(compress(dumps(deepcopy(value))))
|
|
|
+ return PickledObject(value)
|
|
|
|
|
|
-if settings.DATABASE_ENGINE == "postgresql_psycopg2":
|
|
|
- import psycopg2.extensions
|
|
|
- # register PickledObject as a QuotedString otherwise we will see
|
|
|
- # can't adapt errors from psycopg2.
|
|
|
- psycopg2.extensions.register_adapter(PickledObject,
|
|
|
- psycopg2.extensions.QuotedString)
|
|
|
-
|
|
|
+def dbsafe_decode(value, compress_object=False):
|
|
|
+ if not compress_object:
|
|
|
+ value = loads(b64decode(value))
|
|
|
+ else:
|
|
|
+ value = loads(decompress(b64decode(value)))
|
|
|
+ return value
|
|
|
|
|
|
class PickledObjectField(models.Field):
|
|
|
- """A field that automatically pickles/unpickles its value."""
|
|
|
+ """
|
|
|
+ A field that will accept *any* python object and store it in the
|
|
|
+ database. PickledObjectField will optionally compress it's values if
|
|
|
+ declared with the keyword argument ``compress=True``.
|
|
|
+
|
|
|
+ Does not actually encode and compress ``None`` objects (although you
|
|
|
+ can still do lookups using None). This way, it is still possible to
|
|
|
+ use the ``isnull`` lookup type correctly. Because of this, the field
|
|
|
+ defaults to ``null=True``, as otherwise it wouldn't be able to store
|
|
|
+ None values since they aren't pickled and encoded.
|
|
|
+
|
|
|
+ """
|
|
|
__metaclass__ = models.SubfieldBase
|
|
|
+
|
|
|
+ def __init__(self, *args, **kwargs):
|
|
|
+ self.compress = kwargs.pop('compress', False)
|
|
|
+ self.protocol = kwargs.pop('protocol', 2)
|
|
|
+ kwargs.setdefault('null', True)
|
|
|
+ kwargs.setdefault('editable', False)
|
|
|
+ super(PickledObjectField, self).__init__(*args, **kwargs)
|
|
|
+
|
|
|
+ def get_default(self):
|
|
|
+ """
|
|
|
+ Returns the default value for this field.
|
|
|
+
|
|
|
+ The default implementation on models.Field calls force_unicode
|
|
|
+ on the default, which means you can't set arbitrary Python
|
|
|
+ objects as the default. To fix this, we just return the value
|
|
|
+ without calling force_unicode on it. Note that if you set a
|
|
|
+ callable as a default, the field will still call it. It will
|
|
|
+ *not* try to pickle and encode it.
|
|
|
+
|
|
|
+ """
|
|
|
+ if self.has_default():
|
|
|
+ if callable(self.default):
|
|
|
+ return self.default()
|
|
|
+ return self.default
|
|
|
+ # If the field doesn't have a default, then we punt to models.Field.
|
|
|
+ return super(PickledObjectField, self).get_default()
|
|
|
|
|
|
def to_python(self, value):
|
|
|
- """Convert the database value to a python value."""
|
|
|
- if isinstance(value, PickledObject):
|
|
|
- # If the value is a definite pickle; and an error is
|
|
|
- # raised in de-pickling it should be allowed to propogate.
|
|
|
- return pickle.loads(str(value))
|
|
|
- else:
|
|
|
+ """
|
|
|
+ B64decode and unpickle the object, optionally decompressing it.
|
|
|
+
|
|
|
+ If an error is raised in de-pickling and we're sure the value is
|
|
|
+ a definite pickle, the error is allowed to propogate. If we
|
|
|
+ aren't sure if the value is a pickle or not, then we catch the
|
|
|
+ error and return the original value instead.
|
|
|
+
|
|
|
+ """
|
|
|
+ if value is not None:
|
|
|
try:
|
|
|
- return pickle.loads(str(value))
|
|
|
- except Exception:
|
|
|
- # If an error was raised, just return the plain value
|
|
|
- return value
|
|
|
+ value = dbsafe_decode(value, self.compress)
|
|
|
+ except:
|
|
|
+ # If the value is a definite pickle; and an error is raised in
|
|
|
+ # de-pickling it should be allowed to propogate.
|
|
|
+ if isinstance(value, PickledObject):
|
|
|
+ raise
|
|
|
+ return value
|
|
|
|
|
|
- def get_db_prep_save(self, value):
|
|
|
- """get_db_prep_save"""
|
|
|
+ def get_db_prep_value(self, value):
|
|
|
+ """
|
|
|
+ Pickle and b64encode the object, optionally compressing it.
|
|
|
+
|
|
|
+ The pickling protocol is specified explicitly (by default 2),
|
|
|
+ rather than as -1 or HIGHEST_PROTOCOL, because we don't want the
|
|
|
+ protocol to change over time. If it did, ``exact`` and ``in``
|
|
|
+ lookups would likely fail, since pickle would now be generating
|
|
|
+ a different string.
|
|
|
+
|
|
|
+ """
|
|
|
if value is not None and not isinstance(value, PickledObject):
|
|
|
- value = PickledObject(pickle.dumps(value))
|
|
|
+ # We call force_unicode here explicitly, so that the encoded string
|
|
|
+ # isn't rejected by the postgresql_psycopg2 backend. Alternatively,
|
|
|
+ # we could have just registered PickledObject with the psycopg
|
|
|
+ # marshaller (telling it to store it like it would a string), but
|
|
|
+ # since both of these methods result in the same value being stored,
|
|
|
+ # doing things this way is much easier.
|
|
|
+ value = force_unicode(dbsafe_encode(value, self.compress))
|
|
|
return value
|
|
|
|
|
|
- def get_internal_type(self):
|
|
|
- """The database field type used by this field."""
|
|
|
- return 'TextField'
|
|
|
+ def value_to_string(self, obj):
|
|
|
+ value = self._get_val_from_obj(obj)
|
|
|
+ return self.get_db_prep_value(value)
|
|
|
|
|
|
+ def get_internal_type(self):
|
|
|
+ return 'TextField'
|
|
|
+
|
|
|
def get_db_prep_lookup(self, lookup_type, value):
|
|
|
- """get_db_prep_lookup"""
|
|
|
- if lookup_type == 'exact':
|
|
|
- value = self.get_db_prep_save(value)
|
|
|
- return super(PickledObjectField, self).get_db_prep_lookup(
|
|
|
- lookup_type, value)
|
|
|
- elif lookup_type == 'in':
|
|
|
- value = [self.get_db_prep_save(v) for v in value]
|
|
|
- return super(PickledObjectField, self).get_db_prep_lookup(
|
|
|
- lookup_type, value)
|
|
|
- else:
|
|
|
+ if lookup_type not in ['exact', 'in', 'isnull']:
|
|
|
raise TypeError('Lookup type %s is not supported.' % lookup_type)
|
|
|
+ # The Field model already calls get_db_prep_value before doing the
|
|
|
+ # actual lookup, so all we need to do is limit the lookup types.
|
|
|
+ return super(PickledObjectField, self).get_db_prep_lookup(lookup_type, value)
|