django-anonymizer / anonymizer /

Full commit
from django.db import transaction
from django.db.utils import IntegrityError
from faker import Faker

class DjangoFaker(object):
    """
    Class that provides fake data, using Django specific knowledge to ensure
    acceptable data for Django models.

    Any attribute that is not defined here is looked up on the shared
    ``faker`` instance and wrapped, see ``__getattr__``.
    """
    # One Faker instance, shared by every DjangoFaker.
    faker = Faker()

    def __init__(self):
        # Maps a model field to the set of values that are already taken for
        # it: the values found in the database plus the ones handed out by
        # get_allowed_value().
        self.init_values = {}

    def _prep_init(self, field):
        """
        Cache the values currently stored for ``field`` in
        ``self.init_values``.  Does nothing if they are already cached.
        """
        if field in self.init_values:
            return

        # NOTE(review): the values_list() argument is taken to be the field's
        # own name (one column per row, hence x[0]) - confirm.
        field_vals = set(x[0] for x in field.model._default_manager.values_list(field.name))
        self.init_values[field] = field_vals

    def get_allowed_value(self, source, field):
        """
        Return a value produced by ``source`` that is acceptable for ``field``.

        ``source`` is called without arguments, possibly several times.  If
        the field has a ``max_length`` the value is cut down to it, and if the
        field is ``unique`` the value returned is one that is not yet in
        ``self.init_values[field]``; it is then recorded there.

        Raises ``Exception`` if the first value and 10 further attempts are
        all already in use.
        """
        max_length = getattr(field, 'max_length', None)

        def draw():
            # Enforce max_length.  This is done before the uniqueness test so
            # that the test is made on the value that is actually returned.
            value = source()
            if max_length is not None:
                value = value[:max_length]
            return value

        retval = draw()

        # Enforce unique.  Ensure we don't set the same values, as either
        # any of the existing values, or any of the new ones we make up.
        unique = getattr(field, 'unique', None)
        if unique:
            self._prep_init(field)
            used = self.init_values[field]
            for i in range(10):
                if retval not in used:
                    break
                retval = draw()

            if retval in used:
                raise Exception("Cannot generate unique data for field %s. Last value tried %s" % (field, retval))
            # Remember the value so that it is not handed out a second time.
            used.add(retval)

        return retval

    def __getattr__(self, name):
        """
        Return a callable wrapping the ``faker`` attribute called ``name``.

        The callable accepts an optional ``field`` keyword argument.  When it
        is given (and not None) the result goes through
        ``get_allowed_value``; otherwise the faker attribute is simply called.
        Any other arguments are accepted but not passed on.

        Raises ``AttributeError`` if ``faker`` has no such attribute.
        """
        # we delegate all calls to faker, but add checks.  The lookup is done
        # here rather than inside func, so that a name faker does not have
        # fails on attribute access instead of yielding a bogus callable.
        source = getattr(self.faker, name)

        def func(*args, **kwargs):
            field = kwargs.get('field', None)
            if field is not None:
                return self.get_allowed_value(source, field)
            return source()
        return func

class Anonymizer(object):

   model = None
   # attributes is a dictionary of {attribute_name: replacer}, where replacer is
   # a callable that takes as arguments this Anonymizer instance, the object to
   # be altered, the field to be altered, and the current field value, and
   # returns a replacement value.

   # This signature is designed to be useful for making lambdas that call the
   # 'faker' instance provided on this class, but it can be used with any
   # function.

   attributes = None

   # To impose an order on Anonymizers within a module, this can be set - lower
   # values are done first.
   order = 0

   faker = DjangoFaker()

   def get_query_set(self):
       """
       Returns the QuerySet to be manipulated

       This is the default manager's query set for ``self.model``, ordered by
       'id'.  Raises ``Exception`` if ``model`` has not been set.
       """
       if self.model is None:
           raise Exception("'model' attribute must be set")
       return self.model._default_manager.get_query_set().order_by('id')

   def get_attributes(self):
       """
       Returns the ``attributes`` mapping of this Anonymizer.

       Raises ``Exception`` if ``attributes`` is still None.
       """
       configured = self.attributes
       if configured is not None:
           return configured
       raise Exception("'attributes' attribute must be set")

   def alter_object(self, obj):
       """
       Alters all the attributes in an individual object.

       If it returns False, the object will not be saved

       Every (attribute name, replacer) pair from ``get_attributes()`` is
       passed to ``alter_object_attribute``.  This implementation has no
       return statement, so it returns None.
       """
       attributes = self.get_attributes()
       for attname, replacer in attributes.items():
           self.alter_object_attribute(obj, attname, replacer)

   def alter_object_attribute(self, obj, attname, replacer):
       """
       Alters a single attribute in an object.

       ``replacer`` is called with this Anonymizer, the object, the model
       field named ``attname`` and the current value of the attribute; what
       it returns is set on the object as the new value.
       """
       currentval = getattr(obj, attname)
       # get_field_by_name returns a tuple, the field itself comes first.
       field = obj._meta.get_field_by_name(attname)[0]
       replacement = replacer(self, obj, field, currentval)
       setattr(obj, attname, replacement)

   def run(self):
       for obj in self.get_query_set():
           retval = self.alter_object(obj)
           if retval is not False:
                   sid = transaction.savepoint()
               except IntegrityError:
                   from IPython.Shell import IPShellEmbed; IPShellEmbed([])()