conceived and written by rjsparks@nostrum.com, with some additions and adaptation as a management command by henrik@levkowetz.com. This integrity checker, when run on the IETF database in November 2015, seemed to have a factor on the order of 100 better speed and lower memory consumption than the code in https://stackoverflow.com/questions/4734645/is-there-a-tool-to-check-database-integrity-in-django No exact figure is available, as the latter had to be killed when it had taken all available ram (~14G) on the development machine, and started to cause heavy swapping. - Legacy-Id: 10508
72 lines
3.4 KiB
Python
72 lines
3.4 KiB
Python
|
|
import django
|
|
django.setup()
|
|
|
|
from django.core.management.base import BaseCommand #, CommandError
|
|
from django.core.exceptions import FieldError
|
|
from django.db import models
|
|
from django.db.models.fields.related import ForeignKey, OneToOneField
|
|
|
|
class Command(BaseCommand):
|
|
help = "Check all models for referential integrity."
|
|
|
|
def handle(self, *args, **options):
|
|
verbosity = options.get("verbosity", "1")
|
|
verbosity = int(verbosity) if verbosity.isdigit() else 1
|
|
|
|
def check_field(field):
|
|
foreign_model = field.related.parent_model
|
|
if verbosity > 1:
|
|
print " %s -> %s.%s"%(field.name,foreign_model.__module__,foreign_model.__name__),
|
|
used = set(field.model.objects.values_list(field.name,flat=True))
|
|
used.discard(None)
|
|
exists = set(foreign_model.objects.values_list('pk',flat=True))
|
|
if verbosity > 1:
|
|
if used - exists:
|
|
print ' ** Bad key values:',list(used - exists)
|
|
else:
|
|
print 'ok'
|
|
else:
|
|
if used - exists:
|
|
print '%s.%s.%s->%s.%s Bad key values:'%(model.__module__,model.__name__,field.name,foreign_model.__module__,foreign_model.__name__),list(used - exists)
|
|
|
|
def check_reverse_field(field):
|
|
foreign_model = field.related.parent_model
|
|
if foreign_model == field.model:
|
|
return
|
|
foreign_field_name = field.related.var_name
|
|
foreign_accessor_name = field.related.get_accessor_name()
|
|
if verbosity > 1:
|
|
print " %s.%s.%s -> %s"%(foreign_model.__module__, foreign_model.__name__, foreign_field_name, field.model.__name__),
|
|
try:
|
|
used = set(foreign_model.objects.values_list(foreign_field_name, flat=True))
|
|
except FieldError:
|
|
try:
|
|
used = set(foreign_model.objects.values_list(foreign_accessor_name, flat=True))
|
|
except FieldError:
|
|
print " ** Warning: could not find reverse name for %s.%s -> %s.%s" % (field.model.__module__, field.model.__name__, foreign_model.__name__, foreign_field_name),
|
|
used.discard(None)
|
|
exists = set(field.model.objects.values_list('pk',flat=True))
|
|
if verbosity > 1:
|
|
if used - exists:
|
|
print ' ** Bad key values:\n ',list(used - exists)
|
|
else:
|
|
print ' ok'
|
|
else:
|
|
if used - exists:
|
|
print " %s.%s.%s -> %s.%s ** Bad key values:\n "%(foreign_model.__module__, foreign_model.__name__, foreign_field_name, field.model.__module__, field.model.__name__), list(used - exists)
|
|
|
|
for app in [a for a in models.get_apps() if a.__name__.startswith('ietf.')]:
|
|
if verbosity > 1:
|
|
print "Checking",app.__name__
|
|
for model in models.get_models(app):
|
|
if model._meta.proxy:
|
|
continue
|
|
if verbosity > 1:
|
|
print " %s.%s"%(model.__module__,model.__name__)
|
|
for field in [f for f in model._meta.fields if isinstance(f, (ForeignKey, OneToOneField)) ]:
|
|
check_field(field)
|
|
for field in [f for f in model._meta.many_to_many ]:
|
|
check_field(field)
|
|
check_reverse_field(field)
|