* src/plugins/Check.py: add remove empty objects. This needs testing...

2007-10-03 Benny Malengier <benny.malengier@gramps-project.org> 


svn: r9072
This commit is contained in:
Benny Malengier 2007-10-03 21:56:05 +00:00
parent c195fa2b29
commit 82042ed16e
2 changed files with 175 additions and 7 deletions

View File

@ -1,3 +1,6 @@
2007-10-03 Benny Malengier <benny.malengier@gramps-project.org>
* src/plugins/Check.py: add remove empty objects. This needs testing...
2007-10-03 Benny Malengier <benny.malengier@gramps-project.org> 2007-10-03 Benny Malengier <benny.malengier@gramps-project.org>
* src/GrampsDb/_GrampsDbBase.py: copy bookmark list, don't reference * src/GrampsDb/_GrampsDbBase.py: copy bookmark list, don't reference
* src/GrampsDb/_ReadXML.py: only add bookmarks if not present already, #1187 * src/GrampsDb/_ReadXML.py: only add bookmarks if not present already, #1187

View File

@ -170,6 +170,8 @@ class Check(Tool.BatchTool):
prev_total = -1 prev_total = -1
total = 0 total = 0
#start with empty objects, broken links can be corrected below then
checker.cleanup_empty_objects()
while prev_total != total: while prev_total != total:
prev_total = total prev_total = total
@ -219,6 +221,14 @@ class CheckIntegrity:
self.invalid_source_references = [] self.invalid_source_references = []
self.invalid_repo_references = [] self.invalid_repo_references = []
self.removed_name_format = [] self.removed_name_format = []
self.empty_objects = {'persons' : [],
'families': [],
'events' : [],
'sources' : [],
'media' : [],
'places' : [],
'repos' : [],
}
self.progress = Utils.ProgressMeter(_('Checking database'),'') self.progress = Utils.ProgressMeter(_('Checking database'),'')
def family_errors(self): def family_errors(self):
@ -545,13 +555,127 @@ class CheckIntegrity:
elif missmedia_action == 3: elif missmedia_action == 3:
select_clicked() select_clicked()
self.progress.step() self.progress.step()
def cleanup_empty_objects(self):
#the position of the change column in the primary objects
CHANGE_PERSON = 17
CHANGE_FAMILY = 12
CHANGE_EVENT = 10
CHANGE_SOURCE = 8
CHANGE_PLACE = 11
CHANGE_MEDIA = 8
# REPOS CHANGE ONLY ADDED IN VERSION >= 3.0
CHANGE_REPOS = None
empty_person_data = RelLib.Person().serialize()
empty_family_data = RelLib.Family().serialize()
empty_event_data = RelLib.Event().serialize()
empty_source_data = RelLib.Source().serialize()
empty_place_data = RelLib.Place().serialize()
empty_media_data = RelLib.MediaObject().serialize()
empty_repos_data = RelLib.Repository().serialize()
tables = {
'persons' : {'get_func': self.db.get_person_from_handle,
'cursor_func': self.db.get_person_cursor,
'total_func' : self.db.get_number_of_people,
'progress' : _('Looking for empty people records'),
'check_func' : lambda x : self._check_empty(x,
empty_person_data,
CHANGE_PERSON),
'remove' : self.db.remove_person},
'families': {'get_func': self.db.get_family_from_handle,
'cursor_func': self.db.get_family_cursor,
'total_func' : self.db.get_number_of_families,
'progress' : _('Looking for empty family records'),
'check_func' : lambda x : self._check_empty(x,
empty_family_data,
CHANGE_FAMILY),
'remove' : self.db.remove_family},
'events' : {'get_func': self.db.get_event_from_handle,
'cursor_func': self.db.get_event_cursor,
'total_func' : self.db.get_number_of_events,
'progress' : _('Looking for empty event records'),
'check_func' : lambda x : self._check_empty(x,
empty_event_data,
CHANGE_EVENT),
'remove' : self.db.remove_event},
'sources' : {'get_func': self.db.get_source_from_handle,
'cursor_func': self.db.get_source_cursor,
'total_func' : self.db.get_number_of_sources,
'progress' : _('Looking for empty source records'),
'check_func' : lambda x : self._check_empty(x,
empty_source_data,
CHANGE_SOURCE),
'remove' : self.db.remove_source},
'places' : {'get_func': self.db.get_place_from_handle,
'cursor_func': self.db.get_place_cursor,
'total_func' : self.db.get_number_of_places,
'progress' : _('Looking for empty place records'),
'check_func' : lambda x : self._check_empty(x,
empty_place_data,
CHANGE_PLACE),
'remove' : self.db.remove_place},
'media' : {'get_func': self.db.get_object_from_handle,
'cursor_func': self.db.get_media_cursor,
'progress' : _('Looking for empty media records'),
'total_func' : self.db.get_number_of_media_objects,
'check_func' : lambda x : self._check_empty(x,
empty_media_data,
CHANGE_MEDIA),
'remove' : self.db.remove_object},
'repos' : {'get_func': self.db.get_repository_from_handle,
'cursor_func': self.db.get_repository_cursor,
'total_func' : self.db.get_number_of_repositories,
'progress' : _('Looking for empty repository records'),
'check_func' : lambda x : self._check_empty(x,
empty_repos_data,
CHANGE_REPOS),
'remove' : self.db.remove_repository},
}
for the_type in tables.keys():
cursor = tables[the_type]['cursor_func']()
total = tables[the_type]['total_func']()
check = tables[the_type]['check_func']
remove_func = tables[the_type]['remove']
self.progress.set_pass(tables[the_type]['progress'],total)
item = cursor.first()
while item:
self.progress.step()
(handle,data) = item
if check(data):
self.empty_objects[the_type].append(handle)
#we cannot remove here as that would destroy cursor
item = cursor.next()
cursor.close()
#now remove
for handle in self.empty_objects[the_type]:
remove_func(handle, self.trans)
def _check_empty(self, data, empty_data, changepos):
"""compare the data with the data of an empty object
change, handle and gramps_id are not compared """
print 'checking'
print data
print empty_data
if changepos is not None:
return (data[2:changepos] == empty_data[2:changepos] and
data[changepos+1:] == empty_data[changepos+1:]
)
else :
return data[2:] == empty_data[2:]
def cleanup_empty_families(self,automatic): def cleanup_empty_families(self,automatic):
fhandle_list = self.db.get_family_handles() fhandle_list = self.db.get_family_handles()
self.progress.set_pass(_('Looking for empty families'), self.progress.set_pass(
len(fhandle_list)) _('Looking for families with no parents or children'),
len(fhandle_list))
for family_handle in fhandle_list: for family_handle in fhandle_list:
self.progress.step() self.progress.step()
@ -886,10 +1010,21 @@ class CheckIntegrity:
source_references = len(self.invalid_source_references) source_references = len(self.invalid_source_references)
repo_references = len(self.invalid_repo_references) repo_references = len(self.invalid_repo_references)
name_format = len(self.removed_name_format) name_format = len(self.removed_name_format)
empty_objs = ( len(self.empty_objects['persons'])
+ len(self.empty_objects['families'])
+ len(self.empty_objects['events'])
+ len(self.empty_objects['sources'])
+ len(self.empty_objects['media'])
+ len(self.empty_objects['places'])
+ len(self.empty_objects['repos'])
)
print 'empty objs:',empty_objs
errors = blink + efam + photos + rel + person + event_invalid\ errors = (photos + efam + blink + plink + slink + rel
+ person_references + place_references + source_references\ + event_invalid + person
+ repo_references + person_references + place_references + source_references
+ repo_references + name_format + empty_objs
)
if errors == 0: if errors == 0:
if cl: if cl:
@ -962,61 +1097,91 @@ class CheckIntegrity:
self.text.write("\t%s\n" % self.empty_family[0]) self.text.write("\t%s\n" % self.empty_family[0])
elif efam > 1: elif efam > 1:
self.text.write(_("%d empty families were found\n") % efam) self.text.write(_("%d empty families were found\n") % efam)
if rel == 1: if rel == 1:
self.text.write(_("1 corrupted family relationship fixed\n")) self.text.write(_("1 corrupted family relationship fixed\n"))
elif rel > 1: elif rel > 1:
self.text.write(_("%d corrupted family relationship fixed\n") % rel) self.text.write(_("%d corrupted family relationship fixed\n") % rel)
if person_references == 1: if person_references == 1:
self.text.write(_("1 person was referenced but not found\n")) self.text.write(_("1 person was referenced but not found\n"))
elif person_references > 1: elif person_references > 1:
self.text.write(_("%d persons were referenced, but not found\n") % person_references) self.text.write(_("%d persons were referenced, but not found\n") % person_references)
if repo_references == 1: if repo_references == 1:
self.text.write(_("1 repository was referenced but not found\n")) self.text.write(_("1 repository was referenced but not found\n"))
elif repo_references > 1: elif repo_references > 1:
self.text.write(_("%d repositories were referenced, but not found\n") % repo_references) self.text.write(_("%d repositories were referenced, but not found\n") % repo_references)
if photos == 1: if photos == 1:
self.text.write(_("1 media object was referenced, but not found\n")) self.text.write(_("1 media object was referenced, but not found\n"))
elif photos > 1: elif photos > 1:
self.text.write(_("%d media objects were referenced, but not found\n") % photos) self.text.write(_("%d media objects were referenced, but not found\n") % photos)
if bad_photos == 1: if bad_photos == 1:
self.text.write(_("Reference to 1 missing media object was kept\n")) self.text.write(_("Reference to 1 missing media object was kept\n"))
elif bad_photos > 1: elif bad_photos > 1:
self.text.write(_("References to %d media objects were kept\n") % bad_photos) self.text.write(_("References to %d media objects were kept\n") % bad_photos)
if replaced_photos == 1: if replaced_photos == 1:
self.text.write(_("1 missing media object was replaced\n")) self.text.write(_("1 missing media object was replaced\n"))
elif replaced_photos > 1: elif replaced_photos > 1:
self.text.write(_("%d missing media objects were replaced\n") % replaced_photos) self.text.write(_("%d missing media objects were replaced\n") % replaced_photos)
if removed_photos == 1: if removed_photos == 1:
self.text.write(_("1 missing media object was removed\n")) self.text.write(_("1 missing media object was removed\n"))
elif removed_photos > 1: elif removed_photos > 1:
self.text.write(_("%d missing media objects were removed\n") % removed_photos) self.text.write(_("%d missing media objects were removed\n") % removed_photos)
if event_invalid == 1: if event_invalid == 1:
self.text.write(_("1 invalid event reference was removed\n")) self.text.write(_("1 invalid event reference was removed\n"))
elif event_invalid > 1: elif event_invalid > 1:
self.text.write(_("%d invalid event references were removed\n") % event_invalid) self.text.write(_("%d invalid event references were removed\n") % event_invalid)
if birth_invalid == 1: if birth_invalid == 1:
self.text.write(_("1 invalid birth event name was fixed\n")) self.text.write(_("1 invalid birth event name was fixed\n"))
elif birth_invalid > 1: elif birth_invalid > 1:
self.text.write(_("%d invalid birth event names were fixed\n") % birth_invalid) self.text.write(_("%d invalid birth event names were fixed\n") % birth_invalid)
if death_invalid == 1: if death_invalid == 1:
self.text.write(_("1 invalid death event name was fixed\n")) self.text.write(_("1 invalid death event name was fixed\n"))
elif death_invalid > 1: elif death_invalid > 1:
self.text.write(_("%d invalid death event names were fixed\n") % death_invalid) self.text.write(_("%d invalid death event names were fixed\n") % death_invalid)
if place_references == 1: if place_references == 1:
self.text.write(_("1 place was referenced but not found\n")) self.text.write(_("1 place was referenced but not found\n"))
elif place_references > 1: elif place_references > 1:
self.text.write(_("%d places were referenced, but not found\n") % place_references) self.text.write(_("%d places were referenced, but not found\n") % place_references)
if source_references == 1: if source_references == 1:
self.text.write(_("1 source was referenced but not found\n")) self.text.write(_("1 source was referenced but not found\n"))
elif source_references > 1: elif source_references > 1:
self.text.write(_("%d sources were referenced, but not found\n") % source_references) self.text.write(_("%d sources were referenced, but not found\n") % source_references)
if name_format == 1: if name_format == 1:
self.text.write(_("1 invalid name format reference was removed\n")) self.text.write(_("1 invalid name format reference was removed\n"))
elif name_format > 1: elif name_format > 1:
self.text.write(_("%d invalid name format references were removed\n") self.text.write(_("%d invalid name format references were removed\n")
% name_format) % name_format)
if empty_objs > 0 :
self.text.write(_("%d empty objects removed:\n"
" %d person objects\n"
" %d family objects\n"
" %d event objects\n"
" %d source objects\n"
" %d media objects\n"
" %d place objects\n"
" %d repository objects\n"
) % (empty_objs,
len(self.empty_objects['persons']),
len(self.empty_objects['families']),
len(self.empty_objects['events']),
len(self.empty_objects['sources']),
len(self.empty_objects['media']),
len(self.empty_objects['places']),
len(self.empty_objects['repos'])
) )
return errors return errors
#------------------------------------------------------------------------- #-------------------------------------------------------------------------