more optimisations to name display.

svn: r7930
This commit is contained in:
Richard Taylor 2007-01-18 16:30:28 +00:00
parent a13e41b57d
commit c0f9fcb160
2 changed files with 110 additions and 76 deletions

View File

@ -1,3 +1,6 @@
2007-01-18 Richard Taylor <rjt-gramps@thegrindstone.me.uk>
* src/NameDisplay.py: yet more optimisations for name display.
2007-01-17 Martin Hawlisch <Martin.Hawlisch@gmx.de> 2007-01-17 Martin Hawlisch <Martin.Hawlisch@gmx.de>
* src/DataViews/_PedigreeView.py: Cache result of probably_alive(); Call * src/DataViews/_PedigreeView.py: Cache result of probably_alive(); Call
find_tree() only once for all sizes; Cache results in FormattingHelper; find_tree() only once for all sizes; Cache results in FormattingHelper;

View File

@ -77,6 +77,7 @@ class NameDisplay:
""" """
format_funcs = {} format_funcs = {}
raw_format_funcs = {}
# FIXME: Is this used anywhere? I cannot see that it is. # FIXME: Is this used anywhere? I cannot see that it is.
sort_field = (Name.get_surname, Name.get_surname, sort_field = (Name.get_surname, Name.get_surname,
@ -114,7 +115,7 @@ class NameDisplay:
raw_data[_FIRSTNAME], raw_data[_FIRSTNAME],
raw_data[_PATRONYM], raw_data[_PATRONYM],
raw_data[_SUFFIX]) raw_data[_SUFFIX])
return ' '.join([ x for x in result.split(" ") if x != '']) return ' '.join(result.split())
def _raw_fnln(self,raw_data): def _raw_fnln(self,raw_data):
result = "%s %s %s %s %s" % (raw_data[_FIRSTNAME], result = "%s %s %s %s %s" % (raw_data[_FIRSTNAME],
@ -122,18 +123,18 @@ class NameDisplay:
raw_data[_PREFIX], raw_data[_PREFIX],
raw_data[_SURNAME], raw_data[_SURNAME],
raw_data[_SUFFIX]) raw_data[_SUFFIX])
return ' '.join([ x for x in result.split(" ") if x != '']) return ' '.join(result.split())
def _raw_ptfn(self,raw_data): def _raw_ptfn(self,raw_data):
result = "%s %s, %s %s" % (raw_data[_PREFIX], result = "%s %s, %s %s" % (raw_data[_PREFIX],
raw_data[_PATRONYM], raw_data[_PATRONYM],
raw_data[_SUFFIX], raw_data[_SUFFIX],
raw_data[_FIRSTNAME]) raw_data[_FIRSTNAME])
return ' '.join([ x for x in result.split(" ") if x != '']) return ' '.join(result.split())
def _raw_fn(self,raw_data): def _raw_fn(self,raw_data):
result = raw_data[_FIRSTNAME] result = raw_data[_FIRSTNAME]
return ' '.join([ x for x in result.split(" ") if x != '']) return ' '.join(result.split())
def set_name_format(self,formats): def set_name_format(self,formats):
raw_func_dict = { raw_func_dict = {
@ -230,74 +231,87 @@ class NameDisplay:
#------------------------------------------------------------------------- #-------------------------------------------------------------------------
def format_str(self,name,format_str):
return self._format_str_base(name.first_name,name.surname,name.prefix,
name.suffix,name.patronymic,name.title,
name.call,format_str)
def format_str_raw(self,raw_data,format_str): def _gen_raw_func(self, format_str):
surname = raw_data[_SURNAME] """The job of building the name from a format string is rather
prefix = raw_data[_PREFIX] expensive and it is called lots and lots of times. So it is worth
first = raw_data[_FIRSTNAME] going to some length to optimise it as much as possible.
patronymic = raw_data[_PATRONYM]
suffix = raw_data[_SUFFIX]
title = raw_data[_TITLE]
call = raw_data[_CALL]
return self._format_str_base(first,surname,prefix,suffix,patronymic,
title,call,format_str)
# def _format_str_base(self,first,surname,prefix,suffix,patronymic, This method constructs a new function that is specifically written
# title,call,format_str): to format a name given a particualar format string. This is worthwhile
# """ because the format string itself rarely changes, so by caching the new
# Generates name from a format string. function and calling it directly when asked to format a name to the
same format string again we can be as quick as possible.
# The following substitutions are made: The new function is of the form:
# %t -> title
# %f -> given name (first name)
# %p -> prefix
# %s -> suffix
# %l -> family name (last name, surname)
# %y -> patronymic
# %c -> call name
# The capital letters are substituted for capitalized name components.
# The %% is substituted with the single % character.
# All the other characters in the fmt_str are unaffected.
# """ def fn(raw_data):
return "%s %s %s %s %s" % (raw_data[_TITLE],
raw_data[_FIRSTNAME],
raw_data[_PREFIX],
raw_data[_SURNAME],
raw_data[_SUFFIX])
# output = format_str """
# output = output.replace("%t",title) # we need the names of each of the variables or methods that are
# output = output.replace("%f",first) # called to fill in each format flag.
# output = output.replace("%p",prefix) d = {"%t":"raw_data[_TITLE]",
# output = output.replace("%l",surname) "%f":"raw_data[_FIRSTNAME]",
# output = output.replace("%s",suffix) "%p":"raw_data[_PREFIX]",
# output = output.replace("%y",patronymic) "%l":"raw_data[_SURNAME]",
# output = output.replace("%c",call) "%s":"raw_data[_SUFFIX]",
"%y":"raw_data[_PATRONYM]",
"%c":"raw_data[_CALL]",
"%T":"raw_data[_TITLE].upper()",
"%F":"raw_data[_FIRSTNAME].upper()",
"%P":"raw_data[_PREFIX].upper()",
"%L":"raw_data[_SURNAME].upper()",
"%S":"raw_data[_SUFFIX].upper()",
"%Y":"raw_data[_PATRONYM].upper()",
"%C":"raw_data[_CALL].upper()",
"%%":"'%'"}
# output = output.replace("%T",title.upper()) new_fmt = format_str
# output = output.replace("%F",first.upper())
# output = output.replace("%P",prefix.upper())
# output = output.replace("%L",surname.upper())
# output = output.replace("%S",suffix.upper())
# output = output.replace("%Y",patronymic.upper())
# output = output.replace("%C",call.upper())
# output = output.replace("%%",'%')
# # Suppress multiple spaces # replace the specific format string flags with a
# prev_space = -1 # flag that works in standard python format strings.
# namestr = '' new_fmt = new_fmt.replace("%t","%s")
# for i in range(len(output)): new_fmt = new_fmt.replace("%f","%s")
# if output[i] == ' ': new_fmt = new_fmt.replace("%p","%s")
# dist = i - prev_space new_fmt = new_fmt.replace("%l","%s")
# prev_space = i new_fmt = new_fmt.replace("%s","%s")
# if dist == 1: new_fmt = new_fmt.replace("%y","%s")
# continue new_fmt = new_fmt.replace("%c","%s")
# namestr += output[i]
# return namestr.strip() new_fmt = new_fmt.replace("%T","%s")
new_fmt = new_fmt.replace("%F","%s")
new_fmt = new_fmt.replace("%P","%s")
new_fmt = new_fmt.replace("%L","%s")
new_fmt = new_fmt.replace("%S","%s")
new_fmt = new_fmt.replace("%Y","%s")
new_fmt = new_fmt.replace("%C","%s")
new_fmt = new_fmt.replace("%%",'%')
def _gen_func(self, format_str): # find each format flag in the original format string
# for each one we find the variable name that is needed to
# replace it and add this to a list. This list will be used
# generate the replacement tuple.
pat = re.compile("%.")
param = ()
mat = pat.search(format_str)
while mat:
param = param + (d[mat.group(0)],)
mat = pat.search(format_str,mat.end())
s = 'def fn(raw_data):\n'\
' return "%s" %% (%s)' % (new_fmt,",".join(param))
exec(s)
return fn
def _gen_cooked_func(self, format_str):
"""The job of building the name from a format string is rather """The job of building the name from a format string is rather
expensive and it is called lots and lots of times. So it is worth expensive and it is called lots and lots of times. So it is worth
going to some length to optimise it as much as possible. going to some length to optimise it as much as possible.
@ -355,9 +369,6 @@ class NameDisplay:
new_fmt = new_fmt.replace("%C","%s") new_fmt = new_fmt.replace("%C","%s")
new_fmt = new_fmt.replace("%%",'%') new_fmt = new_fmt.replace("%%",'%')
# remove any double spaces in the format
new_fmt = ' '.join([ x for x in new_fmt.split(" ") if x != ''])
# find each format flag in the original format string # find each format flag in the original format string
# for each one we find the variable name that is needed to # for each one we find the variable name that is needed to
# replace it and add this to a list. This list will be used # replace it and add this to a list. This list will be used
@ -376,6 +387,28 @@ class NameDisplay:
return fn return fn
def format_str(self,name,format_str):
return self._format_str_base(name.first_name,name.surname,name.prefix,
name.suffix,name.patronymic,name.title,
name.call,format_str)
def format_str_raw(self,raw_data,format_str):
"""
Format a name from the raw name list. To make this as fast as possible
this uses _gen_raw_func to generate a new method for each new format_string.
Is does not call _format_str_base because it would introduce an extra
method call and we need all the speed we can squeeze out of this.
"""
func = self.__class__.raw_format_funcs.get(format_str)
if func == None:
func = self._gen_raw_func(format_str)
self.__class__.raw_format_funcs[format_str] = func
s = func(raw_data)
return ' '.join(s.split())
def _format_str_base(self,first,surname,prefix,suffix,patronymic, def _format_str_base(self,first,surname,prefix,suffix,patronymic,
title,call,format_str): title,call,format_str):
""" """
@ -397,13 +430,11 @@ class NameDisplay:
func = self.__class__.format_funcs.get(format_str) func = self.__class__.format_funcs.get(format_str)
if func == None: if func == None:
func = self._gen_func(format_str) func = self._gen_cooked_func(format_str)
self.__class__.format_funcs[format_str] = func self.__class__.format_funcs[format_str] = func
return func(first,surname,prefix,suffix,patronymic,title,call) s = func(first,surname,prefix,suffix,patronymic,title,call)
# I have moved this to remove the spaces from the format string return ' '.join(s.split())
# I am not sure if this was the correct thing to do. - rjt
#return ' '.join([ x for x in s.split(" ") if x != ''])
#------------------------------------------------------------------------- #-------------------------------------------------------------------------