Updated draft submission author extraction module to handle dash-separated double given names.

- Legacy-Id: 5088
This commit is contained in:
Henrik Levkowetz 2012-12-03 13:17:33 +00:00
parent 158f501653
commit 4946a3f694

View file

@ -40,7 +40,7 @@ import stat
import sys
import time
version = "0.28"
version = "0.29"
program = os.path.basename(sys.argv[0])
progdir = os.path.dirname(sys.argv[0])
@ -480,6 +480,11 @@ class Draft():
# if there's a middle part, let it be optional
first, middle = first.split(" ", 1)
first = "%s( +%s)?" % (first, middle)
# Double names (e.g., Jean-Michel) are abbreviated as two letters
# connected by a dash -- let this expand appropriately
first = re.sub("^([A-Z])-([A-Z])\.\*", r"\1.*-\2.*", first)
# Some Chinese names are shown with double-letter (Latin) abbreviated given names, rather than
# a single-letter (Latin) abbreviation:
first = re.sub("^([A-Z])[A-Z]+\.\*", r"\1[-\w]+", first)