mirror of
git://xwords.git.sourceforge.net/gitroot/xwords/xwords
synced 2025-01-16 15:41:16 +01:00
fix to allow plurals items not in English
Change copy-strings.py to insist that no language provide a format string not also found in English (since parameters to match all English format string are sure to exist, but other languages are free NOT to match them.) It's ok for other languages to provide "few", for example, when English doesn't.
This commit is contained in:
parent
9c4854e91f
commit
2f339450f3
1 changed files with 60 additions and 12 deletions
|
@ -187,43 +187,91 @@ def checkAndCopy( parser, engNames, engFormats, src, dest, verbose ):
|
||||||
|
|
||||||
for elem in doc.findall('plurals'):
|
for elem in doc.findall('plurals'):
|
||||||
if not checkPlurals(engNames, elem, src, verbose):
|
if not checkPlurals(engNames, elem, src, verbose):
|
||||||
|
# print('checkAndCopy(): removing {}'.format(elem))
|
||||||
elem.getparent().remove(elem)
|
elem.getparent().remove(elem)
|
||||||
|
|
||||||
|
# Languages don't have to provide the same set of plurals items:
|
||||||
|
# one, zero, few, other etc. (My English doesn't include "few" so
|
||||||
|
# far.) What can't happen is for there to be a format string in the
|
||||||
|
# totality of them that's not in the totality of English, or for
|
||||||
|
# there to be internal inconsistencies among their format strings,
|
||||||
|
# e.g. a %1$d in "one" and a %1$s in "other"
|
||||||
formats = getFormats( doc, src )
|
formats = getFormats( doc, src )
|
||||||
for name in formats:
|
for name in formats:
|
||||||
if name in formats and not engFormats[name] == formats[name]:
|
if not engFormats[name].hasAll( formats[name] ):
|
||||||
exitWithFormatError( engFormats[name], formats[name], name, dest )
|
exitWithFormatError( engFormats[name], formats[name], name, dest )
|
||||||
|
|
||||||
writeDoc(doc, src, dest)
|
writeDoc(doc, src, dest)
|
||||||
|
|
||||||
|
class FormatSet():
|
||||||
|
def __init__(self):
|
||||||
|
self.fmts = {
|
||||||
|
's': set(),
|
||||||
|
'd': set(),
|
||||||
|
}
|
||||||
|
|
||||||
|
def add(self, fmt):
|
||||||
|
assert(len(fmt) == 4)
|
||||||
|
typ = fmt[3]
|
||||||
|
indx = int(fmt[1])
|
||||||
|
# print('FormatSet.add({},{})'.format(fmt, typ))
|
||||||
|
self.fmts[typ].add(indx)
|
||||||
|
|
||||||
|
def append( self, ps ):
|
||||||
|
for ch in ['s', 'd']:
|
||||||
|
self.fmts[ch].update( ps.fmts[ch] )
|
||||||
|
|
||||||
|
# assert don't have any indices in BOTH sets
|
||||||
|
def check(self):
|
||||||
|
isOK = True
|
||||||
|
if self.fmts['d'].intersection(self.fmts['s']):
|
||||||
|
isOK = False
|
||||||
|
print('error!!!: same index in both: {}'.format(self))
|
||||||
|
return isOK
|
||||||
|
|
||||||
|
def hasAll(self, other):
|
||||||
|
result = True
|
||||||
|
for ch in ['s', 'd']:
|
||||||
|
result = result and 0 == len(other.fmts[ch] - self.fmts[ch])
|
||||||
|
return result
|
||||||
|
|
||||||
|
def __str__(self):
|
||||||
|
return '{}'.format(self.fmts)
|
||||||
|
|
||||||
def setForElem( elem, name ):
|
def setForElem( elem, name ):
|
||||||
result = set()
|
result = FormatSet()
|
||||||
splits = re.split( g_formatsPat, elem.text )
|
splits = re.split( g_formatsPat, elem.text )
|
||||||
nParts = len(splits)
|
nParts = len(splits)
|
||||||
|
# print( 'setForElem({}): text: {}; nParts: {}'.format( name, elem.text, nParts ))
|
||||||
if 1 < nParts:
|
if 1 < nParts:
|
||||||
for ii in range(nParts):
|
for ii in range(nParts):
|
||||||
part = splits[ii]
|
part = splits[ii]
|
||||||
if re.match( g_formatsPat, part ):
|
if re.match( g_formatsPat, part ):
|
||||||
result.add( part )
|
result.add( part )
|
||||||
# print( 'setForElem(', name, ') =>', result)
|
# print( 'setForElem({}) => {}'.format( name, result))
|
||||||
return result
|
return result
|
||||||
|
|
||||||
def getFormats( doc, path ):
|
def getFormats( doc, path ):
|
||||||
result = {}
|
result = {}
|
||||||
for elem in doc.findall('string'):
|
typ = 'string'
|
||||||
name = elem.get('name')
|
for elem in doc.findall(typ):
|
||||||
|
name = typ + '/' + elem.get('name')
|
||||||
result[name] = setForElem( elem, name )
|
result[name] = setForElem( elem, name )
|
||||||
for elem in doc.findall('plurals'):
|
|
||||||
name = elem.get('name')
|
typ = 'plurals'
|
||||||
|
for elem in doc.findall(typ):
|
||||||
|
name = typ + '/' + elem.get('name')
|
||||||
|
pluralsSet = FormatSet()
|
||||||
for item in elem.findall('item'):
|
for item in elem.findall('item'):
|
||||||
quantity = item.get('quantity')
|
quantity = item.get('quantity')
|
||||||
if not item.text or 0 == len(item.text):
|
if not item.text or 0 == len(item.text):
|
||||||
exitWithError( 'plurals ' + name + ' has empty quantity ' + quantity \
|
exitWithError( '{} has empty quantity {} in file {}'.format( name, quantity, lang ) )
|
||||||
+ ' in file ' + lang )
|
|
||||||
else:
|
else:
|
||||||
add = name + '/' + quantity
|
pluralsSet.append(setForElem( item, name ))
|
||||||
result[add] = setForElem( item, add )
|
if not pluralsSet.check():
|
||||||
# print( 'getFormats(', path, ') => ', result)
|
exitWithError( '{} has overlapping sets: {}'.format(name, pluralsSet))
|
||||||
|
result[name] = pluralsSet
|
||||||
|
# print( 'getFormats({}) => {}'.format( path, result ) )
|
||||||
return result
|
return result
|
||||||
|
|
||||||
def main():
|
def main():
|
||||||
|
|
Loading…
Reference in a new issue