katie/scripts/genlocale.py

#!/usr/bin/python3
#-*- coding: UTF-8 -*-

# Data is from https://unicode.org/Public/cldr/44/core.zip

import os, sys, glob, re
import xml.etree.ElementTree as ET

printenumsandexit = ('--printenums' in sys.argv)
printdocsandexit = ('--printdocs' in sys.argv)

def mapcopy(frommap, tomap):
    for key in frommap.keys():
        tomap[key] = frommap[key]

def mapmerge(frommap, tomap, defaultmap):
    for key in frommap.keys():
        if frommap[key] == defaultmap[key]:
            continue
        tomap[key] = frommap[key]

def listcopy(fromlist, tolist):
    for entry in fromlist:
        tolist.append(entry)

def stripxmltext(fromxmltext):
    result = fromxmltext.replace('\n', '')
    result = result.replace('\t', '')
    # 3-passes of double-space removal seems to be enough for all cases
    for r in range(3):
        result = result.replace('  ', ' ')
    return result.strip()

def normalizestring(fromstring):
    result = fromstring.replace(' ', '')
    result = result.replace('-', '')
    result = result.replace(',', '')
    result = result.replace("'", '')
    result = result.replace('&', 'And')
    result = result.replace('(', '')
    result = result.replace(')', '')
    result = result.replace('St.', 'St')
    result = result.replace('U.S.', 'UnitedStates')
    # UTF-8 chars
    result = result.replace(u'ʼ', '')
    result = result.replace(u'’', '')
    result = result.replace(u'ü', 'u')
    result = result.replace(u'å', 'a')
    result = result.replace(u'ç', 'c')
    result = result.replace(u'õ', 'o')
    result = result.replace(u'Å', 'A')
    result = result.replace(u'ô', 'o')
    result = result.replace(u'ã', 'a')
    result = result.replace(u'é', 'e')
    result = result.replace(u'í', 'i')
    result = result.replace(u'ā', 'a')
    result = result.replace(u'á', 'a')
    return result

def xmlmerge(fromxml, fromxml2):
    tree = ET.parse(fromxml)
    root = tree.getroot()
    tree2 = ET.parse(fromxml2)
    root2 = tree2.getroot()
    for element in root:
        root2.insert(0, element)
    return root2

def touint(fromstring):
    # NOTE: symbols (plus, minus, etc.) are assumed to be single character which is not true for
    # many of the locales, however the API for those does not handle them as strings thus the first
    # character only is used
    return ord(fromstring)

def tochar(fromstring):
    if fromstring:
        return '"%s\\0"' % fromstring
    return 'nullptr'

def tochararray(fromstringlist):
    result = '{ '
    for string in fromstringlist:
        result = '%s%s, ' % (result, tochar(string))
    result = '%s }' % result
    result = result.replace(',  }', ' }')
    return result

def todayenum(day):
    if day == 'mon':
        return 'Qt::Monday'
    elif day == 'tue':
        return 'Qt::Tuesday'
    elif day == 'wed':
        return 'Qt::Wednesday'
    elif day == 'thu':
        return 'Qt::Thursday'
    elif day == 'fri':
        return 'Qt::Friday'
    elif day == 'sat':
        return 'Qt::Saturday'
    elif day == 'sun':
        return 'Qt::Sunday'
    print('Unknown day: %s' % day)
    sys.exit(1)

def todatetimeformat(fromformat):
    # valid are y, m, M, d, h, H, s, a, A, z and t
    unsupportedtags = [
        'g',
        'u',
        'q',
        'l',
        'w',
        'f',
        'j',
    ]
    replacementtags = {
        'MMMMM' : 'MMM', # narrow month name
        'LLLLL' : 'MMM', # stand-alone narrow month name
        'E' : 'ddd', 'EE' : 'ddd', 'EEE' : 'ddd', 'EEEEE' : 'ddd', 'EEEE' : 'dddd', # day of week
        'e' : 'ddd', 'ee' : 'ddd', 'eee' : 'ddd', 'eeeee' : 'ddd', 'eeee' : 'dddd', # local day of week
        'c' : 'ddd', 'cc' : 'ddd', 'ccc' : 'ddd', 'ccccc' : 'ddd', 'cccc' : 'dddd', # stand-alone local day of week
        'K' : 'h', # Hour 0-11
        'k' : 'H', # Hour 1-24
        'z' : 'Z', 'zz' : 'Z', 'zzz' : 'Z', 'zzzz' : 'Z', # timezone
        'Z' : 'Z', 'ZZ' : 'Z', 'ZZZ' : 'Z', 'ZZZZ' : 'Z', # timezone
        'v' : 'Z', 'vv' : 'Z', 'vvv' : 'Z', 'vvvv' : 'Z', # timezone
        'V' : 'Z', 'VV' : 'Z', 'VVV' : 'Z', 'VVVV' : 'Z',  # timezone
        'L' : 'M', # stand-alone month names. not supported
    }
    replacementregex = {
        r'y' : 'yyyy',       # four-digit year without leading zeroes
        r'yyy{3,}' : 'yyyy', # more that three digits hence convert to four-digit year
        r'S{1,}' : '',       # fractional seconds. not supported.
        r'A{1,}' : '',       # milliseconds in day. not supported.
        r'a' : 'AP',         # AM/PM
    }
    possibleoccurences = [
        '%s, ',
        ', %s',
        '%s.',
        '.%s',
        '%s-',
        '-%s',
        '(%s)',
        "('%s')",
        '%s ',
        ' %s',
        '%s',
    ]
    result = fromformat
    for tag in unsupportedtags:
        uppertag = tag.upper()
        for occurence in possibleoccurences:
            result = result.replace(occurence % (tag * 4), '')
            result = result.replace(occurence % (tag * 3), '')
            result = result.replace(occurence % (tag * 2), '')
            result = result.replace(occurence % tag, '')
            result = result.replace(occurence % (uppertag * 4), '')
            result = result.replace(occurence % (uppertag * 3), '')
            result = result.replace(occurence % (uppertag * 2), '')
            result = result.replace(occurence % uppertag, '')
    for key in replacementregex.keys():
        result = re.sub(key, replacementregex[key], result)
    for key in replacementtags.keys():
        result = result.replace(key, replacementtags[key])
    return result

def tomonthslist(fromxmlelements, initialvalues):
    result = []
    listcopy(initialvalues, result)
    for month in fromxmlelements:
        monthtype = month.get('type')
        if monthtype == '1':
            result[0] = month.text
        elif monthtype == '2':
            result[1] = month.text
        elif monthtype == '3':
            result[2] = month.text
        elif monthtype == '4':
            result[3] = month.text
        elif monthtype == '5':
            result[4] = month.text
        elif monthtype == '6':
            result[5] = month.text
        elif monthtype == '7':
            result[6] = month.text
        elif monthtype == '8':
            result[7] = month.text
        elif monthtype == '9':
            result[8] = month.text
        elif monthtype == '10':
            result[9] = month.text
        elif monthtype == '11':
            result[10] = month.text
        elif monthtype == '12':
            result[11] = month.text
        else:
            print('Unknown month: %s' % monthtype)
            sys.exit(1)
    return result

def todayslist(fromxmlelements, initialvalues):
    result = []
    listcopy(initialvalues, result)
    for day in fromxmlelements:
        daytype = day.get('type')
        if daytype == 'mon':
            result[0] = day.text
        elif daytype == 'tue':
            result[1] = day.text
        elif daytype == 'wed':
            result[2] = day.text
        elif daytype == 'thu':
            result[3] = day.text
        elif daytype == 'fri':
            result[4] = day.text
        elif daytype == 'sat':
            result[5] = day.text
        elif daytype == 'sun':
            result[6] = day.text
        else:
            print('Unknown day: %s' % daytype)
            sys.exit(1)
    return result

def tolanguageenum(fromstring):
    for key in languagemap.keys():
        if fromstring == languagemap[key]['code']:
            return 'QLocale::Language::%s' % key
    # print('Unknown language: %s' % fromstring)
    # sys.exit(1)

def toscriptenum(fromstring):
    for key in scriptmap.keys():
        if fromstring == scriptmap[key]['code']:
            return 'QLocale::Script::%s' % key
    # print('Unknown script: %s' % fromstring)
    # sys.exit(1)

def tocountryenum(fromstring):
    for key in countrymap.keys():
        if fromstring == countrymap[key]['code']:
            return 'QLocale::Country::%s' % key
    # print('Unknown country: %s' % fromstring)
    # sys.exit(1)

# printenum prints mapped values that have unique code only, the rest are set to the enum of the
# first occurence. the reason for doing so is because table lookups for figuring out language,
# script and country required for constructing QLocale from string (named locales) relies on the
# fact that there is only one code for each, if that is not the case constructing copy of locale
# from its name will not copy it correctly. printtable skips duplicate code entries entirely
def printenum(frommap, prefix):
    keyscount = 0
    aliascodes = []
    seencodes = []

    print('    enum %s {' % prefix)
    # print Default and C first
    for key in frommap.keys():
        if not key in ('Any%s' % prefix, 'C'):
            continue
        print('        %s = %d,' % (key, keyscount))
        keyscount += 1

    # now everything except those, save last key for later
    lastkey = ''
    for key in sorted(frommap.keys()):
        if key in ('Any%s' % prefix, 'C'):
            continue
        code = frommap[key]['code']
        if code in seencodes:
            aliascodes.append(key)
            continue
        seencodes.append(code)
        print('        %s = %d,' % (key, keyscount))
        lastkey = key
        keyscount += 1

    # now aliases
    print('')
    for alias in sorted(aliascodes):
        aliascode = frommap[alias]['code']
        aliasenum = None
        for key in sorted(frommap.keys()):
            code = frommap[key]['code']
            if aliascode == code:
                aliasenum == key
                break
        print('        %s = %s,' % (alias, key))

    # print last key
    print('\n        Last%s = %s' % (prefix, lastkey))

    print('    };\n')
def printdoc(frommap, prefix):
    print('// %s' % prefix)
    for key in sorted(frommap.keys()):
        if key in ('Any%s' % prefix, 'C'):
            continue
        print('    \\value %s' % key)
    print('')

def printtable(frommap, prefix):
    lowerprefix = prefix.lower()
    seencodes = []

    print('''static const struct %sTblData {
    const QLocale::%s %s;
    const char* name;
    const char* code;
} %sTbl[] = {''' % (lowerprefix, prefix, lowerprefix, lowerprefix))

    # print Default and C first
    for key in frommap.keys():
        if not key in ('Any%s' % prefix, 'C'):
            continue
        code = frommap[key]['code']
        name = frommap[key]['name']
        print('    { QLocale::%s::%s, %s, %s },' % (prefix, key, tochar(name), tochar(code)))

    # now everything except those but only unique code values
    for key in sorted(frommap.keys()):
        if key in ('Any%s' % prefix, 'C'):
            continue
        code = frommap[key]['code']
        if code in seencodes:
            continue
        seencodes.append(code)
        name = frommap[key]['name']
        print('    { QLocale::%s::%s, %s, %s },' % (prefix, key, tochar(name), tochar(code)))

    print('};')
    print('static const qint16 %sTblSize = sizeof(%sTbl) / sizeof(%sTblData);\n' % (lowerprefix, lowerprefix, lowerprefix))

def printlocaledata(frommap, key):
    value = frommap[key]
    # skip table entries without country (non-territory), unless it is artificial, this is done to
    # preserve the assumption in QLocalePrivate::findLocale that "AnyCountry" means "find me a
    # language, no matter what country it is spoken in" if "AnyCountry" is passed to it as argument
    # and also shrinks the table
    if value['country'] == 'QLocale::Country::AnyCountry' and not key == 'C':
        return
    # HACK: skip table entries the language of which is unknown
    if key == 'apc_SY' or key == 'skr_PK':
        return
    # HACK: skip table entries with and without specifiec script
    if key == 'ha_Arab_NG':
        return
    print('''    {
        %s, %s, %s,
        %s, %s, %s,
        %s, %s, %s, %s, %s, %s, %s, %s,
        %s, %s, %s, %s,
        %s, %s,
        %s,
        %s,
        %s,
        %s,
        %s,
        %s,
        %s,
        %s,
        %s,
        %s,
        %s,
        %s
    }, // %s''' % (
            value['language'],
            value['script'],
            value['country'],
            value['first_day_of_week'],
            value['weekend_start'],
            value['weekend_end'],
            touint(value['decimal']),
            touint(value['group']),
            touint(value['list']),
            touint(value['percent']),
            touint(value['minus']),
            touint(value['plus']),
            touint(value['exponential']),
            touint(value['zero']),
            tochar(value['short_date_format']),
            tochar(value['long_date_format']),
            tochar(value['short_time_format']),
            tochar(value['long_time_format']),
            tochar(value['am']),
            tochar(value['pm']),
            tochararray(value['standalone_short_month_names']),
            tochararray(value['standalone_long_month_names']),
            tochararray(value['standalone_narrow_month_names']),
            tochararray(value['short_month_names']),
            tochararray(value['long_month_names']),
            tochararray(value['narrow_month_names']),
            tochararray(value['standalone_short_day_names']),
            tochararray(value['standalone_long_day_names']),
            tochararray(value['standalone_narrow_day_names']),
            tochararray(value['short_day_names']),
            tochararray(value['long_day_names']),
            tochararray(value['narrow_day_names']),
            key,
        )
    )

def printaliastable(frommap, prefix):
    print('''static const struct %sAliasTblData {
    const char* original;
    const char* substitute;
} %sAliasTbl[] = {''' % (prefix, prefix))

    for key in sorted(frommap):
        # territories and scripts entries can contain multiple replacements, add one for each
        splitvalue = frommap[key].split(' ')
        for value in splitvalue:
            print('    { "%s", "%s" },' % (key, value))

    print('};')
    print('static const qint16 %sAliasTblSize = sizeof(%sAliasTbl) / sizeof(%sAliasTblData);\n' % (prefix, prefix, prefix))

# main maps
languagemap = {}
countrymap = {}
scriptmap = {}
localemap = {}
likelysubtagsmap = {}
languagealiasmap = {}
countryaliasmap = {}
scriptaliasmap = {}
# cross-reference maps
localeparentmap = {}
localeparentvaluesmap = {}
localescriptmap = {}
localefirstdaymap = {}
localeweekendstartmap = {}
localeweekendendmap = {}
localenumberingmap = {}
# regular expressions
localeregex = re.compile('([^_|\-|\.|@]+)+')

# artificial entries
languagemap['AnyLanguage'] = {
    'code': '',
    'name': 'Default',
}
languagemap['C'] = {
    'code': 'C',
    'name': 'C',
}
countrymap['AnyCountry'] = {
    'code': '',
    'name': 'Default',
}
scriptmap['AnyScript'] = {
    'code': '',
    'name': 'Default',
}

# locale to parent parsing
tree = ET.parse('common/supplemental/supplementalData.xml')
root = tree.getroot()
for parentlocale in root.findall('./parentLocales/parentLocale'):
    parentlocaleparent = parentlocale.get('parent')
    parentlocalelocales = parentlocale.get('locales')
    localeparentmap[parentlocaleparent] = parentlocalelocales.split(' ')

# locale to script parsing
# only languages with one primary script are mapped because if there are multiple it should be
# specified in the locale data, see:
# https://sites.google.com/site/cldr/development/updating-codes/update-language-script-info/language-script-description
# secondary scripts are not taken into account at all
for suppllanguage in root.findall('./languageData/language'):
    suppllanguagetype = suppllanguage.get('type')
    suppllanguagescripts = suppllanguage.get('scripts')
    suppllanguagealt = suppllanguage.get('alt')
    if not suppllanguagescripts or suppllanguagealt == 'secondary':
        # alternative entry, skip it
        continue
    suppllanguagescriptslist = suppllanguagescripts.split(' ')
    if not len(suppllanguagescriptslist) == 1:
        # skip entries without definitive primary script
        continue
    suppllanguageterritories = suppllanguage.get('territories')
    if not suppllanguageterritories:
        # territories is optional, if not specified use artifical value to map all languages of
        # that type to the script
        suppllanguageterritories = 'AnyTerritory'
    localescriptmap[suppllanguagetype] = {
        'script': suppllanguagescripts,
        'territories': suppllanguageterritories.split(' '),
    }

# locale to first day parsing
for firstday in root.findall('./weekData/firstDay'):
    firstdayday = firstday.get('day')
    firstdayterritories = firstday.get('territories')
    localefirstdaymap[todayenum(firstdayday)] = stripxmltext(firstdayterritories).split(' ')

# locale to weekend start parsing
for weekstart in root.findall('./weekData/weekendStart'):
    weekstartday = weekstart.get('day')
    weekstartterritories = weekstart.get('territories')
    localeweekendstartmap[todayenum(weekstartday)] = stripxmltext(weekstartterritories).split(' ')

# locale to weekend end parsing
for weekend in root.findall('./weekData/weekendEnd'):
    weekendday = weekend.get('day')
    weekendterritories = weekend.get('territories')
    localeweekendendmap[todayenum(weekendday)] = stripxmltext(weekendterritories).split(' ')

# locale to numbering system parsing
tree = ET.parse('common/supplemental/numberingSystems.xml')
root = tree.getroot()
for numberingsystem  in root.findall('./numberingSystems/numberingSystem'):
    numberingsystemid = numberingsystem.get('id')
    numberingsystemdigits = numberingsystem.get('digits')
    if numberingsystemdigits:
        # either digits or rules is set
        localenumberingmap[numberingsystemid] = stripxmltext(numberingsystemdigits)

# language parsing
tree = ET.parse('common/main/en.xml')
root = tree.getroot()
for language in root.findall('./localeDisplayNames/languages/language'):
    languagetype = language.get('type')
    normallanguage = normalizestring(language.text)
    if normallanguage in ('Nauru', 'Tokelau', 'Tuvalu'):
        # country and language are the same, suffix to solve enum clashes
        normallanguage = '%sLanguage' % normallanguage
    languagemap[normallanguage] = {
        'code': languagetype,
        'name': language.text,
    }

if printenumsandexit:
    printenum(languagemap, 'Language')
elif printdocsandexit:
    printdoc(languagemap, 'Language')
else:
    printtable(languagemap, 'Language')

# country parsing
for country in root.findall('./localeDisplayNames/territories/territory'):
    countrytype = country.get('type')
    normalcountry = normalizestring(country.text)
    countrymap[normalcountry] = {
        'code': countrytype,
        'name': country.text,
    }

if printenumsandexit:
    printenum(countrymap, 'Country')
elif printdocsandexit:
    printdoc(countrymap, 'Country')
else:
    printtable(countrymap, 'Country')

# scripts parsing
for script in root.findall('./localeDisplayNames/scripts/script'):
    scripttype = script.get('type')
    normalscript = normalizestring(script.text)
    if not normalscript.endswith('Script'):
        # suffix script if needed
        normalscript = '%sScript' % normalscript
    if normalscript in ('UnknownScript', 'CommonScript'):
        # only interested in specific scripts
        continue
    scriptmap[normalscript] = {
        'code': scripttype,
        'name': script.text,
    }

if printenumsandexit:
    printenum(scriptmap, 'Script')
    sys.exit(0)
elif printdocsandexit:
    printdoc(scriptmap, 'Script')
    sys.exit(0)
else:
    printtable(scriptmap, 'Script')

# these defaults are used as parent locales fallback, C uses them as actual values because root
# contains UTF-8 characters and for compatibility. for the rest defaults are set from root
localedefaults = {
    # enums
    'language': 'QLocale::Language::AnyLanguage',
    'script': 'QLocale::Script::AnyScript',
    'country': 'QLocale::Country::AnyCountry',
    'first_day_of_week': 'Qt::Monday',
    'weekend_start': 'Qt::Saturday',
    'weekend_end': 'Qt::Sunday',
    # characters
    'decimal': '.',
    'group': ',',
    'list': ';',
    'percent': '%',
    'zero': '0',
    'minus': '-',
    'plus': '+',
    'exponential': 'e', # default in CLDR is E
    # strings
    'short_date_format': 'd MMM yyyy', # default in CLDR is y-MM-dd
    'long_date_format': 'd MMMM yyyy',
    'short_time_format': 'HH:mm:ss', # default in CLDR is HH:mm
    'long_time_format': 'HH:mm:ss z',
    'am': 'AM',
    'pm': 'PM',
    # arrays
    'standalone_short_month_names': ['Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun', 'Jul', 'Aug', 'Sep', 'Oct', 'Nov', 'Dec'],
    'standalone_long_month_names': ['January', 'February', 'March', 'April', 'May', 'June', 'July', 'August', 'September', 'October', 'November', 'December'],
    'standalone_narrow_month_names': ['J', 'F', 'M', 'A', 'M', 'J', 'J', 'A', 'S', 'O', 'N', 'D'],
    'short_month_names': ['Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun', 'Jul', 'Aug', 'Sep', 'Oct', 'Nov', 'Dec'],
    'long_month_names':  ['January', 'February', 'March', 'April', 'May', 'June', 'July', 'August', 'September', 'October', 'November', 'December'],
    'narrow_month_names': ['1', '2', '3', '4', '5', '6', '7', '8', '9', '10', '11', '12'],
    'standalone_short_day_names': ['Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun'],
    'standalone_long_day_names': ['Monday', 'Tuesday', 'Wednesday', 'Thursday', 'Friday', 'Saturday', 'Sunday'],
    'standalone_narrow_day_names': ['M', 'T', 'W', 'T', 'F', 'S', 'S'],
    'short_day_names': ['Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun'],
    'long_day_names': ['Monday', 'Tuesday', 'Wednesday', 'Thursday', 'Friday', 'Saturday', 'Sunday'],
    'narrow_day_names': ['1', '2', '3', '4', '5', '6', '7'],
}
# artificial entries
localemap['C'] = {}
mapcopy(localedefaults, localemap['C'])
localemap['C']['language'] = 'QLocale::Language::C'

# locales parsing
# TODO: accept only "contributed" or "approved" values
def readlocale(fromxml, tomap, isparent):
    locale = os.path.basename(fromxml)
    locale = locale.replace('.xml', '')

    if '_' in fromxml:
        # merge parent locales (non-territory) into the current one so that data can be read
        # from them. they do not have territory and currency data is based on territory so
        # cross-reference is not possible without doing so
        localeparent = locale.split('_')[0]
        xmlparent = fromxml.replace(locale, localeparent)
        root = xmlmerge(fromxml, xmlparent)
    else:
        tree = ET.parse(fromxml)
        root = tree.getroot()

    variant = root.find('./identity/variant')
    if variant is not None:
        # TODO: variants are not supported by QLocale
        return

    language = root.find('./identity/language')
    langtype = language.get('type')
    country = root.find('./identity/territory')
    countrytype = None
    scripttype = None
    numbertype = 'latn' # CLDR default

    tomap[locale] = {}
    if isparent:
        mapcopy(localedefaults, tomap[locale])
    else:
        mapcopy(localeparentvaluesmap['root'], tomap[locale])

    # set defaults from parent locale if territory is specified
    if country is not None:
        for parent in localeparentmap.keys():
            if locale in localeparentmap[parent]:
                if not parent in localeparentvaluesmap.keys():
                    # reference to locale without data
                    continue
                mapcopy(localeparentvaluesmap[parent], tomap[locale])
    # then from main locale (non-territory) filling the blanks that even parent locales do not fill
    if not isparent:
        mapmerge(localemap[langtype], tomap[locale], localedefaults)

    # find the enums from mapped values
    tomap[locale]['language'] = tolanguageenum(langtype)

    if not isparent and country is not None:
        countrytype = country.get('type')
        tomap[locale]['country'] = tocountryenum(countrytype)
    else:
        # territory often is not specified, use language code as fallback
        countrytype = langtype.upper()

    # script is specified either in the locale or supplemental data
    script = root.find('./identity/script')
    if script is not None:
        scripttype = script.get('type')
    elif not isparent:
        # scripts map is partial, pick from what is mapped
        if langtype in localescriptmap.keys():
            scriptterritories = localescriptmap[langtype]['territories']
            if 'AnyTerritory' in scriptterritories \
                or countrytype in scriptterritories:
                scripttype = localescriptmap[langtype]['script']

    defaultnumbersystem = root.find('./numbers/defaultNumberingSystem')
    if defaultnumbersystem is not None:
        numbertype = defaultnumbersystem.text

    # find values from supplemental maps
    if not isparent and scripttype:
        tomap[locale]['script'] = toscriptenum(scripttype)

    for key in localefirstdaymap.keys():
        for countryvalue in localefirstdaymap[key]:
            if countryvalue == countrytype:
                tomap[locale]['first_day_of_week'] = key
                break

    for key in localeweekendstartmap.keys():
        for countryvalue in localeweekendstartmap[key]:
            if countryvalue == countrytype:
                tomap[locale]['weekend_start'] = key
                break

    for key in localeweekendendmap.keys():
        for countryvalue in localeweekendendmap[key]:
            if countryvalue == countrytype:
                tomap[locale]['weekend_end'] = key
                break

    # find from locale data
    for symbol in root.findall('./numbers/symbols'):
        symbolnumbersystem = symbol.get('numberSystem')
        if not symbolnumbersystem == numbertype:
            # should be the locale numeric system
            continue

        decimal = symbol.find('./decimal')
        if decimal is not None and len(decimal.text) == 1:
            tomap[locale]['decimal'] = decimal.text

        group = symbol.find('./group')
        if group is not None and len(group.text) == 1:
            tomap[locale]['group'] = group.text

        listdelimiter = symbol.find('./list')
        if listdelimiter is not None and len(listdelimiter.text) == 1:
            tomap[locale]['list'] = listdelimiter.text

        percent = symbol.find('./percentSign')
        if percent is not None and len(percent.text) == 1:
            tomap[locale]['percent'] = percent.text

        minus = symbol.find('./minusSign')
        if minus is not None and len(minus.text) == 1:
            tomap[locale]['minus'] = minus.text

        plus = symbol.find('./plusSign')
        if plus is not None and len(plus.text) == 1:
            tomap[locale]['plus'] = plus.text

        exponential = symbol.find('./exponential')
        if exponential is not None and len(exponential.text) == 1:
            tomap[locale]['exponential'] = exponential.text

        # zero is from cross-reference numeric system map,
        # taking the first character works even for UTF-8 chars
        tomap[locale]['zero'] = localenumberingmap[numbertype][0]

        # locale numeric system was found, break
        break

    for calendar in root.findall('./dates/calendars/calendar'):
        calendartype = calendar.get('type')
        if not calendartype == 'gregorian':
            # all values should be from gregorian calendar
            continue
        for dateformat in calendar.findall('./dateFormats/dateFormatLength'):
            dateformattype = dateformat.get('type')
            if dateformattype == 'short':
                pattern = dateformat.find('./dateFormat/pattern')
                tomap[locale]['short_date_format'] = todatetimeformat(pattern.text)
            elif dateformattype == 'long':
                pattern = dateformat.find('./dateFormat/pattern')
                tomap[locale]['long_date_format'] = todatetimeformat(pattern.text)

        for timeformat in calendar.findall('./timeFormats/timeFormatLength'):
            timeformattype = timeformat.get('type')
            if timeformattype == 'short':
                pattern = timeformat.find('./timeFormat/pattern')
                tomap[locale]['short_time_format'] = todatetimeformat(pattern.text)
            elif timeformattype == 'long':
                pattern = timeformat.find('./timeFormat/pattern')
                tomap[locale]['long_time_format'] = todatetimeformat(pattern.text)

        for dayperiodwidth in calendar.findall('./dayPeriods/dayPeriodContext/dayPeriodWidth'):
            dayperiodwidthtype = dayperiodwidth.get('type')
            if not dayperiodwidthtype == 'wide':
                # all values should be in wide format
                continue
            for dayperiod in dayperiodwidth.findall('dayPeriod'):
                dayperiodtype = dayperiod.get('type')
                if dayperiodtype == 'am':
                    tomap[locale]['am'] = dayperiod.text
                elif dayperiodtype == 'pm':
                    tomap[locale]['pm'] = dayperiod.text

        # month/day names
        for monthcontext in calendar.findall('./months/monthContext'):
            monthcontexttype = monthcontext.get('type')
            if monthcontexttype == 'stand-alone':
                for monthwidth in monthcontext.findall('./monthWidth'):
                    monthwidthtype = monthwidth.get('type')
                    if monthwidthtype == 'wide':
                        months = monthwidth.findall('./month')
                        tomap[locale]['standalone_long_month_names'] = tomonthslist(months, tomap[locale]['standalone_long_month_names'])
                    elif monthwidthtype == 'abbreviated':
                        months = monthwidth.findall('./month')
                        tomap[locale]['standalone_short_month_names'] = tomonthslist(months, tomap[locale]['standalone_short_month_names'])
                    elif monthwidthtype == 'narrow':
                        months = monthwidth.findall('./month')
                        tomap[locale]['standalone_narrow_month_names'] = tomonthslist(months, tomap[locale]['standalone_narrow_month_names'])
            elif monthcontexttype == 'format':
                for monthwidth in monthcontext.findall('./monthWidth'):
                    monthwidthtype = monthwidth.get('type')
                    if monthwidthtype == 'wide':
                        months = monthwidth.findall('./month')
                        tomap[locale]['long_month_names'] = tomonthslist(months, tomap[locale]['long_month_names'])
                    elif monthwidthtype == 'abbreviated':
                        months = monthwidth.findall('./month')
                        tomap[locale]['short_month_names'] = tomonthslist(months, tomap[locale]['short_month_names'])
                    elif monthwidthtype == 'narrow':
                        months = monthwidth.findall('./month')
                        tomap[locale]['narrow_month_names'] = tomonthslist(months, tomap[locale]['narrow_month_names'])

        for daycontext in calendar.findall('./days/dayContext'):
            daycontexttype = daycontext.get('type')
            if daycontexttype == 'stand-alone':
                for daywidth in daycontext.findall('./dayWidth'):
                    daywidthtype = daywidth.get('type')
                    if daywidthtype == 'wide':
                        days = daywidth.findall('./day')
                        tomap[locale]['standalone_long_day_names'] = todayslist(days, tomap[locale]['standalone_long_day_names'])
                    elif daywidthtype == 'abbreviated':
                        days = daywidth.findall('./day')
                        tomap[locale]['standalone_short_day_names'] = todayslist(days, tomap[locale]['standalone_short_day_names'])
                    elif daywidthtype == 'narrow':
                        days = daywidth.findall('./day')
                        tomap[locale]['standalone_narrow_day_names'] = todayslist(days, tomap[locale]['standalone_narrow_day_names'])
            elif daycontexttype == 'format':
                for daywidth in daycontext.findall('./dayWidth'):
                    daywidthtype = daywidth.get('type')
                    if daywidthtype == 'wide':
                        days = daywidth.findall('./day')
                        tomap[locale]['long_day_names'] = todayslist(days, tomap[locale]['long_day_names'])
                    elif daywidthtype == 'abbreviated':
                        days = daywidth.findall('./day')
                        tomap[locale]['short_day_names'] = todayslist(days, tomap[locale]['short_day_names'])
                    elif daywidthtype == 'narrow':
                        days = daywidth.findall('./day')
                        tomap[locale]['narrow_day_names'] = todayslist(days, tomap[locale]['narrow_day_names'])

        # gregorian calendar was found, break
        break

    # month/day names are set during calendar parsing

# read parent locales first
for xml in glob.glob('common/main/*.xml'):
    xmlbase = os.path.basename(xml)
    xmlbase = xmlbase.replace('.xml', '')
    if not xmlbase in localeparentmap.keys():
        continue
    readlocale(xml, localeparentvaluesmap, True)

# now everything including those
for xml in sorted(glob.glob('common/main/*.xml')):
    if xml.endswith('/root.xml'):
        # root is not actual locale
        continue
    readlocale(xml, localemap, False)

print('''static const QLocalePrivate localeTbl[] = {''')

# print C first
printlocaledata(localemap, 'C')

# now everything except that
for key in sorted(localemap.keys()):
    if key == 'C':
        continue
    printlocaledata(localemap, key)

print('};')
print('static const qint16 localeTblSize = sizeof(localeTbl) / sizeof(QLocalePrivate);\n')

# likely subtags parsing
tree = ET.parse('common/supplemental/likelySubtags.xml')
root = tree.getroot()
for likelysubtag in root.findall('./likelySubtags/likelySubtag'):
    likelysubtagfrom = likelysubtag.get('from')
    likelysubtagto = likelysubtag.get('to')
    # split code into language, script and country to make it possible to match against regardless
    # of separators and remap to enums so that it is possible to substitute both named and enumed
    # locale searches at the cost of not covering all named cases
    likelysubtagfromsplit = localeregex.findall(likelysubtagfrom)
    likelysubtagfromsplitlen = len(likelysubtagfromsplit)
    likelysubtagtosplit = localeregex.findall(likelysubtagto)
    likelysubtagtosplitlen = len(likelysubtagtosplit)
    likelyfromlanguage = None
    likelyfromscript = None
    likelyfromcountry = None
    if likelysubtagfromsplitlen == 1:
        likelyfromlanguage = tolanguageenum(likelysubtagfromsplit[0])
        likelyfromscript = 'QLocale::Script::AnyScript'
        likelyfromcountry = 'QLocale::Country::AnyCountry'
    elif likelysubtagfromsplitlen == 2:
        likelyfromlanguage = tolanguageenum(likelysubtagfromsplit[0])
        likelyfromscript = 'QLocale::Script::AnyScript'
        likelyfromcountry = tocountryenum(likelysubtagfromsplit[1])
    elif likelysubtagfromsplitlen == 3:
        likelyfromlanguage = tolanguageenum(likelysubtagfromsplit[0])
        likelyfromscript = toscriptenum(likelysubtagfromsplit[1])
        likelyfromcountry = tocountryenum(likelysubtagfromsplit[2])
    elif likelysubtagfromsplitlen > 3 or likelysubtagtosplitlen > 3:
        # the regular expression is intentionally greedy, if there are more than 3 group matches
        # then it is likely a variant and that is not supported case yet
        print(likelysubtagfrom, likelysubtagfromsplit)
        print(likelysubtagto, likelysubtagtosplit)
        sys.exit(1)
    likelytolanguage = tolanguageenum(likelysubtagtosplit[0])
    likelytoscript = toscriptenum(likelysubtagtosplit[1])
    likelytocountry = tocountryenum(likelysubtagtosplit[2])

    if not likelyfromlanguage or not likelyfromscript or not likelyfromcountry \
        or not likelytolanguage or not likelytoscript or not likelytocountry:
        # if there are no enums for the codes skip the entry
        continue

    likelysubtagsmap[likelysubtagfrom] = {
        'fromlanguage' : likelyfromlanguage,
        'fromscript' : likelyfromscript,
        'fromcountry' : likelyfromcountry,
        'tolanguage' : likelytolanguage,
        'toscript' : likelytoscript,
        'tocountry' : likelytocountry,
    }
print('''static const struct subtagAliasTblData {
    const QLocale::Language fromlanguage;
    const QLocale::Script fromscript;
    const QLocale::Country fromcountry;
    const QLocale::Language tolanguage;
    const QLocale::Script toscript;
    const QLocale::Country tocountry;
} subtagAliasTbl[] = {''')

for key in sorted(likelysubtagsmap):
    value = likelysubtagsmap[key]
    print('''    {
        %s, %s, %s,
        %s, %s, %s
    },''' % (
            value['fromlanguage'],
            value['fromscript'],
            value['fromcountry'],
            value['tolanguage'],
            value['toscript'],
            value['tocountry'],
        )
    )

print('};')
print('static const qint16 subtagAliasTblSize = sizeof(subtagAliasTbl) / sizeof(subtagAliasTblData);\n')

# language alias parsing
tree = ET.parse('common/supplemental/supplementalMetadata.xml')
root = tree.getroot()
for languagealias in root.findall('./metadata/alias/languageAlias'):
    languagealiastype = languagealias.get('type')
    languagealiasreplacement = languagealias.get('replacement')
    if '_' in languagealiastype or '-' in languagealiastype \
        or '_' in languagealiasreplacement or '-' in languagealiasreplacement:
        # if either the original or the substitute is BCP47 code (language and script/country
        # included) skip it because QLocalePrivate::codeToLanguage() should be dealing with
        # language codes only
        continue
    languagealiasmap[languagealiastype] = languagealiasreplacement

printaliastable(languagealiasmap, 'language')

# country alias parsing
for territoryalias in root.findall('./metadata/alias/territoryAlias'):
    territoryaliastype = territoryalias.get('type')
    territoryaliasreplacement = territoryalias.get('replacement')
    countryaliasmap[territoryaliastype] = territoryaliasreplacement

printaliastable(countryaliasmap, 'country')

# script alias parsing
for scriptalias in root.findall('./metadata/alias/scriptAlias'):
    scriptaliastype = scriptalias.get('type')
    scriptaliasreplacement = scriptalias.get('replacement')
    scriptaliasmap[scriptaliastype] = scriptaliasreplacement

printaliastable(scriptaliasmap, 'script')
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								#!/usr/bin/python3
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								#-*- coding: UTF-8 -*-
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												update tables data to CLDR v44

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2024-03-13 22:23:10 +02:00
+								# Data is from https://unicode.org/Public/cldr/44/core.zip
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								import os, sys, glob, re
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
+								import xml.etree.ElementTree as ET
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												add --printenums option to genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 13:53:57 +00:00
+								printenumsandexit = ('--printenums' in sys.argv)
-												update tables data to CLDR v36.1

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2020-03-19 21:36:11 +00:00
+								printdocsandexit = ('--printdocs' in sys.argv)
-												add --printenums option to genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 13:53:57 +00:00
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								def mapcopy(frommap, tomap):
 								    for key in frommap.keys():
 								        tomap[key] = frommap[key]
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												do not overwrite parent locale values with defaults

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:24:47 +00:00
+								def mapmerge(frommap, tomap, defaultmap):
 								    for key in frommap.keys():
 								        if frommap[key] == defaultmap[key]:
 								            continue
 								        tomap[key] = frommap[key]
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								def listcopy(fromlist, tolist):
 								    for entry in fromlist:
 								        tolist.append(entry)
 								def stripxmltext(fromxmltext):
 								    result = fromxmltext.replace('\n', '')
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								    result = result.replace('\t', '')
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    # 3-passes of double-space removal seems to be enough for all cases
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 22:08:29 +00:00
+								    for r in range(3):
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        result = result.replace('  ', ' ')
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								    return result.strip()
-												merge non-territory locales into territory ones in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 12:03:33 +00:00
+								def normalizestring(fromstring):
 								    result = fromstring.replace(' ', '')
 								    result = result.replace('-', '')
-												update locale date from CLDR v36

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-11-17 17:39:37 +00:00
+								    result = result.replace(',', '')
-												merge non-territory locales into territory ones in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 12:03:33 +00:00
+								    result = result.replace("'", '')
 								    result = result.replace('&', 'And')
 								    result = result.replace('(', '')
 								    result = result.replace(')', '')
 								    result = result.replace('St.', 'St')
 								    result = result.replace('U.S.', 'UnitedStates')
 								    # UTF-8 chars
 								    result = result.replace(u'ʼ', '')
 								    result = result.replace(u'’', '')
 								    result = result.replace(u'ü', 'u')
 								    result = result.replace(u'å', 'a')
 								    result = result.replace(u'ç', 'c')
 								    result = result.replace(u'õ', 'o')
 								    result = result.replace(u'Å', 'A')
 								    result = result.replace(u'ô', 'o')
 								    result = result.replace(u'ã', 'a')
 								    result = result.replace(u'é', 'e')
 								    result = result.replace(u'í', 'i')
-												update tables data to CLDR v40

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2021-11-20 16:49:58 +02:00
+								    result = result.replace(u'ā', 'a')
-												prepare genlocale.py script for CLDR v42

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2022-11-14 20:35:44 +02:00
+								    result = result.replace(u'á', 'a')
-												merge non-territory locales into territory ones in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 12:03:33 +00:00
+								    return result
 								def xmlmerge(fromxml, fromxml2):
 								    tree = ET.parse(fromxml)
 								    root = tree.getroot()
 								    tree2 = ET.parse(fromxml2)
 								    root2 = tree2.getroot()
 								    for element in root:
 								        root2.insert(0, element)
 								    return root2
-												make zero symbol uint and regenerate locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 20:31:26 +00:00
+								def touint(fromstring):
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    # NOTE: symbols (plus, minus, etc.) are assumed to be single character which is not true for
 								    # many of the locales, however the API for those does not handle them as strings thus the first
 								    # character only is used
 								    return ord(fromstring)
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 18:23:29 +00:00
+								def tochar(fromstring):
 								    if fromstring:
 								        return '"%s\\0"' % fromstring
-												get rid of Q_NULLPTR definition [ci reset]

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2021-08-06 15:35:21 +03:00
+								    return 'nullptr'
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												use Q_NULLPTR for empty char array values in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 15:33:59 +00:00
+								def tochararray(fromstringlist):
 								    result = '{ '
 								    for string in fromstringlist:
 								        result = '%s%s, ' % (result, tochar(string))
 								    result = '%s }' % result
 								    result = result.replace(',  }', ' }')
 								    return result
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 18:23:29 +00:00
+								def todayenum(day):
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    if day == 'mon':
 								        return 'Qt::Monday'
 								    elif day == 'tue':
 								        return 'Qt::Tuesday'
 								    elif day == 'wed':
 								        return 'Qt::Wednesday'
 								    elif day == 'thu':
 								        return 'Qt::Thursday'
 								    elif day == 'fri':
 								        return 'Qt::Friday'
 								    elif day == 'sat':
 								        return 'Qt::Saturday'
 								    elif day == 'sun':
 								        return 'Qt::Sunday'
 								    print('Unknown day: %s' % day)
 								    sys.exit(1)
-												remove invalid date/time format tags from locale data

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 01:32:21 +00:00
+								def todatetimeformat(fromformat):
-												"a" is valid date/time format tag

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 20:32:13 +00:00
+								    # valid are y, m, M, d, h, H, s, a, A, z and t
-												remove invalid date/time format tags from locale data

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 01:32:21 +00:00
+								    unsupportedtags = [
 								        'g',
 								        'u',
 								        'q',
 								        'l',
 								        'w',
 								        'f',
 								        'j',
 								    ]
-												handle all invalid cases in genlocale date/time formatter

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 00:50:49 +00:00
+								    replacementtags = {
-												ensure genlocale date/time formatter does not produce incorrect results

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 12:11:23 +00:00
+								        'MMMMM' : 'MMM', # narrow month name
 								        'LLLLL' : 'MMM', # stand-alone narrow month name
 								        'E' : 'ddd', 'EE' : 'ddd', 'EEE' : 'ddd', 'EEEEE' : 'ddd', 'EEEE' : 'dddd', # day of week
 								        'e' : 'ddd', 'ee' : 'ddd', 'eee' : 'ddd', 'eeeee' : 'ddd', 'eeee' : 'dddd', # local day of week
 								        'c' : 'ddd', 'cc' : 'ddd', 'ccc' : 'ddd', 'ccccc' : 'ddd', 'cccc' : 'dddd', # stand-alone local day of week
 								        'K' : 'h', # Hour 0-11
 								        'k' : 'H', # Hour 1-24
-												deal with TODO related to timezone format char

for reference:
https://github.com/fluxer/katie/commit/09592d6e12a2a5e555829e5fa969e3232ae7a248

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2021-11-23 08:15:08 +02:00
+								        'z' : 'Z', 'zz' : 'Z', 'zzz' : 'Z', 'zzzz' : 'Z', # timezone
 								        'Z' : 'Z', 'ZZ' : 'Z', 'ZZZ' : 'Z', 'ZZZZ' : 'Z', # timezone
 								        'v' : 'Z', 'vv' : 'Z', 'vvv' : 'Z', 'vvvv' : 'Z', # timezone
 								        'V' : 'Z', 'VV' : 'Z', 'VVV' : 'Z', 'VVVV' : 'Z',  # timezone
-												ensure genlocale date/time formatter does not produce incorrect results

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 12:11:23 +00:00
+								        'L' : 'M', # stand-alone month names. not supported
-												handle all invalid cases in genlocale date/time formatter

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 00:50:49 +00:00
+								    }
 								    replacementregex = {
-												ensure genlocale date/time formatter does not produce incorrect results

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 12:11:23 +00:00
+								        r'y' : 'yyyy',       # four-digit year without leading zeroes
 								        r'yyy{3,}' : 'yyyy', # more that three digits hence convert to four-digit year
 								        r'S{1,}' : '',       # fractional seconds. not supported.
-												minor comments corrections

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2021-04-19 21:23:48 +03:00
+								        r'A{1,}' : '',       # milliseconds in day. not supported.
-												ensure genlocale date/time formatter does not produce incorrect results

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 12:11:23 +00:00
+								        r'a' : 'AP',         # AM/PM
-												handle all invalid cases in genlocale date/time formatter

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 00:50:49 +00:00
+								    }
-												replace longest matches date/time tags first in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 10:57:58 +00:00
+								    possibleoccurences = [
-												remove invalid date/time format tags from locale data

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 01:32:21 +00:00
+								        '%s, ',
-												add more possible occurences if invalid date/time format tags

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 18:56:47 +00:00
+								        ', %s',
-												remove invalid date/time format tags from locale data

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 01:32:21 +00:00
+								        '%s.',
-												add more possible occurences if invalid date/time format tags

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 18:56:47 +00:00
+								        '.%s',
-												remove invalid date/time format tags from locale data

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 01:32:21 +00:00
+								        '%s-',
-												add more possible occurences if invalid date/time format tags

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 18:56:47 +00:00
+								        '-%s',
 								        '(%s)',
-												handle all invalid cases in genlocale date/time formatter

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 00:50:49 +00:00
+								        "('%s')",
 								        '%s ',
 								        ' %s',
-												remove invalid date/time format tags from locale data

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 01:32:21 +00:00
+								        '%s',
 								    ]
 								    result = fromformat
 								    for tag in unsupportedtags:
 								        uppertag = tag.upper()
-												replace longest matches date/time tags first in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 10:57:58 +00:00
+								        for occurence in possibleoccurences:
 								            result = result.replace(occurence % (tag * 4), '')
 								            result = result.replace(occurence % (tag * 3), '')
 								            result = result.replace(occurence % (tag * 2), '')
 								            result = result.replace(occurence % tag, '')
 								            result = result.replace(occurence % (uppertag * 4), '')
 								            result = result.replace(occurence % (uppertag * 3), '')
 								            result = result.replace(occurence % (uppertag * 2), '')
 								            result = result.replace(occurence % uppertag, '')
-												ensure genlocale date/time formatter does not produce incorrect results

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 12:11:23 +00:00
+								    for key in replacementregex.keys():
 								        result = re.sub(key, replacementregex[key], result)
-												handle all invalid cases in genlocale date/time formatter

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 00:50:49 +00:00
+								    for key in replacementtags.keys():
 								        result = result.replace(key, replacementtags[key])
-												remove invalid date/time format tags from locale data

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 01:32:21 +00:00
+								    return result
-												make zero symbol uint and regenerate locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 20:31:26 +00:00
+								def tomonthslist(fromxmlelements, initialvalues):
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    result = []
 								    listcopy(initialvalues, result)
 								    for month in fromxmlelements:
 								        monthtype = month.get('type')
 								        if monthtype == '1':
 								            result[0] = month.text
 								        elif monthtype == '2':
 								            result[1] = month.text
 								        elif monthtype == '3':
 								            result[2] = month.text
 								        elif monthtype == '4':
 								            result[3] = month.text
 								        elif monthtype == '5':
 								            result[4] = month.text
 								        elif monthtype == '6':
 								            result[5] = month.text
 								        elif monthtype == '7':
 								            result[6] = month.text
 								        elif monthtype == '8':
 								            result[7] = month.text
 								        elif monthtype == '9':
 								            result[8] = month.text
 								        elif monthtype == '10':
 								            result[9] = month.text
 								        elif monthtype == '11':
 								            result[10] = month.text
 								        elif monthtype == '12':
 								            result[11] = month.text
-												error out on unknown month/day from genlocale script [ci skip]

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 20:27:33 +00:00
+								        else:
 								            print('Unknown month: %s' % monthtype)
 								            sys.exit(1)
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    return result
 								def todayslist(fromxmlelements, initialvalues):
 								    result = []
 								    listcopy(initialvalues, result)
 								    for day in fromxmlelements:
 								        daytype = day.get('type')
-												make monday first day in the locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 11:46:53 +00:00
+								        if daytype == 'mon':
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								            result[0] = day.text
 								        elif daytype == 'tue':
-												make monday first day in the locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 11:46:53 +00:00
+								            result[1] = day.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        elif daytype == 'wed':
-												make monday first day in the locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 11:46:53 +00:00
+								            result[2] = day.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        elif daytype == 'thu':
-												make monday first day in the locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 11:46:53 +00:00
+								            result[3] = day.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        elif daytype == 'fri':
-												make monday first day in the locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 11:46:53 +00:00
+								            result[4] = day.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        elif daytype == 'sat':
-												make monday first day in the locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 11:46:53 +00:00
+								            result[5] = day.text
 								        elif daytype == 'sun':
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								            result[6] = day.text
-												error out on unknown month/day from genlocale script [ci skip]

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 20:27:33 +00:00
+								        else:
 								            print('Unknown day: %s' % daytype)
 								            sys.exit(1)
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    return result
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								def tolanguageenum(fromstring):
 								    for key in languagemap.keys():
 								        if fromstring == languagemap[key]['code']:
 								            return 'QLocale::Language::%s' % key
 								    # print('Unknown language: %s' % fromstring)
 								    # sys.exit(1)
 								def toscriptenum(fromstring):
 								    for key in scriptmap.keys():
 								        if fromstring == scriptmap[key]['code']:
 								            return 'QLocale::Script::%s' % key
 								    # print('Unknown script: %s' % fromstring)
 								    # sys.exit(1)
 								def tocountryenum(fromstring):
 								    for key in countrymap.keys():
 								        if fromstring == countrymap[key]['code']:
 								            return 'QLocale::Country::%s' % key
 								    # print('Unknown country: %s' % fromstring)
 								    # sys.exit(1)
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
+								# printenum prints mapped values that have unique code only, the rest are set to the enum of the
 								# first occurence. the reason for doing so is because table lookups for figuring out language,
-												update CLDR to v35.1, generated data is the same

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-08 19:53:30 +00:00
+								# script and country required for constructing QLocale from string (named locales) relies on the
 								# fact that there is only one code for each, if that is not the case constructing copy of locale
 								# from its name will not copy it correctly. printtable skips duplicate code entries entirely
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								def printenum(frommap, prefix):
 								    keyscount = 0
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    aliascodes = []
 								    seencodes = []
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
+								    print('    enum %s {' % prefix)
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								    # print Default and C first
-												fix long day names mapping

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 11:26:06 +00:00
+								    for key in frommap.keys():
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								        if not key in ('Any%s' % prefix, 'C'):
 								            continue
 								        print('        %s = %d,' % (key, keyscount))
 								        keyscount += 1
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    # now everything except those, save last key for later
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								    lastkey = ''
 								    for key in sorted(frommap.keys()):
 								        if key in ('Any%s' % prefix, 'C'):
 								            continue
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								        code = frommap[key]['code']
 								        if code in seencodes:
 								            aliascodes.append(key)
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
+								            continue
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								        seencodes.append(code)
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								        print('        %s = %d,' % (key, keyscount))
 								        lastkey = key
 								        keyscount += 1
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
+								    # now aliases
 								    print('')
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    for alias in sorted(aliascodes):
 								        aliascode = frommap[alias]['code']
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
+								        aliasenum = None
 								        for key in sorted(frommap.keys()):
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								            code = frommap[key]['code']
 								            if aliascode == code:
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
+								                aliasenum == key
 								                break
 								        print('        %s = %s,' % (alias, key))
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								    # print last key
 								    print('\n        Last%s = %s' % (prefix, lastkey))
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
+								    print('    };\n')
-												update tables data to CLDR v36.1

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2020-03-19 21:36:11 +00:00
+								def printdoc(frommap, prefix):
 								    print('// %s' % prefix)
 								    for key in sorted(frommap.keys()):
 								        if key in ('Any%s' % prefix, 'C'):
 								            continue
 								        print('    \\value %s' % key)
 								    print('')
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								def printtable(frommap, prefix):
 								    lowerprefix = prefix.lower()
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    seencodes = []
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								    print('''static const struct %sTblData {
-												make enums first member of tables structs

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 11:37:22 +00:00
+								    const QLocale::%s %s;
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
+								    const char* name;
 								    const char* code;
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								} %sTbl[] = {''' % (lowerprefix, prefix, lowerprefix, lowerprefix))
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								    # print Default and C first
 								    for key in frommap.keys():
 								        if not key in ('Any%s' % prefix, 'C'):
 								            continue
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								        code = frommap[key]['code']
 								        name = frommap[key]['name']
-												make enums first member of tables structs

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 11:37:22 +00:00
+								        print('    { QLocale::%s::%s, %s, %s },' % (prefix, key, tochar(name), tochar(code)))
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
+								    # now everything except those but only unique code values
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								    for key in sorted(frommap.keys()):
 								        if key in ('Any%s' % prefix, 'C'):
 								            continue
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								        code = frommap[key]['code']
 								        if code in seencodes:
-												map duplicate language, script and country codes as aliases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 14:48:16 +00:00
+								            continue
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								        seencodes.append(code)
 								        name = frommap[key]['name']
-												make enums first member of tables structs

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 11:37:22 +00:00
+								        print('    { QLocale::%s::%s, %s, %s },' % (prefix, key, tochar(name), tochar(code)))
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
 								    print('};')
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    print('static const qint16 %sTblSize = sizeof(%sTbl) / sizeof(%sTblData);\n' % (lowerprefix, lowerprefix, lowerprefix))
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								def printlocaledata(frommap, key):
 								    value = frommap[key]
-												discard non-territory locale entries

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 14:09:10 +00:00
+								    # skip table entries without country (non-territory), unless it is artificial, this is done to
 								    # preserve the assumption in QLocalePrivate::findLocale that "AnyCountry" means "find me a
 								    # language, no matter what country it is spoken in" if "AnyCountry" is passed to it as argument
 								    # and also shrinks the table
-												locale data table should not have Default entry

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 19:26:34 +00:00
+								    if value['country'] == 'QLocale::Country::AnyCountry' and not key == 'C':
-												discard non-territory locale entries

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 14:09:10 +00:00
+								        return
-												update tables data to CLDR v43

hacks included

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2023-05-27 04:02:04 +03:00
+								    # HACK: skip table entries the language of which is unknown
-												update tables data to CLDR v44

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2024-03-13 22:23:10 +02:00
+								    if key == 'apc_SY' or key == 'skr_PK':
-												update tables data to CLDR v43

hacks included

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2023-05-27 04:02:04 +03:00
+								        return
-												genlocale script comment correction

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2023-05-27 05:44:57 +03:00
+								    # HACK: skip table entries with and without specifiec script
-												update tables data to CLDR v43

hacks included

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2023-05-27 04:02:04 +03:00
+								    if key == 'ha_Arab_NG':
 								        return
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    print('''    {
 								        %s, %s, %s,
 								        %s, %s, %s,
-												remove unused QLocale currency related methods and enum

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2022-06-10 23:18:59 +03:00
+								        %s, %s, %s, %s, %s, %s, %s, %s,
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        %s, %s, %s, %s,
 								        %s, %s,
 								        %s,
 								        %s,
 								        %s,
 								        %s,
 								        %s,
 								        %s,
 								        %s,
 								        %s,
 								        %s,
 								        %s,
 								        %s,
 								        %s
 								    }, // %s''' % (
 								            value['language'],
 								            value['script'],
 								            value['country'],
 								            value['first_day_of_week'],
 								            value['weekend_start'],
 								            value['weekend_end'],
-												make zero symbol uint and regenerate locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 20:31:26 +00:00
+								            touint(value['decimal']),
 								            touint(value['group']),
 								            touint(value['list']),
 								            touint(value['percent']),
 								            touint(value['minus']),
 								            touint(value['plus']),
 								            touint(value['exponential']),
 								            touint(value['zero']),
-												handle all invalid cases in genlocale date/time formatter

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 00:50:49 +00:00
+								            tochar(value['short_date_format']),
 								            tochar(value['long_date_format']),
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 18:23:29 +00:00
+								            tochar(value['short_time_format']),
 								            tochar(value['long_time_format']),
 								            tochar(value['am']),
 								            tochar(value['pm']),
 								            tochararray(value['standalone_short_month_names']),
 								            tochararray(value['standalone_long_month_names']),
 								            tochararray(value['standalone_narrow_month_names']),
 								            tochararray(value['short_month_names']),
 								            tochararray(value['long_month_names']),
 								            tochararray(value['narrow_month_names']),
 								            tochararray(value['standalone_short_day_names']),
 								            tochararray(value['standalone_long_day_names']),
 								            tochararray(value['standalone_narrow_day_names']),
 								            tochararray(value['short_day_names']),
 								            tochararray(value['long_day_names']),
 								            tochararray(value['narrow_day_names']),
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								            key,
 								        )
 								    )
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								def printaliastable(frommap, prefix):
 								    print('''static const struct %sAliasTblData {
-												assume locale BCP names use ASCII characters only

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2021-09-07 18:51:12 +03:00
+								    const char* original;
 								    const char* substitute;
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								} %sAliasTbl[] = {''' % (prefix, prefix))
 								    for key in sorted(frommap):
 								        # territories and scripts entries can contain multiple replacements, add one for each
 								        splitvalue = frommap[key].split(' ')
 								        for value in splitvalue:
-												assume locale BCP names use ASCII characters only

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2021-09-07 18:51:12 +03:00
+								            print('    { "%s", "%s" },' % (key, value))
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
 								    print('};')
 								    print('static const qint16 %sAliasTblSize = sizeof(%sAliasTbl) / sizeof(%sAliasTblData);\n' % (prefix, prefix, prefix))
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								# main maps
 								languagemap = {}
 								countrymap = {}
 								scriptmap = {}
 								localemap = {}
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								likelysubtagsmap = {}
-												implement language alias substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 17:39:01 +00:00
+								languagealiasmap = {}
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								countryaliasmap = {}
 								scriptaliasmap = {}
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								# cross-reference maps
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								localeparentmap = {}
 								localeparentvaluesmap = {}
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								localescriptmap = {}
 								localefirstdaymap = {}
-												correct weekend end parsing

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 16:33:01 +00:00
+								localeweekendstartmap = {}
 								localeweekendendmap = {}
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 11:27:12 +00:00
+								localenumberingmap = {}
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								# regular expressions
-												escape dash in regular expression in genlocale script [ci skip]

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2020-08-18 23:22:25 +03:00
+								localeregex = re.compile('([^_|\-|\.|@]+)+')
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												do not discard locale tables entries

it is required by QLocale::countriesForLanguage() for an example

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 18:28:49 +00:00
+								# artificial entries
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								languagemap['AnyLanguage'] = {
 								    'code': '',
 								    'name': 'Default',
 								}
 								languagemap['C'] = {
 								    'code': 'C',
 								    'name': 'C',
 								}
 								countrymap['AnyCountry'] = {
 								    'code': '',
 								    'name': 'Default',
 								}
 								scriptmap['AnyScript'] = {
 								    'code': '',
 								    'name': 'Default',
 								}
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								# locale to parent parsing
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								tree = ET.parse('common/supplemental/supplementalData.xml')
 								root = tree.getroot()
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								for parentlocale in root.findall('./parentLocales/parentLocale'):
 								    parentlocaleparent = parentlocale.get('parent')
 								    parentlocalelocales = parentlocale.get('locales')
 								    localeparentmap[parentlocaleparent] = parentlocalelocales.split(' ')
 								# locale to script parsing
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								# only languages with one primary script are mapped because if there are multiple it should be
 								# specified in the locale data, see:
 								# https://sites.google.com/site/cldr/development/updating-codes/update-language-script-info/language-script-description
-												implement language alias substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 17:39:01 +00:00
+								# secondary scripts are not taken into account at all
-												implement imperial table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 19:27:41 +00:00
+								for suppllanguage in root.findall('./languageData/language'):
 								    suppllanguagetype = suppllanguage.get('type')
 								    suppllanguagescripts = suppllanguage.get('scripts')
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    suppllanguagealt = suppllanguage.get('alt')
 								    if not suppllanguagescripts or suppllanguagealt == 'secondary':
-												slightly better locale to script mappings

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-08 21:41:52 +00:00
+								        # alternative entry, skip it
 								        continue
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    suppllanguagescriptslist = suppllanguagescripts.split(' ')
 								    if not len(suppllanguagescriptslist) == 1:
 								        # skip entries without definitive primary script
 								        continue
 								    suppllanguageterritories = suppllanguage.get('territories')
 								    if not suppllanguageterritories:
 								        # territories is optional, if not specified use artifical value to map all languages of
 								        # that type to the script
 								        suppllanguageterritories = 'AnyTerritory'
 								    localescriptmap[suppllanguagetype] = {
 								        'script': suppllanguagescripts,
 								        'territories': suppllanguageterritories.split(' '),
 								    }
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 18:23:29 +00:00
+								# locale to first day parsing
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								for firstday in root.findall('./weekData/firstDay'):
 								    firstdayday = firstday.get('day')
 								    firstdayterritories = firstday.get('territories')
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 18:23:29 +00:00
+								    localefirstdaymap[todayenum(firstdayday)] = stripxmltext(firstdayterritories).split(' ')
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												correct weekend end parsing

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 16:33:01 +00:00
+								# locale to weekend start parsing
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								for weekstart in root.findall('./weekData/weekendStart'):
 								    weekstartday = weekstart.get('day')
 								    weekstartterritories = weekstart.get('territories')
-												correct weekend end parsing

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 16:33:01 +00:00
+								    localeweekendstartmap[todayenum(weekstartday)] = stripxmltext(weekstartterritories).split(' ')
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												correct weekend end parsing

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 16:33:01 +00:00
+								# locale to weekend end parsing
 								for weekend in root.findall('./weekData/weekendEnd'):
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    weekendday = weekend.get('day')
 								    weekendterritories = weekend.get('territories')
-												correct weekend end parsing

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 16:33:01 +00:00
+								    localeweekendendmap[todayenum(weekendday)] = stripxmltext(weekendterritories).split(' ')
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 11:27:12 +00:00
+								# locale to numbering system parsing
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								tree = ET.parse('common/supplemental/numberingSystems.xml')
 								root = tree.getroot()
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 11:27:12 +00:00
+								for numberingsystem  in root.findall('./numberingSystems/numberingSystem'):
 								    numberingsystemid = numberingsystem.get('id')
 								    numberingsystemdigits = numberingsystem.get('digits')
 								    if numberingsystemdigits:
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        # either digits or rules is set
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 11:27:12 +00:00
+								        localenumberingmap[numberingsystemid] = stripxmltext(numberingsystemdigits)
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
 								# language parsing
 								tree = ET.parse('common/main/en.xml')
 								root = tree.getroot()
 								for language in root.findall('./localeDisplayNames/languages/language'):
 								    languagetype = language.get('type')
 								    normallanguage = normalizestring(language.text)
 								    if normallanguage in ('Nauru', 'Tokelau', 'Tuvalu'):
-												implement language alias substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 17:39:01 +00:00
+								        # country and language are the same, suffix to solve enum clashes
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        normallanguage = '%sLanguage' % normallanguage
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    languagemap[normallanguage] = {
 								        'code': languagetype,
 								        'name': language.text,
 								    }
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												add --printenums option to genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 13:53:57 +00:00
+								if printenumsandexit:
 								    printenum(languagemap, 'Language')
-												update tables data to CLDR v36.1

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2020-03-19 21:36:11 +00:00
+								elif printdocsandexit:
 								    printdoc(languagemap, 'Language')
-												add --printenums option to genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 13:53:57 +00:00
+								else:
 								    printtable(languagemap, 'Language')
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
 								# country parsing
 								for country in root.findall('./localeDisplayNames/territories/territory'):
 								    countrytype = country.get('type')
 								    normalcountry = normalizestring(country.text)
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    countrymap[normalcountry] = {
 								        'code': countrytype,
 								        'name': country.text,
 								    }
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												add --printenums option to genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 13:53:57 +00:00
+								if printenumsandexit:
 								    printenum(countrymap, 'Country')
-												update tables data to CLDR v36.1

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2020-03-19 21:36:11 +00:00
+								elif printdocsandexit:
 								    printdoc(countrymap, 'Country')
-												add --printenums option to genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 13:53:57 +00:00
+								else:
 								    printtable(countrymap, 'Country')
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
 								# scripts parsing
 								for script in root.findall('./localeDisplayNames/scripts/script'):
 								    scripttype = script.get('type')
 								    normalscript = normalizestring(script.text)
 								    if not normalscript.endswith('Script'):
 								        # suffix script if needed
 								        normalscript = '%sScript' % normalscript
 								    if normalscript in ('UnknownScript', 'CommonScript'):
 								        # only interested in specific scripts
 								        continue
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    scriptmap[normalscript] = {
 								        'code': scripttype,
 								        'name': script.text,
 								    }
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												add --printenums option to genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 13:53:57 +00:00
+								if printenumsandexit:
 								    printenum(scriptmap, 'Script')
 								    sys.exit(0)
-												update tables data to CLDR v36.1

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2020-03-19 21:36:11 +00:00
+								elif printdocsandexit:
 								    printdoc(scriptmap, 'Script')
 								    sys.exit(0)
-												add --printenums option to genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 13:53:57 +00:00
+								else:
 								    printtable(scriptmap, 'Script')
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												locale data table should not have Default entry

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 19:26:34 +00:00
+								# these defaults are used as parent locales fallback, C uses them as actual values because root
 								# contains UTF-8 characters and for compatibility. for the rest defaults are set from root
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								localedefaults = {
 								    # enums
 								    'language': 'QLocale::Language::AnyLanguage',
 								    'script': 'QLocale::Script::AnyScript',
 								    'country': 'QLocale::Country::AnyCountry',
 								    'first_day_of_week': 'Qt::Monday',
 								    'weekend_start': 'Qt::Saturday',
 								    'weekend_end': 'Qt::Sunday',
 								    # characters
 								    'decimal': '.',
 								    'group': ',',
 								    'list': ';',
 								    'percent': '%',
 								    'zero': '0',
 								    'minus': '-',
 								    'plus': '+',
 								    'exponential': 'e', # default in CLDR is E
-												implement language alias substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 17:39:01 +00:00
+								    # strings
-												correct date/time format parsing and adjust some test cases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-08 11:21:20 +00:00
+								    'short_date_format': 'd MMM yyyy', # default in CLDR is y-MM-dd
-												remove invalid date/time format tags from locale data

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 01:32:21 +00:00
+								    'long_date_format': 'd MMMM yyyy',
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    'short_time_format': 'HH:mm:ss', # default in CLDR is HH:mm
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    'long_time_format': 'HH:mm:ss z',
 								    'am': 'AM',
 								    'pm': 'PM',
 								    # arrays
 								    'standalone_short_month_names': ['Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun', 'Jul', 'Aug', 'Sep', 'Oct', 'Nov', 'Dec'],
 								    'standalone_long_month_names': ['January', 'February', 'March', 'April', 'May', 'June', 'July', 'August', 'September', 'October', 'November', 'December'],
 								    'standalone_narrow_month_names': ['J', 'F', 'M', 'A', 'M', 'J', 'J', 'A', 'S', 'O', 'N', 'D'],
 								    'short_month_names': ['Jan', 'Feb', 'Mar', 'Apr', 'May', 'Jun', 'Jul', 'Aug', 'Sep', 'Oct', 'Nov', 'Dec'],
 								    'long_month_names':  ['January', 'February', 'March', 'April', 'May', 'June', 'July', 'August', 'September', 'October', 'November', 'December'],
 								    'narrow_month_names': ['1', '2', '3', '4', '5', '6', '7', '8', '9', '10', '11', '12'],
-												make monday first day in the locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-12 11:46:53 +00:00
+								    'standalone_short_day_names': ['Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun'],
 								    'standalone_long_day_names': ['Monday', 'Tuesday', 'Wednesday', 'Thursday', 'Friday', 'Saturday', 'Sunday'],
 								    'standalone_narrow_day_names': ['M', 'T', 'W', 'T', 'F', 'S', 'S'],
 								    'short_day_names': ['Mon', 'Tue', 'Wed', 'Thu', 'Fri', 'Sat', 'Sun'],
 								    'long_day_names': ['Monday', 'Tuesday', 'Wednesday', 'Thursday', 'Friday', 'Saturday', 'Sunday'],
 								    'narrow_day_names': ['1', '2', '3', '4', '5', '6', '7'],
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								}
-												revert back to non-root defaults for Default and C

for compatibility and because root uses UTF-8 characters for quotation for
an example

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 19:36:36 +00:00
+								# artificial entries
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								localemap['C'] = {}
-												revert back to non-root defaults for Default and C

for compatibility and because root uses UTF-8 characters for quotation for
an example

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 19:36:36 +00:00
+								mapcopy(localedefaults, localemap['C'])
 								localemap['C']['language'] = 'QLocale::Language::C'
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												use somewhat correct defaults only for parent locales

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 18:22:12 +00:00
+								# locales parsing
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								# TODO: accept only "contributed" or "approved" values
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								def readlocale(fromxml, tomap, isparent):
-												merge non-territory locales into territory ones in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 12:03:33 +00:00
+								    locale = os.path.basename(fromxml)
 								    locale = locale.replace('.xml', '')
 								    if '_' in fromxml:
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 22:08:29 +00:00
+								        # merge parent locales (non-territory) into the current one so that data can be read
-												merge non-territory locales into territory ones in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 12:03:33 +00:00
+								        # from them. they do not have territory and currency data is based on territory so
 								        # cross-reference is not possible without doing so
 								        localeparent = locale.split('_')[0]
 								        xmlparent = fromxml.replace(locale, localeparent)
 								        root = xmlmerge(fromxml, xmlparent)
 								    else:
 								        tree = ET.parse(fromxml)
 								        root = tree.getroot()
-												variant locales are not supported, yet

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 20:24:01 +00:00
 								    variant = root.find('./identity/variant')
 								    if variant is not None:
-												error out on unknown month/day from genlocale script [ci skip]

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 20:27:33 +00:00
+								        # TODO: variants are not supported by QLocale
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								        return
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
 								    language = root.find('./identity/language')
-												set defaults from main locale if territory is specified

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 19:47:38 +00:00
+								    langtype = language.get('type')
-												do not overwrite parent locale values with defaults

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:24:47 +00:00
+								    country = root.find('./identity/territory')
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    countrytype = None
-												slightly better locale to script mappings

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-08 21:41:52 +00:00
+								    scripttype = None
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 18:23:29 +00:00
+								    numbertype = 'latn' # CLDR default
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								    tomap[locale] = {}
-												use somewhat correct defaults only for parent locales

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 18:22:12 +00:00
+								    if isparent:
 								        mapcopy(localedefaults, tomap[locale])
 								    else:
 								        mapcopy(localeparentvaluesmap['root'], tomap[locale])
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
-												do not overwrite parent locale values with defaults

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:24:47 +00:00
+								    # set defaults from parent locale if territory is specified
-												set defaults from main locale if territory is specified

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 19:47:38 +00:00
+								    if country is not None:
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								        for parent in localeparentmap.keys():
-												do not overwrite parent locale values with defaults

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:24:47 +00:00
+								            if locale in localeparentmap[parent]:
-												update tables data to CLDR v43

hacks included

Signed-off-by: Ivailo Monev <xakepa10@gmail.com>

											
										
										
											2023-05-27 04:02:04 +03:00
+								                if not parent in localeparentvaluesmap.keys():
 								                    # reference to locale without data
 								                    continue
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                mapcopy(localeparentvaluesmap[parent], tomap[locale])
-												do not overwrite parent locale values with defaults

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:24:47 +00:00
+								    # then from main locale (non-territory) filling the blanks that even parent locales do not fill
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								    if not isparent:
-												do not overwrite parent locale values with defaults

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:24:47 +00:00
+								        mapmerge(localemap[langtype], tomap[locale], localedefaults)
-												set defaults from main locale if territory is specified

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 19:47:38 +00:00
-												make zero symbol uint and regenerate locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 20:31:26 +00:00
+								    # find the enums from mapped values
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								    tomap[locale]['language'] = tolanguageenum(langtype)
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								    if not isparent and country is not None:
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
+								        countrytype = country.get('type')
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								        tomap[locale]['country'] = tocountryenum(countrytype)
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    else:
 								        # territory often is not specified, use language code as fallback
 								        countrytype = langtype.upper()
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    # script is specified either in the locale or supplemental data
 								    script = root.find('./identity/script')
 								    if script is not None:
 								        scripttype = script.get('type')
 								    elif not isparent:
 								        # scripts map is partial, pick from what is mapped
 								        if langtype in localescriptmap.keys():
 								            scriptterritories = localescriptmap[langtype]['territories']
 								            if 'AnyTerritory' in scriptterritories \
 								                or countrytype in scriptterritories:
 								                scripttype = localescriptmap[langtype]['script']
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    defaultnumbersystem = root.find('./numbers/defaultNumberingSystem')
 								    if defaultnumbersystem is not None:
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 18:23:29 +00:00
+								        numbertype = defaultnumbersystem.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												implement imperial table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 19:27:41 +00:00
+								    # find values from supplemental maps
-												deal with TODO in genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 12:46:07 +00:00
+								    if not isparent and scripttype:
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								        tomap[locale]['script'] = toscriptenum(scripttype)
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								    for key in localefirstdaymap.keys():
 								        for countryvalue in localefirstdaymap[key]:
 								            if countryvalue == countrytype:
 								                tomap[locale]['first_day_of_week'] = key
 								                break
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								    for key in localeweekendstartmap.keys():
 								        for countryvalue in localeweekendstartmap[key]:
 								            if countryvalue == countrytype:
 								                tomap[locale]['weekend_start'] = key
 								                break
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								    for key in localeweekendendmap.keys():
 								        for countryvalue in localeweekendendmap[key]:
 								            if countryvalue == countrytype:
 								                tomap[locale]['weekend_end'] = key
 								                break
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 18:23:29 +00:00
+								    # find from locale data
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    for symbol in root.findall('./numbers/symbols'):
 								        symbolnumbersystem = symbol.get('numberSystem')
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 18:23:29 +00:00
+								        if not symbolnumbersystem == numbertype:
 								            # should be the locale numeric system
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
+								            continue
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        decimal = symbol.find('./decimal')
 								        if decimal is not None and len(decimal.text) == 1:
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								            tomap[locale]['decimal'] = decimal.text
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        group = symbol.find('./group')
 								        if group is not None and len(group.text) == 1:
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								            tomap[locale]['group'] = group.text
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        listdelimiter = symbol.find('./list')
 								        if listdelimiter is not None and len(listdelimiter.text) == 1:
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								            tomap[locale]['list'] = listdelimiter.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
 								        percent = symbol.find('./percentSign')
 								        if percent is not None and len(percent.text) == 1:
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								            tomap[locale]['percent'] = percent.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
 								        minus = symbol.find('./minusSign')
 								        if minus is not None and len(minus.text) == 1:
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								            tomap[locale]['minus'] = minus.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
 								        plus = symbol.find('./plusSign')
 								        if plus is not None and len(plus.text) == 1:
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								            tomap[locale]['plus'] = plus.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
 								        exponential = symbol.find('./exponential')
 								        if exponential is not None and len(exponential.text) == 1:
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								            tomap[locale]['exponential'] = exponential.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
-												make zero symbol uint and regenerate locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 20:31:26 +00:00
+								        # zero is from cross-reference numeric system map,
 								        # taking the first character works even for UTF-8 chars
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 11:27:12 +00:00
+								        tomap[locale]['zero'] = localenumberingmap[numbertype][0]
-												make zero symbol uint and regenerate locale table

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 20:31:26 +00:00
-												locale data table should not have Default entry

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 19:26:34 +00:00
+								        # locale numeric system was found, break
 								        break
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								    for calendar in root.findall('./dates/calendars/calendar'):
 								        calendartype = calendar.get('type')
 								        if not calendartype == 'gregorian':
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 11:27:12 +00:00
+								            # all values should be from gregorian calendar
-												rework genlocale script and remove assumptions about table entries length

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-02 14:07:55 +00:00
+								            continue
-												correct date/time format parsing and adjust some test cases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-08 11:21:20 +00:00
+								        for dateformat in calendar.findall('./dateFormats/dateFormatLength'):
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								            dateformattype = dateformat.get('type')
 								            if dateformattype == 'short':
 								                pattern = dateformat.find('./dateFormat/pattern')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                tomap[locale]['short_date_format'] = todatetimeformat(pattern.text)
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								            elif dateformattype == 'long':
 								                pattern = dateformat.find('./dateFormat/pattern')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                tomap[locale]['long_date_format'] = todatetimeformat(pattern.text)
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												correct date/time format parsing and adjust some test cases

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-08 11:21:20 +00:00
+								        for timeformat in calendar.findall('./timeFormats/timeFormatLength'):
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								            timeformattype = timeformat.get('type')
 								            if timeformattype == 'short':
 								                pattern = timeformat.find('./timeFormat/pattern')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                tomap[locale]['short_time_format'] = todatetimeformat(pattern.text)
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								            elif timeformattype == 'long':
 								                pattern = timeformat.find('./timeFormat/pattern')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                tomap[locale]['long_time_format'] = todatetimeformat(pattern.text)
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        for dayperiodwidth in calendar.findall('./dayPeriods/dayPeriodContext/dayPeriodWidth'):
 								            dayperiodwidthtype = dayperiodwidth.get('type')
 								            if not dayperiodwidthtype == 'wide':
-												minor genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-06 11:27:12 +00:00
+								                # all values should be in wide format
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								                continue
 								            for dayperiod in dayperiodwidth.findall('dayPeriod'):
 								                dayperiodtype = dayperiod.get('type')
 								                if dayperiodtype == 'am':
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                    tomap[locale]['am'] = dayperiod.text
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								                elif dayperiodtype == 'pm':
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                    tomap[locale]['pm'] = dayperiod.text
-												ground work for locale data update

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-01 18:08:02 +00:00
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        # month/day names
 								        for monthcontext in calendar.findall('./months/monthContext'):
 								            monthcontexttype = monthcontext.get('type')
 								            if monthcontexttype == 'stand-alone':
 								                for monthwidth in monthcontext.findall('./monthWidth'):
 								                    monthwidthtype = monthwidth.get('type')
 								                    if monthwidthtype == 'wide':
 								                        months = monthwidth.findall('./month')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['standalone_long_month_names'] = tomonthslist(months, tomap[locale]['standalone_long_month_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								                    elif monthwidthtype == 'abbreviated':
 								                        months = monthwidth.findall('./month')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['standalone_short_month_names'] = tomonthslist(months, tomap[locale]['standalone_short_month_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								                    elif monthwidthtype == 'narrow':
 								                        months = monthwidth.findall('./month')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['standalone_narrow_month_names'] = tomonthslist(months, tomap[locale]['standalone_narrow_month_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								            elif monthcontexttype == 'format':
 								                for monthwidth in monthcontext.findall('./monthWidth'):
 								                    monthwidthtype = monthwidth.get('type')
 								                    if monthwidthtype == 'wide':
 								                        months = monthwidth.findall('./month')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['long_month_names'] = tomonthslist(months, tomap[locale]['long_month_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								                    elif monthwidthtype == 'abbreviated':
 								                        months = monthwidth.findall('./month')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['short_month_names'] = tomonthslist(months, tomap[locale]['short_month_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								                    elif monthwidthtype == 'narrow':
 								                        months = monthwidth.findall('./month')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['narrow_month_names'] = tomonthslist(months, tomap[locale]['narrow_month_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
 								        for daycontext in calendar.findall('./days/dayContext'):
 								            daycontexttype = daycontext.get('type')
 								            if daycontexttype == 'stand-alone':
 								                for daywidth in daycontext.findall('./dayWidth'):
 								                    daywidthtype = daywidth.get('type')
 								                    if daywidthtype == 'wide':
 								                        days = daywidth.findall('./day')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['standalone_long_day_names'] = todayslist(days, tomap[locale]['standalone_long_day_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								                    elif daywidthtype == 'abbreviated':
 								                        days = daywidth.findall('./day')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['standalone_short_day_names'] = todayslist(days, tomap[locale]['standalone_short_day_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								                    elif daywidthtype == 'narrow':
 								                        days = daywidth.findall('./day')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['standalone_narrow_day_names'] = todayslist(days, tomap[locale]['standalone_narrow_day_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								            elif daycontexttype == 'format':
 								                for daywidth in daycontext.findall('./dayWidth'):
 								                    daywidthtype = daywidth.get('type')
 								                    if daywidthtype == 'wide':
 								                        days = daywidth.findall('./day')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['long_day_names'] = todayslist(days, tomap[locale]['long_day_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								                    elif daywidthtype == 'abbreviated':
 								                        days = daywidth.findall('./day')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['short_day_names'] = todayslist(days, tomap[locale]['short_day_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								                    elif daywidthtype == 'narrow':
 								                        days = daywidth.findall('./day')
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								                        tomap[locale]['narrow_day_names'] = todayslist(days, tomap[locale]['narrow_day_names'])
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
 								        # gregorian calendar was found, break
 								        break
 								    # month/day names are set during calendar parsing
-												parse parent locales from genlocale script

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-05 22:00:18 +00:00
+								# read parent locales first
 								for xml in glob.glob('common/main/*.xml'):
 								    xmlbase = os.path.basename(xml)
 								    xmlbase = xmlbase.replace('.xml', '')
 								    if not xmlbase in localeparentmap.keys():
 								        continue
 								    readlocale(xml, localeparentvaluesmap, True)
 								# now everything including those
 								for xml in sorted(glob.glob('common/main/*.xml')):
 								    if xml.endswith('/root.xml'):
 								        # root is not actual locale
 								        continue
 								    readlocale(xml, localemap, False)
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								print('''static const QLocalePrivate localeTbl[] = {''')
-												locale data table should not have Default entry

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 19:26:34 +00:00
+								# print C first
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								printlocaledata(localemap, 'C')
-												locale data table should not have Default entry

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 19:26:34 +00:00
+								# now everything except that
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								for key in sorted(localemap.keys()):
-												locale data table should not have Default entry

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-07 19:26:34 +00:00
+								    if key == 'C':
-												implement locales table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 15:56:53 +00:00
+								        continue
 								    printlocaledata(localemap, key)
 								print('};')
-												implement imperial table generator

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-04 19:27:41 +00:00
+								print('static const qint16 localeTblSize = sizeof(localeTbl) / sizeof(QLocalePrivate);\n')
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								# likely subtags parsing
 								tree = ET.parse('common/supplemental/likelySubtags.xml')
 								root = tree.getroot()
 								for likelysubtag in root.findall('./likelySubtags/likelySubtag'):
 								    likelysubtagfrom = likelysubtag.get('from')
 								    likelysubtagto = likelysubtag.get('to')
 								    # split code into language, script and country to make it possible to match against regardless
 								    # of separators and remap to enums so that it is possible to substitute both named and enumed
 								    # locale searches at the cost of not covering all named cases
 								    likelysubtagfromsplit = localeregex.findall(likelysubtagfrom)
 								    likelysubtagfromsplitlen = len(likelysubtagfromsplit)
 								    likelysubtagtosplit = localeregex.findall(likelysubtagto)
-												minr genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 13:32:58 +00:00
+								    likelysubtagtosplitlen = len(likelysubtagtosplit)
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								    likelyfromlanguage = None
 								    likelyfromscript = None
 								    likelyfromcountry = None
 								    if likelysubtagfromsplitlen == 1:
 								        likelyfromlanguage = tolanguageenum(likelysubtagfromsplit[0])
 								        likelyfromscript = 'QLocale::Script::AnyScript'
 								        likelyfromcountry = 'QLocale::Country::AnyCountry'
 								    elif likelysubtagfromsplitlen == 2:
 								        likelyfromlanguage = tolanguageenum(likelysubtagfromsplit[0])
 								        likelyfromscript = 'QLocale::Script::AnyScript'
 								        likelyfromcountry = tocountryenum(likelysubtagfromsplit[1])
 								    elif likelysubtagfromsplitlen == 3:
 								        likelyfromlanguage = tolanguageenum(likelysubtagfromsplit[0])
 								        likelyfromscript = toscriptenum(likelysubtagfromsplit[1])
 								        likelyfromcountry = tocountryenum(likelysubtagfromsplit[2])
-												minr genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 13:32:58 +00:00
+								    elif likelysubtagfromsplitlen > 3 or likelysubtagtosplitlen > 3:
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								        # the regular expression is intentionally greedy, if there are more than 3 group matches
 								        # then it is likely a variant and that is not supported case yet
 								        print(likelysubtagfrom, likelysubtagfromsplit)
-												minr genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 13:32:58 +00:00
+								        print(likelysubtagto, likelysubtagtosplit)
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								        sys.exit(1)
 								    likelytolanguage = tolanguageenum(likelysubtagtosplit[0])
 								    likelytoscript = toscriptenum(likelysubtagtosplit[1])
 								    likelytocountry = tocountryenum(likelysubtagtosplit[2])
 								    if not likelyfromlanguage or not likelyfromscript or not likelyfromcountry \
 								        or not likelytolanguage or not likelytoscript or not likelytocountry:
 								        # if there are no enums for the codes skip the entry
 								        continue
 								    likelysubtagsmap[likelysubtagfrom] = {
 								        'fromlanguage' : likelyfromlanguage,
 								        'fromscript' : likelyfromscript,
 								        'fromcountry' : likelyfromcountry,
 								        'tolanguage' : likelytolanguage,
 								        'toscript' : likelytoscript,
 								        'tocountry' : likelytocountry,
 								    }
 								print('''static const struct subtagAliasTblData {
 								    const QLocale::Language fromlanguage;
 								    const QLocale::Script fromscript;
 								    const QLocale::Country fromcountry;
 								    const QLocale::Language tolanguage;
 								    const QLocale::Script toscript;
 								    const QLocale::Country tocountry;
 								} subtagAliasTbl[] = {''')
 								for key in sorted(likelysubtagsmap):
 								    value = likelysubtagsmap[key]
 								    print('''    {
 								        %s, %s, %s,
 								        %s, %s, %s
 								    },''' % (
 								            value['fromlanguage'],
 								            value['fromscript'],
 								            value['fromcountry'],
 								            value['tolanguage'],
 								            value['toscript'],
 								            value['tocountry'],
 								        )
 								    )
 								print('};')
 								print('static const qint16 subtagAliasTblSize = sizeof(subtagAliasTbl) / sizeof(subtagAliasTblData);\n')
-												implement language alias substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 17:39:01 +00:00
+								# language alias parsing
 								tree = ET.parse('common/supplemental/supplementalMetadata.xml')
 								root = tree.getroot()
 								for languagealias in root.findall('./metadata/alias/languageAlias'):
 								    languagealiastype = languagealias.get('type')
 								    languagealiasreplacement = languagealias.get('replacement')
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								    if '_' in languagealiastype or '-' in languagealiastype \
 								        or '_' in languagealiasreplacement or '-' in languagealiasreplacement:
-												minr genlocale script review

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-11 13:32:58 +00:00
+								        # if either the original or the substitute is BCP47 code (language and script/country
 								        # included) skip it because QLocalePrivate::codeToLanguage() should be dealing with
 								        # language codes only
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								        continue
-												implement language alias substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 17:39:01 +00:00
+								    languagealiasmap[languagealiastype] = languagealiasreplacement
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								printaliastable(languagealiasmap, 'language')
-												implement language alias substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 17:39:01 +00:00
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								# country alias parsing
 								for territoryalias in root.findall('./metadata/alias/territoryAlias'):
 								    territoryaliastype = territoryalias.get('type')
 								    territoryaliasreplacement = territoryalias.get('replacement')
 								    countryaliasmap[territoryaliastype] = territoryaliasreplacement
-												implement language alias substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-09 17:39:01 +00:00
-												implement subtag, script and country substitution

Signed-off-by: Ivailo Monev <xakepa10@laimg.moc>

											
										
										
											2019-08-10 19:15:18 +00:00
+								printaliastable(countryaliasmap, 'country')
 								# script alias parsing
 								for scriptalias in root.findall('./metadata/alias/scriptAlias'):
 								    scriptaliastype = scriptalias.get('type')
 								    scriptaliasreplacement = scriptalias.get('replacement')
 								    scriptaliasmap[scriptaliastype] = scriptaliasreplacement
 								printaliastable(scriptaliasmap, 'script')