| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268 | #!/usr/bin/env python3## Version 1.0.1############################################################################### Change log:#  7 May  2019, Ondrej Tuma, Initial#  9 June 2020, 3d-gussner, Added version and Change log#  9 June 2020, 3d-gussner, Wrap text to 20 char and rows#  9 June 2020, 3d-gussner, colored output#  2 Apr. 2021, 3d-gussner, Fix and improve text warp# 22 Apr. 2021, DRracer   , add English source to output# 23 Apr. 2021, wavexx    , improve# 24 Apr. 2021, wavexx    , improve# 26 Apr. 2021, 3d-gussner, add character ruler##############################################################################"""Check lang files."""from argparse import ArgumentParserfrom traceback import print_excfrom sys import stdout, stderrimport textwrapimport redef color_maybe(color_attr, text):    if stdout.isatty():        return '\033[0;' + str(color_attr) + 'm' + text + '\033[0m'    else:        return textred = lambda text: color_maybe(31, text)green = lambda text: color_maybe(32, text)yellow = lambda text: color_maybe(33, text)cyan = lambda text: color_maybe(36, text)def print_wrapped(wrapped_text, rows, cols):    if type(wrapped_text) == str:        wrapped_text = [wrapped_text]    for r, line in enumerate(wrapped_text):        r_ = str(r + 1).rjust(3)        if r >= rows:            r_ = red(r_)        print((' {} |{:' + str(cols) + 's}|').format(r_, line))def print_truncated(text, cols):    if len(text) <= cols:        prefix = text.ljust(cols)        suffix = ''    else:        prefix = text[0:cols]        suffix = red(text[cols:])    print('   |' + prefix + '|' + suffix)def print_ruler(spc, cols):    print(' ' * spc + cyan(('₀₁₂₃₄₅₆₇₈₉'*4)[:cols]))def print_source_translation(source, translation, wrapped_source, wrapped_translation, rows, cols):    if rows == 1:        print(' source text:')        print_ruler(4, cols);        print_truncated(source, cols)        print(' translated text:')        print_ruler(4, cols);        print_truncated(translation, cols)    else:        print(' source text:')        print_ruler(6, cols);        print_wrapped(wrapped_source, rows, cols)        print(' translated text:')        print_ruler(6, cols);        print_wrapped(wrapped_translation, rows, cols)    print()def highlight_trailing_white(text):    if type(text) == str:        return re.sub(r' $', '·', text)    else:        ret = text[:]        ret[-1] = highlight_trailing_white(ret[-1])        return retdef wrap_text(text, cols):    # wrap text    ret = list(textwrap.TextWrapper(width=cols).wrap(text))    if len(ret):        # add back trailing whitespace        ret[-1] += ' ' * (len(text) - len(text.rstrip()))    return retdef unescape(text):    if '\\' not in text:        return text    return text.encode('ascii').decode('unicode_escape')def ign_char_first(c):    return c.isalnum() or c in {'%', '?'}def ign_char_last(c):    return c.isalnum() or c in {'.', "'"}def parse_txt(lang, no_warning, warn_empty):    """Parse txt file and check strings to display definition."""    if lang == "en":        file_path = "lang_en.txt"    else:        file_path = "lang_en_%s.txt" % lang    print(green("Start %s lang-check" % lang))    lines = 1    with open(file_path) as src:        while True:            comment = src.readline().split(' ')            #print (comment) #Debug            #Check if columns and rows are defined            cols = None            rows = None            for item in comment[1:]:                key, val = item.split('=')                if key == 'c':                    cols = int(val)                    #print ("c=",cols) #Debug                elif key == 'r':                    rows = int(val)                    #print ("r=",rows) #Debug                else:                    raise RuntimeError(                        "Unknown display definition %s on line %d" %                        (' '.join(comment), lines))            if cols is None and rows is None:                if not no_warning:                    print(yellow("[W]: No display definition on line %d" % lines))                cols = len(translation)     # propably fullscreen            if rows is None:                rows = 1            elif rows > 1 and cols != 20:                print(yellow("[W]: Multiple rows with odd number of columns on line %d" % lines))            #Wrap text to 20 chars and rows            source = src.readline()[:-1].strip('"')            #print (source) #Debug            translation = src.readline()[:-1].strip('"')            if translation == '\\x00':                # crude hack to handle intentionally-empty translations                translation = ''            # handle backslash sequences            source = unescape(source)            translation = unescape(translation)            #print (translation) #Debug            wrapped_source = wrap_text(source, cols)            rows_count_source = len(wrapped_source)            wrapped_translation = wrap_text(translation, cols)            rows_count_translation = len(wrapped_translation)            # Check for potential errors in the definition            if not no_warning:                # Incorrect number of rows/cols on the definition                if rows == 1 and (len(source) > cols or rows_count_source > rows):                    print(yellow('[W]: Source text longer than %d cols as defined on line %d:' % (cols, lines)))                    print_ruler(4, cols);                    print_truncated(source, cols)                    print()                elif rows_count_source > rows:                    print(yellow('[W]: Wrapped source text longer than %d rows as defined on line %d:' % (rows, lines)))                    print_ruler(6, cols);                    print_wrapped(wrapped_source, rows, cols)                    print()                # Missing translation                if len(translation) == 0 and (warn_empty or rows > 1):                    if rows == 1:                        print(yellow("[W]: Empty translation for \"%s\" on line %d" % (source, lines)))                    else:                        print(yellow("[W]: Empty translation on line %d" % lines))                        print_ruler(6, cols);                        print_wrapped(wrapped_source, rows, cols)                        print()            # Check for translation lenght            if (rows_count_translation > rows) or (rows == 1 and len(translation) > cols):                print(red('[E]: Text is longer than definition on line %d: cols=%d rows=%d (rows diff=%d)'                          % (lines, cols, rows, rows_count_translation-rows)))                print_source_translation(source, translation,                                         wrapped_source, wrapped_translation,                                         rows, cols)            # Different count of % sequences            if source.count('%') != translation.count('%') and len(translation) > 0:                print(red('[E]: Unequal count of %% escapes on line %d:' % (lines)))                print_source_translation(source, translation,                                         wrapped_source, wrapped_translation,                                         rows, cols)            # Different first/last character            if not no_warning and len(source) > 0 and len(translation) > 0:                source_end = source.rstrip()[-1]                translation_end = translation.rstrip()[-1]                start_diff = not (ign_char_first(source[0]) and ign_char_first(translation[0])) and source[0] != translation[0]                end_diff = not (ign_char_last(source_end) and ign_char_last(translation_end)) and source_end != translation_end                if start_diff or end_diff:                    if start_diff:                        print(yellow('[W]: Differing first punctuation character (%s => %s) on line %d:' % (source[0], translation[0], lines)))                    if end_diff:                        print(yellow('[W]: Differing last punctuation character (%s => %s) on line %d:' % (source[-1], translation[-1], lines)))                    print_source_translation(source, translation,                                             wrapped_source, wrapped_translation,                                             rows, cols)            # Short translation            if not no_warning and len(source) > 0 and len(translation) > 0:                if len(translation.rstrip()) < len(source.rstrip()) / 2:                    print(yellow('[W]: Short translation on line %d:' % (lines)))                    print_source_translation(source, translation,                                             wrapped_source, wrapped_translation,                                             rows, cols)            # Incorrect trailing whitespace in translation            if not no_warning and len(translation) > 0 and \               (source.rstrip() == source or (rows == 1 and len(source) == cols)) and \               translation.rstrip() != translation and \               (rows > 1 or len(translation) != len(source)):                print(yellow('[W]: Incorrect trailing whitespace for translation on line %d:' % (lines)))                source = highlight_trailing_white(source)                translation = highlight_trailing_white(translation)                wrapped_translation = highlight_trailing_white(wrapped_translation)                print_source_translation(source, translation,                                         wrapped_source, wrapped_translation,                                         rows, cols)            if len(src.readline()) != 1:  # empty line                break            lines += 4    print(green("End %s lang-check" % lang))def main():    """Main function."""    parser = ArgumentParser(        description=__doc__,        usage="%(prog)s lang")    parser.add_argument(        "lang", nargs='?', default="en", type=str,        help="Check lang file (en|cs|de|es|fr|nl|it|pl)")    parser.add_argument(        "--no-warning", action="store_true",        help="Disable warnings")    parser.add_argument(        "--warn-empty", action="store_true",        help="Warn about empty translations")    args = parser.parse_args()    try:        parse_txt(args.lang, args.no_warning, args.warn_empty)        return 0    except Exception as exc:        print_exc()        parser.error("%s" % exc)        return 1if __name__ == "__main__":    exit(main())
 |