bazarr/libs/unidecode/util.py

52 lines
1.6 KiB
Python
Raw Normal View History

# vim:ts=4 sw=4 expandtab softtabstop=4
import argparse
import io
import locale
import os
import sys
from unidecode import unidecode
def fatal(msg):
sys.stderr.write(msg + "\n")
sys.exit(1)
def main():
default_encoding = locale.getpreferredencoding()
parser = argparse.ArgumentParser(
description="Transliterate Unicode text into ASCII. FILE is path to file to transliterate. "
"Standard input is used if FILE is omitted and -c is not specified.")
parser.add_argument('-e', '--encoding', metavar='ENCODING', default=default_encoding,
help='Specify an encoding (default is %s)' % (default_encoding,))
parser.add_argument('-c', metavar='TEXT', dest='text',
help='Transliterate TEXT instead of FILE')
parser.add_argument('path', nargs='?', metavar='FILE')
args = parser.parse_args()
encoding = args.encoding
if args.path:
if args.text:
fatal("Can't use both FILE and -c option")
else:
stream = open(args.path, 'rb')
elif args.text:
text = os.fsencode(args.text)
# add a newline to the string if it comes from the
# command line so that the result is printed nicely
# on the console.
stream = io.BytesIO(text + b'\n')
else:
stream = sys.stdin.buffer
for line_nr, line in enumerate(stream):
try:
line = line.decode(encoding)
except UnicodeDecodeError as e:
fatal('Unable to decode input line %s: %s, start: %d, end: %d' % (line_nr, e.reason, e.start, e.end))
sys.stdout.write(unidecode(line))
stream.close()