You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
52 lines
1.6 KiB
52 lines
1.6 KiB
1 year ago
|
# vim:ts=4 sw=4 expandtab softtabstop=4
|
||
|
import argparse
|
||
|
import io
|
||
|
import locale
|
||
|
import os
|
||
|
import sys
|
||
|
|
||
|
from unidecode import unidecode
|
||
|
|
||
|
def fatal(msg):
    """Report an unrecoverable error and terminate the program.

    Writes ``msg`` followed by a newline to standard error, then exits
    with status code 1.

    Args:
        msg: Text of the error message (without a trailing newline).

    Raises:
        SystemExit: Always, with exit code 1.
    """
    sys.stderr.write(msg + "\n")
    sys.exit(1)
|
||
|
|
||
|
def main():
    """Command-line entry point: transliterate Unicode input into ASCII.

    Input is taken from exactly one of three places, in this order of
    precedence: the positional FILE argument, the TEXT given with ``-c``,
    or standard input. It is read as bytes, decoded line by line with the
    encoding given by ``-e``/``--encoding`` (default: the locale's
    preferred encoding), passed through ``unidecode`` and written to
    standard output.

    Exits via ``fatal`` (status 1) when both FILE and ``-c`` are given, or
    when a line cannot be decoded with the selected encoding.
    """
    default_encoding = locale.getpreferredencoding()

    parser = argparse.ArgumentParser(
        description="Transliterate Unicode text into ASCII. FILE is path to file to transliterate. "
                    "Standard input is used if FILE is omitted and -c is not specified.")
    parser.add_argument('-e', '--encoding', metavar='ENCODING', default=default_encoding,
                        help='Specify an encoding (default is %s)' % (default_encoding,))
    parser.add_argument('-c', metavar='TEXT', dest='text',
                        help='Transliterate TEXT instead of FILE')
    parser.add_argument('path', nargs='?', metavar='FILE')

    args = parser.parse_args()

    encoding = args.encoding

    # Compare against None rather than relying on truthiness: `-c ''` is
    # still "-c specified" and must not silently fall back to reading stdin.
    has_text = args.text is not None

    if args.path:
        if has_text:
            fatal("Can't use both FILE and -c option")
        stream = open(args.path, 'rb')
    elif has_text:
        text = os.fsencode(args.text)
        # add a newline to the string if it comes from the
        # command line so that the result is printed nicely
        # on the console.
        stream = io.BytesIO(text + b'\n')
    else:
        stream = sys.stdin.buffer

    # try/finally so the stream is closed even when fatal() raises
    # SystemExit in the middle of the loop.
    try:
        # line_nr is zero-based, as produced by enumerate().
        for line_nr, line in enumerate(stream):
            try:
                line = line.decode(encoding)
            except UnicodeDecodeError as e:
                fatal('Unable to decode input line %s: %s, start: %d, end: %d' % (line_nr, e.reason, e.start, e.end))

            sys.stdout.write(unidecode(line))
    finally:
        stream.close()
|