You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
59 lines
1.7 KiB
59 lines
1.7 KiB
4 years ago
|
# vim:ts=4 sw=4 expandtab softtabstop=4
|
||
|
from __future__ import print_function
|
||
|
import argparse
|
||
|
import locale
|
||
|
import os
|
||
|
import sys
|
||
|
|
||
|
from unidecode import unidecode
|
||
|
|
||
|
PY3 = sys.version_info[0] >= 3
|
||
|
|
||
|
def fatal(msg):
|
||
|
sys.stderr.write(msg + "\n")
|
||
|
sys.exit(1)
|
||
|
|
||
|
def main():
|
||
|
default_encoding = locale.getpreferredencoding()
|
||
|
|
||
|
parser = argparse.ArgumentParser(
|
||
|
description="Transliterate Unicode text into ASCII. FILE is path to file to transliterate. "
|
||
|
"Standard input is used if FILE is omitted and -c is not specified.")
|
||
|
parser.add_argument('-e', '--encoding', metavar='ENCODING', default=default_encoding,
|
||
|
help='Specify an encoding (default is %s)' % (default_encoding,))
|
||
|
parser.add_argument('-c', metavar='TEXT', dest='text',
|
||
|
help='Transliterate TEXT instead of FILE')
|
||
|
parser.add_argument('path', nargs='?', metavar='FILE')
|
||
|
|
||
|
args = parser.parse_args()
|
||
|
|
||
|
encoding = args.encoding
|
||
|
|
||
|
if args.path:
|
||
|
if args.text:
|
||
|
fatal("Can't use both FILE and -c option")
|
||
|
else:
|
||
|
with open(args.path, 'rb') as f:
|
||
|
stream = f.read()
|
||
|
elif args.text:
|
||
|
if PY3:
|
||
|
stream = os.fsencode(args.text)
|
||
|
else:
|
||
|
stream = args.text
|
||
|
# add a newline to the string if it comes from the
|
||
|
# command line so that the result is printed nicely
|
||
|
# on the console.
|
||
|
stream += b'\n'
|
||
|
else:
|
||
|
if PY3:
|
||
|
stream = sys.stdin.buffer.read()
|
||
|
else:
|
||
|
stream = sys.stdin.read()
|
||
|
|
||
|
try:
|
||
|
stream = stream.decode(encoding)
|
||
|
except UnicodeDecodeError as e:
|
||
|
fatal('Unable to decode input: %s, start: %d, end: %d' % (e.reason, e.start, e.end))
|
||
|
|
||
|
sys.stdout.write(unidecode(stream))
|