You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
|
|
|
#!/usr/bin/env python3
|
|
|
|
# encoding: utf-8
|
|
|
|
# Copyright 2017 Johns Hopkins University (Shinji Watanabe)
|
|
|
|
# Apache 2.0 (http://www.apache.org/licenses/LICENSE-2.0)
|
|
|
|
from __future__ import print_function
|
|
|
|
from __future__ import unicode_literals
|
|
|
|
|
|
|
|
import argparse
|
|
|
|
import codecs
|
|
|
|
import json
|
|
|
|
import sys
|
|
|
|
|
|
|
|
is_python2 = sys.version_info[0] == 2
|
|
|
|
|
|
|
|
|
|
|
|
def get_parser():
|
|
|
|
parser = argparse.ArgumentParser(
|
|
|
|
description="convert scp to json",
|
|
|
|
formatter_class=argparse.ArgumentDefaultsHelpFormatter, )
|
|
|
|
parser.add_argument("--key", "-k", type=str, help="key")
|
|
|
|
return parser
|
|
|
|
|
|
|
|
|
|
|
|
if __name__ == "__main__":
|
|
|
|
parser = get_parser()
|
|
|
|
args = parser.parse_args()
|
|
|
|
|
|
|
|
new_line = {}
|
|
|
|
sys.stdin = codecs.getreader("utf-8")(sys.stdin
|
|
|
|
if is_python2 else sys.stdin.buffer)
|
|
|
|
sys.stdout = codecs.getwriter("utf-8")(sys.stdout
|
|
|
|
if is_python2 else sys.stdout.buffer)
|
|
|
|
line = sys.stdin.readline()
|
|
|
|
while line:
|
|
|
|
x = line.rstrip().split()
|
|
|
|
v = {args.key: " ".join(x[1:])}
|
|
|
|
new_line[x[0]] = v
|
|
|
|
line = sys.stdin.readline()
|
|
|
|
|
|
|
|
all_l = {"utts": new_line}
|
|
|
|
|
|
|
|
# ensure "ensure_ascii=False", which is a bug
|
|
|
|
jsonstring = json.dumps(
|
|
|
|
all_l,
|
|
|
|
indent=4,
|
|
|
|
ensure_ascii=False,
|
|
|
|
sort_keys=True,
|
|
|
|
separators=(",", ": "))
|
|
|
|
print(jsonstring)
|