Source code for scripts.normalize

import argparse
import os

from ucca.ioutil import get_passages_with_progress_bar, write_passage
from ucca.normalization import normalize


[docs]def main(args): if args.outdir: os.makedirs(args.outdir, exist_ok=True) for p in get_passages_with_progress_bar(args.filenames, desc="Normalizing", converters={}): normalize(p, extra=args.extra) write_passage(p, outdir=args.outdir, prefix=args.prefix, binary=args.binary, verbose=False)
if __name__ == "__main__": argparser = argparse.ArgumentParser(description="Normalize UCCA passages") argparser.add_argument("filenames", nargs="+", help="files or directories to normalize") argparser.add_argument("-o", "--outdir", default=".", help="output directory") argparser.add_argument("-p", "--prefix", default="", help="output filename prefix") argparser.add_argument("-b", "--binary", action="store_true", help="write in pickle binary format (.pickle)") argparser.add_argument("-e", "--extra", action="store_true", help="extra normalization rules") main(argparser.parse_args())