Example #1
0
# Positional argument: one or more corpus files.  The description belongs in
# ``help``; assuming ``parser`` follows argparse semantics, a ``default`` is
# never applied to a positional with nargs="+" because at least one value is
# required, so it is dropped here.
parser.add_argument(
    "corpus",
    nargs="+",
    help="parallel text corpus"
    )


parser.add_argument(
    "-V", "--verbose",
    action="store_true",
    help="verbose output"
    )


args = parser.parse_args()

if args.verbose:
    # Use write() instead of the Python 2-only ``print >>stream`` form so the
    # same message is emitted under both Python 2 and Python 3.
    stderr.write("Reading corpus from %s\n" % (args.corpus,))

# NOTE(review): nargs="+" makes args.corpus a list of paths, and that list is
# passed unchanged as ``file`` -- confirm HitaextDoc accepts a list, or
# whether a single corpus path was intended.
corpus = HitaextDoc(file=args.corpus)

# Fetch the "from" and "to" document trees of the corpus.
from_tree = corpus.get_doc_tree("from")
to_tree = corpus.get_doc_tree("to")

from_tree.update()
to_tree.update()

corpus.inject_alignments(from_tree, to_tree)

# Record "id" as the value of the alignment's "method" setting.
corpus.alignment.set("method", "id")
Example #2
0
# ``stderr`` is used by the --verbose message below but was not imported in
# the visible script; importing it here avoids a NameError.
from sys import stderr

from daeso.utils.cli import ArgumentParser
from daeso.ptc.document import HitaextDoc

parser = ArgumentParser(description=__doc__)

# Positional argument: one or more corpus files.  The description belongs in
# ``help``; assuming ArgumentParser follows argparse semantics, a ``default``
# is never applied to a positional with nargs="+" because at least one value
# is required, so it is dropped here.
parser.add_argument("corpus",
                    nargs="+",
                    help="parallel text corpus")

parser.add_argument("-V",
                    "--verbose",
                    action="store_true",
                    help="verbose output")

args = parser.parse_args()

if args.verbose:
    # Use write() instead of the Python 2-only ``print >> stream`` form so the
    # same message is emitted under both Python 2 and Python 3.
    stderr.write("Reading corpus from %s\n" % (args.corpus,))

# NOTE(review): nargs="+" makes args.corpus a list of paths, and that list is
# passed unchanged as ``file`` -- confirm HitaextDoc accepts a list, or
# whether a single corpus path was intended.
corpus = HitaextDoc(file=args.corpus)

# Fetch the "from" and "to" document trees of the corpus.
from_tree = corpus.get_doc_tree("from")
to_tree = corpus.get_doc_tree("to")

from_tree.update()
to_tree.update()

corpus.inject_alignments(from_tree, to_tree)

# Record "id" as the value of the alignment's "method" setting.
corpus.alignment.set("method", "id")