from sys import stderr
from os.path import splitext, join

from daeso.utils.cli import ArgumentParser
from daeso.ptc.document import HitaextDoc

# Command-line interface: one or more corpus arguments plus a verbosity flag.
parser = ArgumentParser(description=__doc__)

# The descriptive text was previously passed as `default` while `help` was
# left empty. A positional with nargs="+" always needs at least one value, so
# that default could never apply (assuming daeso's ArgumentParser follows the
# standard argparse semantics); the text belongs in `help`.
parser.add_argument(
    "corpus",
    nargs="+",
    help="parallel text corpus"
    )

parser.add_argument(
    "-V", "--verbose",
    action="store_true",
    help="verbose output"
    )

args = parser.parse_args()

# Progress messages go to stderr. Note that args.corpus is a list because of
# nargs="+", so the list representation is what gets printed.
if args.verbose:
    print >>stderr, "Reading corpus from", args.corpus
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.

"""
convert a parallel text corpus from n-based alignment to id-based alignment
"""

from sys import stderr
from os.path import splitext, join

from daeso.utils.cli import ArgumentParser
from daeso.ptc.document import HitaextDoc

# Command-line interface; the module docstring doubles as the description.
parser = ArgumentParser(description=__doc__)

# The descriptive text was previously passed as `default` while `help` was
# left empty. A positional with nargs="+" always needs at least one value, so
# that default could never apply (assuming daeso's ArgumentParser follows the
# standard argparse semantics); the text belongs in `help`.
parser.add_argument("corpus", nargs="+", help="parallel text corpus")

parser.add_argument("-V", "--verbose", action="store_true",
                    help="verbose output")

args = parser.parse_args()

# Progress messages go to stderr so they stay separate from regular output.
if args.verbose:
    print >> stderr, "Reading corpus from", args.corpus

# NOTE(review): args.corpus is a list (nargs="+") yet it is handed to
# HitaextDoc as a single `file` value -- confirm HitaextDoc accepts a list,
# or iterate over the corpus files instead.
corpus = HitaextDoc(file=args.corpus)

# Fetch the document tree registered under the "from" side of the corpus.
from_tree = corpus.get_doc_tree("from")
from glob import glob
from os.path import basename, join
from sys import stdout, stderr
from string import uppercase

from daeso.utils.cli import ArgumentParser
from daeso.ptc.document import HitaextDoc

# Command-line interface: corpus files, an optional target directory and a
# dry-run switch.
parser = ArgumentParser(description=__doc__)

# The descriptive text was previously passed as `default` while `help` was
# left empty. A positional with nargs="+" always needs at least one value, so
# that default could never apply (assuming daeso's ArgumentParser follows the
# standard argparse semantics); the text belongs in `help`.
parser.add_argument(
    "corpus",
    nargs="+",
    help="parallel text corpus"
    )

# An empty string is the default for --dir.
parser.add_argument(
    "-d", "--dir",
    default="",
    help="new directory for source and target files "
    "(defaults to none, which means stripping the existing directory)"
    )

parser.add_argument(
    "-t", "--test",
    action="store_true",
    help="perform a dry run without actually changing the files (implies -v)"
    )
""" __authors__ = 'Erwin Marsi <*****@*****.**>' from glob import glob from os.path import basename, join from sys import stdout, stderr from string import uppercase from daeso.utils.cli import ArgumentParser from daeso.ptc.document import HitaextDoc parser = ArgumentParser(description=__doc__) parser.add_argument("corpus", nargs="+", default="parallel text corpus", help="") parser.add_argument( "-d", "--dir", default="", help="new directory for source and target files " "(defaults to none, which means stripping the existing directory)") parser.add_argument( "-t", "--test", action="store_true", help="perform a dry run without actually changing the files (implies -v)")