Exemplo n.º 1
0
def main():
    """Download the GloVe 6B archive and unpack it into ``args.download_dir``.

    The destination directory is taken from ``setup_args()`` and is created
    when it does not exist yet. The archive name and base URL are handed to
    ``maybe_download``; afterwards every member of the zip file is extracted
    into the same directory.
    """
    args = setup_args()
    glove_base_url = "http://nlp.stanford.edu/data/"
    glove_filename = "glove.6B.zip"

    # A parenthesised single-argument print behaves the same on Python 2
    # and Python 3, unlike the bare print statement.
    print("\nDownloading wordvecs to {}".format(args.download_dir))

    if not os.path.exists(args.download_dir):
        os.makedirs(args.download_dir)

    # Plain integer literal: the ``L`` suffix is a syntax error on Python 3.
    # NOTE(review): presumably the expected archive size in bytes -- confirm
    # against maybe_download.
    maybe_download(glove_base_url, glove_filename, args.download_dir, 862182613)

    # The context manager closes the archive even if extraction raises.
    archive_path = os.path.join(args.download_dir, glove_filename)
    with zipfile.ZipFile(archive_path, 'r') as glove_zip_ref:
        glove_zip_ref.extractall(args.download_dir)
Exemplo n.º 2
0
def main():
    """Download the GloVe 6B archive and unpack it into ``args.download_dir``.

    The destination directory comes from ``setup_args()`` and is created
    when missing. The base URL, archive name, directory and the value
    862182613 are passed to ``maybe_download``; the zip file found in the
    directory is then extracted in place.
    """
    args = setup_args()
    glove_base_url = "http://nlp.stanford.edu/data/"
    glove_filename = "glove.6B.zip"

    print("\nDownloading wordvecs to {}".format(args.download_dir))

    if not os.path.exists(args.download_dir):
        os.makedirs(args.download_dir)

    # NOTE(review): the last argument is presumably the expected archive
    # size in bytes -- confirm against maybe_download.
    maybe_download(glove_base_url, glove_filename, args.download_dir, 862182613)

    # Use a context manager so the archive handle is released even when
    # extractall() fails part-way through.
    archive_path = os.path.join(args.download_dir, glove_filename)
    with zipfile.ZipFile(archive_path, 'r') as glove_zip_ref:
        glove_zip_ref.extractall(args.download_dir)
def main():
    """Download ``glove.840B.300d.zip`` into ``args.data_dir`` and unzip it.

    The data directory is read from ``setup_args()`` and created if needed.
    The archive is requested through ``maybe_download`` and then extracted
    into the same directory.
    """
    args = setup_args()
    glove_base_url = "http://nlp.stanford.edu/data/"
    glove_filename = "glove.840B.300d.zip"

    # exist_ok=True already tolerates an existing directory, so a separate
    # os.path.exists() check is redundant (and racy).
    os.makedirs(args.data_dir, exist_ok=True)

    maybe_download(glove_base_url, glove_filename, args.data_dir)

    glove_path = os.path.join(args.data_dir, glove_filename)
    print("Unzipping {}...".format(glove_path))

    # The context manager closes the archive even if extraction raises.
    with zipfile.ZipFile(glove_path, 'r') as glove_zip_ref:
        glove_zip_ref.extractall(args.data_dir)
if __name__ == '__main__':
    # Script entry point: pick one of three GloVe archives via
    # --glove_source, download it into download/dwr and extract it there.
    parser = argparse.ArgumentParser()
    parser.add_argument(
        "--glove_source",
        choices=['wiki', 'crawl_ci', 'crawl_cs'],
        required=True)  # added for use with different glove sources
    args = parser.parse_args()

    glove_base_url = "http://nlp.stanford.edu/data/"

    # argparse restricts --glove_source to exactly these keys, so the
    # lookup below cannot miss.
    glove_archives = {
        'wiki': "glove.6B.zip",
        'crawl_ci': "glove.42B.300d.zip",
        'crawl_cs': "glove.840B.300d.zip",
    }
    glove_filename = glove_archives[args.glove_source]

    prefix = os.path.join("download", "dwr")

    print("Storing datasets in {}".format(prefix))

    if not os.path.exists(prefix):
        os.makedirs(prefix)

    # NOTE(review): 862182613 is passed for every source. If maybe_download
    # treats it as the expected archive size, it can only be right for one
    # of the three files -- confirm against maybe_download.
    maybe_download(glove_base_url, glove_filename, prefix, 862182613)

    # The context manager closes the archive even if extraction raises.
    with zipfile.ZipFile(os.path.join(prefix, glove_filename), 'r') as glove_zip_ref:
        glove_zip_ref.extractall(prefix)
import argparse
import os
import zipfile

from squad_preprocess import maybe_download


def setup_args():
    """Parse the command-line options of the download script.

    Returns:
        argparse.Namespace: the parsed options; its only attribute is
        ``download_dir``, which must be supplied on the command line.
    """
    cli = argparse.ArgumentParser()
    # Destination directory for the downloaded glove files (mandatory).
    cli.add_argument("--download_dir", required=True)
    parsed = cli.parse_args()
    return parsed


if __name__ == '__main__':
    # Script entry point: download glove.6B.zip into the directory given by
    # --download_dir (created if missing) and extract it there.
    args = setup_args()
    glove_base_url = "http://nlp.stanford.edu/data/"
    glove_filename = "glove.6B.zip"

    print("\nDownloading wordvecs to {}".format(args.download_dir))

    if not os.path.exists(args.download_dir):
        os.makedirs(args.download_dir)

    # NOTE(review): the last argument is presumably the expected archive
    # size in bytes -- confirm against maybe_download.
    maybe_download(glove_base_url, glove_filename, args.download_dir,
                   862182613)  # instead of 862182613L (python2)

    # The context manager closes the archive even if extraction raises.
    archive_path = os.path.join(args.download_dir, glove_filename)
    with zipfile.ZipFile(archive_path, 'r') as glove_zip_ref:
        glove_zip_ref.extractall(args.download_dir)