예제 #1
0
def download(lang='en'):
    """Fetch Stanford CoreNLP and, for Spanish, its extra model data.

    When ``COMMAND_PATH`` is not an existing file, the CoreNLP archive is
    unpacked into ``DIRS.user_data_dir`` and the ``corenlp.sh`` script of the
    first ``stanford-corenlp-full*`` directory found there gets the
    owner-execute permission bit.

    Afterwards the language-specific data is handled: only ``'es'`` has an
    extra archive, ``'en'`` needs nothing, and any other value just prints a
    notice.

    :param lang: language code; compared case-insensitively.
    """
    if os.path.isfile(COMMAND_PATH):
        install_dir = os.path.dirname(COMMAND_PATH)
        print("Stanford CoreNLP is already downloaded at {}.".format(install_dir))
    else:
        print("Downloading Stanford CoreNLP...")
        unzip_from_url(DOWNLOAD_URL, DIRS.user_data_dir)

        data_root = DIRS.user_data_dir
        for entry in os.listdir(data_root):
            if not entry.startswith("stanford-corenlp-full"):
                continue
            unpacked = os.path.join(data_root, entry)
            if not os.path.isdir(unpacked):
                continue
            # Only the first matching directory is touched.
            launcher = os.path.join(unpacked, "corenlp.sh")
            os.chmod(launcher, os.stat(launcher).st_mode | stat.S_IEXEC)
            break

    # Language-specific extras.
    language = lang.lower()
    if language == 'en':
        return
    if language != 'es':
        print("There are no extra data to download for lang '{}'.".format(lang))
        return

    models_dir = os.path.join(_FOLDER_PATH, 'edu', 'stanford', 'nlp', 'models')
    if not os.path.isdir(models_dir):
        print("Downloading Stanford CoreNLP extra data for lang '{}'...".format(lang))
        unzip_from_url(DOWNLOAD_URL_ES, _FOLDER_PATH)
    else:
        print("Extra data for lang '{}' already downloaded.".format(lang))
예제 #2
0
파일: corenlp.py 프로젝트: prashiyn/iepy
def download(lang="en"):
    """Download Stanford CoreNLP and, for Spanish, its extra model data.

    When ``COMMAND_PATH`` is not an existing file, the CoreNLP archive is
    unpacked into ``DIRS.user_data_dir``.  The ``corenlp.sh`` script of the
    first ``stanford-corenlp-full*`` directory found there is then rewritten
    so that every occurrence of ``java`` becomes ``$JAVAHOME`` and is given
    the owner-execute permission bit.

    Afterwards the language-specific data is handled: only ``"es"`` has an
    extra archive (skipped when the models directory already exists),
    ``"en"`` needs nothing, and any other value just prints a notice.

    :param lang: language code; compared case-insensitively.
    """
    base = os.path.dirname(COMMAND_PATH)
    if os.path.isfile(COMMAND_PATH):
        print("Stanford CoreNLP is already downloaded at {}.".format(base))
    else:
        print("Downloading Stanford CoreNLP...")
        unzip_from_url(DOWNLOAD_URL, DIRS.user_data_dir)

        # Zip acquired. Make sure right Java is used, and file is executable
        for directory in os.listdir(DIRS.user_data_dir):
            if directory.startswith("stanford-corenlp-full"):
                stanford_directory = os.path.join(DIRS.user_data_dir, directory)
                if os.path.isdir(stanford_directory):
                    runner_path = os.path.join(stanford_directory, "corenlp.sh")
                    # Capture the mode before rewriting so it can be extended
                    # with the execute bit afterwards.
                    st = os.stat(runner_path)
                    # Read through a context manager so the handle is closed
                    # before the same path is reopened for writing.
                    with open(runner_path) as runner_file:
                        _content = runner_file.read()
                    # NOTE(review): this replaces *every* "java" substring in
                    # the script, not only the command invocation; presumably
                    # $JAVAHOME is expected to be set in the environment that
                    # runs the script -- confirm.
                    _content = _content.replace("java", "$JAVAHOME")
                    with open(runner_path, "w") as runner_file:
                        runner_file.write(_content)

                    os.chmod(runner_path, st.st_mode | stat.S_IEXEC)
                    break

    # Download extra data for specific language
    language = lang.lower()
    if language == "es":
        SPANISH_PATH = os.path.join(_FOLDER_PATH, "edu", "stanford", "nlp", "models")
        if os.path.isdir(SPANISH_PATH):
            print("Extra data for lang '{}' already downloaded.".format(lang))
        else:
            print("Downloading Stanford CoreNLP extra data for lang '{}'...".format(lang))
            unzip_from_url(DOWNLOAD_URL_ES, _FOLDER_PATH)
    elif language != "en":
        print("There are no extra data to download for lang '{}'.".format(lang))
예제 #3
0
def download(lang='en'):
    """Download Stanford CoreNLP and any extra data available for ``lang``.

    When ``COMMAND_PATH`` is not an existing file, the CoreNLP archive is
    unpacked into ``DIRS.user_data_dir``.  The ``corenlp.sh`` script of the
    first ``stanford-corenlp-full*`` directory found there is then rewritten
    so that every occurrence of ``java`` becomes ``$JAVAHOME`` and is given
    the owner-execute permission bit.

    Afterwards, if ``lang`` is ``'es'`` or ``'de'`` the matching extra archive
    is unpacked into ``_FOLDER_PATH`` (unconditionally -- no "already
    downloaded" check is made here).  ``'en'`` needs nothing, and any other
    value just prints a notice.

    :param lang: language code; compared case-insensitively.
    """
    base = os.path.dirname(COMMAND_PATH)
    if os.path.isfile(COMMAND_PATH):
        print("Stanford CoreNLP is already downloaded at {}.".format(base))
    else:
        print("Downloading Stanford CoreNLP...")
        unzip_from_url(DOWNLOAD_URL, DIRS.user_data_dir)

        # Zip acquired. Make sure right Java is used, and file is executable
        for directory in os.listdir(DIRS.user_data_dir):
            if directory.startswith("stanford-corenlp-full"):
                stanford_directory = os.path.join(DIRS.user_data_dir, directory)
                if os.path.isdir(stanford_directory):
                    runner_path = os.path.join(stanford_directory, "corenlp.sh")
                    # Capture the mode before rewriting so it can be extended
                    # with the execute bit afterwards.
                    st = os.stat(runner_path)
                    # Read through a context manager so the handle is closed
                    # before the same path is reopened for writing.
                    with open(runner_path) as runner_file:
                        _content = runner_file.read()
                    # NOTE(review): this replaces *every* "java" substring in
                    # the script, not only the command invocation; presumably
                    # $JAVAHOME is expected to be set in the environment that
                    # runs the script -- confirm.
                    _content = _content.replace('java', '$JAVAHOME')
                    with open(runner_path, 'w') as runner_file:
                        runner_file.write(_content)

                    os.chmod(runner_path, st.st_mode | stat.S_IEXEC)
                    break

    # Download extra data for specific language
    download_urls = dict(es=DOWNLOAD_URL_ES, de=DOWNLOAD_URL_DE)
    language = lang.lower()
    if language in download_urls:
        print("Downloading Stanford CoreNLP extra data for lang '{}'...".format(lang))
        unzip_from_url(download_urls[language], _FOLDER_PATH)
    elif language != 'en':
        print("There are no extra data to download for lang '{}'.".format(lang))
예제 #4
0
 def download_old_iepy_version(self):
     """Return the local path of the ``self.old_version`` iepy sources.

     The sources live under ``<DIRS.user_data_dir>/old_versions`` (created
     if missing).  When the ``iepy-<version>`` entry is not there yet, the
     corresponding tarball URL is passed to ``unzip_from_url`` first.
     """
     version = self.old_version
     tarball_url = "https://pypi.python.org/packages/source/i/iepy/iepy-{}.tar.gz".format(version)

     versions_root = os.path.join(DIRS.user_data_dir, 'old_versions')
     os.makedirs(versions_root, exist_ok=True)

     target = os.path.join(versions_root, 'iepy-{}'.format(version))
     if os.path.exists(target):
         # Already fetched earlier; nothing to download.
         return target

     print('Downloading old iepy version {} for allowing patches'.format(version))
     unzip_from_url(tarball_url, versions_root)
     print('Done')
     return target
예제 #5
0
파일: corenlp.py 프로젝트: JeffersonK/iepy
def download():
    """Fetch Stanford CoreNLP unless ``COMMAND_PATH`` already exists.

    The archive is unpacked into ``DIRS.user_data_dir``; the ``corenlp.sh``
    script of the first ``stanford-corenlp-full*`` directory found there is
    then given the owner-execute permission bit.
    """
    if os.path.isfile(COMMAND_PATH):
        install_dir = os.path.dirname(COMMAND_PATH)
        print("Stanford CoreNLP is already downloaded at {}.".format(install_dir))
        return

    print("Downloading Stanford CoreNLP...")
    unzip_from_url(DOWNLOAD_URL, DIRS.user_data_dir)

    data_root = DIRS.user_data_dir
    for entry in os.listdir(data_root):
        if not entry.startswith("stanford-corenlp-full"):
            continue
        unpacked = os.path.join(data_root, entry)
        if not os.path.isdir(unpacked):
            continue
        # Only the first matching directory is touched.
        launcher = os.path.join(unpacked, "corenlp.sh")
        os.chmod(launcher, os.stat(launcher).st_mode | stat.S_IEXEC)
        break
예제 #6
0
def download():
    """Download Stanford CoreNLP if it is not present yet.

    Presence is decided by ``COMMAND_PATH`` being an existing file.  After
    unpacking the archive into ``DIRS.user_data_dir``, the ``corenlp.sh``
    script inside the first ``stanford-corenlp-full*`` directory is marked
    executable for its owner.
    """
    already_there = os.path.isfile(COMMAND_PATH)
    if already_there:
        print("Stanford CoreNLP is already downloaded at {}.".format(
            os.path.dirname(COMMAND_PATH)))
        return

    print("Downloading Stanford CoreNLP...")
    unzip_from_url(DOWNLOAD_URL, DIRS.user_data_dir)

    root = DIRS.user_data_dir
    candidates = [
        name for name in os.listdir(root)
        if name.startswith("stanford-corenlp-full")
    ]
    for name in candidates:
        unpacked_dir = os.path.join(root, name)
        if os.path.isdir(unpacked_dir):
            script = os.path.join(unpacked_dir, "corenlp.sh")
            current_mode = os.stat(script).st_mode
            os.chmod(script, current_mode | stat.S_IEXEC)
            break