Exemplo n.º 1
0
                continue
            pm.go_or_create_and_go_to(expanded_query)
            filenames = os.listdir()
            # Process every entry of `filenames`: load the stored page object,
            # and if it has neither text nor sentences yet, fetch its HTML,
            # derive text and sentences, and save it back under the same
            # filename. Failures are reported and the loop moves on.
            for i, filename in enumerate(filenames):
                # Skip the macOS Finder metadata file; it is not a saved page.
                if filename == '.DS_Store':
                    continue
                try:
                    page = pfl.load_file(filename)
                except EOFError:
                    # load_file() raised before `page` was bound for this
                    # file, so `page` is either undefined (first iteration)
                    # or still the previous file's object. Report the
                    # filename and leave that stale object untouched.
                    # Message: "failed to load <filename>!"
                    print('%sのロードに失敗!' % filename)
                    continue
                if hasattr(page, 'text'):
                    # Message: "<title> has already been fetched"
                    print('%sはすでにフェッチしています' % page.title)
                    continue
                try:
                    # Sentences already present: nothing left to do.
                    if page.sentences:
                        continue
                    page.fetch_html()
                    page.set_text_from_html_body()
                    page.set_sentences_from_text()
                    pfs.save_file(obj=page, filename=filename)
                    # Message: "page number <i>, <title> saved!"
                    print('%i番目のページ、%sの保存完了!' % (i, page.title))
                except Exception:
                    # Best effort per page: any ordinary error skips this
                    # page. `Exception` (not a bare except) lets
                    # KeyboardInterrupt/SystemExit stop the run.
                    # Message: "failed to process <title>!"
                    print('%sの処理に失敗!' % page.title)
                    continue
            pm.go_up()
        pm.go_up()
    pm.go_up()
                continue
            pm.go_or_create_and_go_to(expanded_query)
            filenames = os.listdir()
            # Process every entry of `filenames`: load the stored page object,
            # and if it has neither text nor sentences yet, fetch its HTML,
            # derive text and sentences, and save it back under the same
            # filename. Failures are reported and the loop moves on.
            for i, filename in enumerate(filenames):
                # Skip the macOS Finder metadata file; it is not a saved page.
                if filename == ".DS_Store":
                    continue
                try:
                    page = pfl.load_file(filename)
                except EOFError:
                    # load_file() raised before `page` was bound for this
                    # file, so `page` is either undefined (first iteration)
                    # or still the previous file's object. Report the
                    # filename and leave that stale object untouched.
                    # Message: "failed to load <filename>!"
                    print("%sのロードに失敗!" % filename)
                    continue
                if hasattr(page, "text"):
                    # Message: "<title> has already been fetched"
                    print("%sはすでにフェッチしています" % page.title)
                    continue
                try:
                    # Sentences already present: nothing left to do.
                    if page.sentences:
                        continue
                    page.fetch_html()
                    page.set_text_from_html_body()
                    page.set_sentences_from_text()
                    pfs.save_file(obj=page, filename=filename)
                    # Message: "page number <i>, <title> saved!"
                    print("%i番目のページ、%sの保存完了!" % (i, page.title))
                except Exception:
                    # Best effort per page: any ordinary error skips this
                    # page. `Exception` (not a bare except) lets
                    # KeyboardInterrupt/SystemExit stop the run.
                    # Message: "failed to process <title>!"
                    print("%sの処理に失敗!" % page.title)
                    continue
            pm.go_up()
        pm.go_up()
    pm.go_up()