示例#1
0
def retrieve_papers_to_tsv(ptitle):
    """
    Fetch the papers of one publication and append them to a TSV file.

    The output path is ``tsv/<ptitle>.tsv`` with every ``/`` in the title
    replaced by a space.  If that file already exists the function returns
    immediately and nothing is fetched.  Otherwise the request URLs for the
    publication are obtained, each URL is read in turn, and one row per
    paper (``Paper.to_list()``) is written.  No header row is written.

    Errors are handled on a best-effort basis: a failure while reading one
    URL is printed and the remaining URLs are still processed; a failure
    while obtaining the URL list is printed and ends the run.  In both cases
    the (possibly empty or partial) output file is left on disk.

    NOTE(review): the columns presumably follow the order number, doi,
    spage, epage, issue, partnum, publication, year, rank, title, abstract,
    authors, terms -- confirm against ``Paper.to_list()``.

    :param ptitle: publication title; used to build the request URLs, to
        construct each ``Paper`` and to name the output file.
    :return: None
    """
    filename = 'tsv/' + ptitle.replace('/', ' ') + '.tsv'
    if os.path.isfile(filename):
        return
    # Make sure the output directory exists so open() cannot fail on it.
    os.makedirs(os.path.dirname(filename), exist_ok=True)
    # Explicit UTF-8: titles/abstracts may contain non-ASCII characters that
    # a platform default encoding could reject.
    with open(filename, 'a', newline='', encoding='utf-8') as fp:
        tsv_writer = csv.writer(fp, delimiter='\t')
        try:
            print('get publication urls', ptitle)
            urls = journal_articles_requests_urls(ptitle,
                                                  articles_per_request=1000)
            for url in urls:
                try:
                    print('reading --', url)
                    paper_dicts = retrieve_documents_from_url(url)
                    # Build every row before writing so that a bad record
                    # drops the whole batch instead of writing half of it.
                    rows = [Paper(ptitle, paper_dict).to_list()
                            for paper_dict in paper_dicts]
                    tsv_writer.writerows(rows)
                except Exception as e:
                    # Best effort: report and continue with the next URL.
                    print(str(e))
        except Exception as e:
            print(str(e))
示例#2
0
    def get_total_number_of_articles(self):
        """
        Return the article total reported for this object's title.

        Builds the request URLs for ``self.title``, takes the first one and
        passes it to ``journal_article_total_number_from_url``.

        :return: whatever ``journal_article_total_number_from_url`` returns
            for the first request URL (presumably an integer count --
            TODO confirm).
        """
        request_urls = journal_articles_requests_urls(self.title)
        first_url = request_urls[0]
        total = journal_article_total_number_from_url(first_url)
        return total