def get_from_query_gds_in_pmc_fulltext_dict(id_type, pmc_query, geo_year=None):
    """Run the PMC full-text lookup over the GEO ids of one type and year.

    The ids are fetched with ``geo.get_ids_by_year(id_type, geo_year)``,
    sorted in place, and handed together with ``pmc_query`` to
    ``get_dict_submit_reuse_of_accession_in_pmc_fulltext``.

    Args:
        id_type: Accession type, forwarded to both helpers.
        pmc_query: Query forwarded unchanged to the lookup helper.
        geo_year: Year forwarded to ``geo.get_ids_by_year``. Defaults to
            None; how None is interpreted is up to that helper.

    Returns:
        The lookup helper's result, unchanged (presumably a dict, going by
        the helper's name -- TODO confirm).
    """
    accession_ids = geo.get_ids_by_year(id_type, geo_year)
    # In-place sort on purpose: the list object returned by ``geo`` itself is
    # reordered, exactly as before.
    accession_ids.sort()
    return get_dict_submit_reuse_of_accession_in_pmc_fulltext(
        id_type, accession_ids, pmc_query)
def get_from_query_gds_in_pmc_fulltext_dict(id_type, pmc_query, geo_year=None):
    """Run the PMC full-text lookup over the GEO ids of one type and year.

    The ids are fetched with ``geo.get_ids_by_year(id_type, geo_year)``,
    sorted in place, and handed together with ``pmc_query`` to
    ``get_dict_submit_reuse_of_accession_in_pmc_fulltext``.

    Args:
        id_type: Accession type, forwarded to both helpers.
        pmc_query: Query forwarded unchanged to the lookup helper.
        geo_year: Year forwarded to ``geo.get_ids_by_year``. Defaults to
            None; how None is interpreted is up to that helper.

    Returns:
        The lookup helper's result, unchanged (presumably a dict, going by
        the helper's name -- TODO confirm).
    """
    accession_ids = geo.get_ids_by_year(id_type, geo_year)
    # In-place sort on purpose: the list object returned by ``geo`` itself is
    # reordered, exactly as before.
    accession_ids.sort()
    return get_dict_submit_reuse_of_accession_in_pmc_fulltext(
        id_type, accession_ids, pmc_query)
fh.close() updated_base_query_all = """("1901"[PubDate] : "2011/12/31"[PubDate])""" updated_base_query_reuse = """("1901"[PubDate] : "2011/12/31"[PubDate]) NOT "pmc gds"[filter]""" updated_base_query_create = """("1901"[PubDate] : "2011/12/31"[PubDate]) AND "pmc gds"[filter]""" if True: fh = open("scienceplot_new/results/pubmed_gse_count.csv", "w") num_id_fields = ["year", "num_gse_ids"] writer = csv.DictWriter(fh, num_id_fields) writer.writerow(dict((fn, fn) for fn in writer.fieldnames)) total_count = 0 for id_type in ["GSE"]: id_count = 0 for year in geo_years: ids = geo.get_ids_by_year(id_type, year) row_dict = dict(year=year, num_gse_ids=len(ids)) print row_dict.values() writer.writerow(row_dict) id_count += len(ids) print id_type, id_count total_count += id_count print total_count fh.close() year = "2009" #submission_years = [str(year) for year in range(2007,2008)] submission_years = [year] all_dict = run_stats(submission_years, id_types, updated_base_query_all) if True:
fh.close() updated_base_query_all = """("1901"[PubDate] : "2011/12/31"[PubDate])""" updated_base_query_reuse = """("1901"[PubDate] : "2011/12/31"[PubDate]) NOT "pmc gds"[filter]""" updated_base_query_create = """("1901"[PubDate] : "2011/12/31"[PubDate]) AND "pmc gds"[filter]""" if True: fh = open("scienceplot_new/results/pubmed_gse_count.csv", "w") num_id_fields = ["year", "num_gse_ids"] writer = csv.DictWriter(fh, num_id_fields) writer.writerow(dict((fn,fn) for fn in writer.fieldnames)) total_count = 0 for id_type in ["GSE"]: id_count = 0 for year in geo_years: ids = geo.get_ids_by_year(id_type, year) row_dict = dict(year=year, num_gse_ids=len(ids)) print row_dict.values() writer.writerow(row_dict) id_count += len(ids) print id_type, id_count total_count += id_count print total_count fh.close() year = "2009" #submission_years = [str(year) for year in range(2007,2008)] submission_years = [year] all_dict = run_stats(submission_years, id_types, updated_base_query_all)