def test_arxiv_4(self):
    """Check the output filename for a direct PDF link.

    The URL points straight at the PDF and its identifier carries both an
    archive prefix (``physics/``) and a version suffix (``v1``).
    """
    source_url = "https://arxiv.org/pdf/physics/0605197v1.pdf"
    expected_name = "Knuth_-_Optimal_Data-Based_Binning_for_Histograms_2006.pdf"

    provider = Arxiv(upload=False, verbose=VERBOSE)
    produced_path = provider.run(source_url)

    # Only the final path component is compared; the directory the provider
    # writes into is not part of the check.
    actual_name = os.path.basename(produced_path)
    self.assertEqual(expected_name, actual_name)
def test_arxiv_1(self):
    """Check the output filename for a versioned abstract URL, using qpdf."""
    source_url = "https://arxiv.org/abs/1811.11242v1"
    expected_name = "Burg_Nazabal_Sutton_-_Wrangling_Messy_CSV_Files_by_Detecting_Row_and_Type_Patterns_2018.pdf"

    # pdftk_path=None: this run is meant to check the qpdf path
    # (presumably by leaving the provider without a pdftk binary --
    # confirm against the provider implementation).
    provider = Arxiv(upload=False, verbose=VERBOSE, pdftk_path=None)
    produced_path = provider.run(source_url)

    self.assertEqual(expected_name, os.path.basename(produced_path))
def test_arxiv_copy_toc(self):
    """Make sure the table of contents is kept after processing when
    using the arXiv provider."""
    prov = Arxiv(upload=False, verbose=VERBOSE)
    filename = prov.run("https://arxiv.org/abs/1711.03512")
    with Pdf.open(filename) as pdf, pdf.open_outline() as outline:
        # Use the TestCase assertion rather than a bare ``assert``: it is
        # not stripped when Python runs with -O, it reports the compared
        # values on failure, and it matches the ``self.assert*`` style of
        # the sibling tests.
        self.assertGreater(len(outline.root), 0)
def test_arxiv_6(self):
    """Check the output filename for a PDF URL that has a query string.

    The URL ends in a ``?source=post_page---...`` parameter; the expected
    filename is the regular author/title/year name.
    """
    source_url = "https://arxiv.org/pdf/1701.05517.pdf?source=post_page---------------------------"
    expected_name = "Salimans_et_al_-_PixelCNN_Improving_the_PixelCNN_With_Discretized_Logistic_Mixture_Likelihood_and_Other_Modifications_2017.pdf"

    produced_path = Arxiv(upload=False, verbose=VERBOSE).run(source_url)
    actual_name = os.path.basename(produced_path)

    self.assertEqual(expected_name, actual_name)
def test_arxiv_5(self):
    """Check the output filename for an abstract URL with qpdf_path=None."""
    source_url = "https://arxiv.org/abs/2002.11523"
    expected_name = "Ponomarev_Oseledets_Cichocki_-_Using_Reinforcement_Learning_in_the_Algorithmic_Trading_Problem_2020.pdf"

    # NOTE(review): qpdf_path=None presumably leaves the provider without
    # qpdf so that another PDF tool is exercised -- confirm against the
    # provider implementation.
    provider = Arxiv(upload=False, verbose=VERBOSE, qpdf_path=None)
    produced_path = provider.run(source_url)

    self.assertEqual(expected_name, os.path.basename(produced_path))
def test_arxiv_3(self):
    """Check the output filename for an archive-prefixed abstract URL.

    The identifier in the URL has the form ``math/0309285`` (archive name,
    slash, number) and carries no version suffix.
    """
    source_url = "https://arxiv.org/abs/math/0309285"
    expected_name = "Jackson_et_al_-_An_Algorithm_for_Optimal_Partitioning_of_Data_on_an_Interval_2003.pdf"

    provider = Arxiv(upload=False, verbose=VERBOSE)
    actual_name = os.path.basename(provider.run(source_url))

    self.assertEqual(expected_name, actual_name)
def test_arxiv_2(self):
    """Check the output filename for an ``http://`` URL with an ``arXiv:`` prefix.

    The URL uses the plain-HTTP scheme and the identifier is written as
    ``arXiv:1908.03213``.
    """
    source_url = "http://arxiv.org/abs/arXiv:1908.03213"
    expected_name = "Ecker_et_al_-_Gravitational_Waves_From_Holographic_Neutron_Star_Mergers_2019.pdf"

    provider = Arxiv(upload=False, verbose=VERBOSE)
    produced_path = provider.run(source_url)
    actual_name = os.path.basename(produced_path)

    self.assertEqual(expected_name, actual_name)