def test_fetch_minutes(self):
    """Run ``extract_fetch`` for the 2011-01-12 record against a local PDF file.

    The file ``neh.pdf`` (prefixed with ``base_resources``) is opened in
    binary-write mode and handed to ``extract_fetch`` together with the
    record URL and the date. Nothing is asserted: the test passes as long
    as no call raises.
    """
    source_url = 'http://efiles.portlandoregon.gov/webdrawer.dll/webdrawer/rec/4187324/view/'
    meeting_date = datetime.datetime(2011, 1, 12)

    # The result is not used below; the call is kept so extract_path is
    # still exercised for this date.
    _unused_path = extract_path(meeting_date)

    pdf_name = '{}neh.pdf'.format(base_resources)
    with open(pdf_name, 'wb') as pdf_file:
        extract_fetch(pdf_file, source_url, meeting_date)
def output(self):
    """Return the ``luigi.LocalTarget`` for ``minutes.pdf``.

    The file is located under the path that ``extract_path`` returns for
    ``self.date``.
    """
    base_path = extract_path(self.date)
    pdf_path = "{}/minutes.pdf".format(base_path)
    return luigi.LocalTarget(pdf_path)
def test_extract_path(self):
    """Check that ``extract_path`` for 2011-01-12 equals the current working directory."""
    meeting_date = datetime.datetime(2011, 1, 12)
    actual = extract_path(meeting_date)

    expected = '{}'.format(os.getcwd())
    self.assertEqual(expected, actual)
def output(self):
    """Return the ``LocalTarget`` for ``statements.pkl``.

    The file is located under the path that ``extract_path`` returns for
    ``self.date``.
    """
    base_path = extract_path(self.date)
    pickle_path = "{}/statements.pkl".format(base_path)
    return LocalTarget(pickle_path)
def output(self):
    """Return the ``LocalTarget`` for ``body.txt``.

    The file is located under the path that ``extract_path`` returns for
    ``self.date``.
    """
    base_path = extract_path(self.date)
    body_path = "{}/body.txt".format(base_path)
    return LocalTarget(body_path)
def output(self):
    """Return the ``LocalTarget`` for ``raw.text``.

    The file is located under the path that ``extract_path`` returns for
    ``self.date``.
    """
    base_path = extract_path(self.date)
    raw_path = '{}/raw.text'.format(base_path)
    return LocalTarget(raw_path)
def output(self):
    """Return the ``LocalTarget`` for ``token_links.pkl``.

    The file is located under the path that ``extract_path`` returns for
    ``self.date``.
    """
    base_path = extract_path(self.date)
    links_path = '{}/token_links.pkl'.format(base_path)
    return LocalTarget(links_path)
def output(self):
    """Return the ``LocalTarget`` for ``cleaned.txt``.

    The file is located under the path that ``extract_path`` returns for
    ``self.date``.
    """
    base_path = extract_path(self.date)
    cleaned_path = '{}/cleaned.txt'.format(base_path)
    return LocalTarget(cleaned_path)