def download_data(self):
        """Fetch the TripAdvisor data into ``raw_folder``.

        The archive file name is whatever follows the last ``'/'`` in
        ``self.resources``; the transfer itself is delegated to
        ``download_and_extract_archive`` with ``raw_folder`` as the
        download root.

        NOTE(review): this method performs no existence check of its own,
        so whether an already-present download is skipped depends entirely
        on ``download_and_extract_archive`` -- confirm.
        """
        # Derive the local archive name from the tail of the resource path.
        _, _, archive_name = self.resources.rpartition('/')

        download_and_extract_archive(
            self.resources,
            download_root=self.raw_folder,
            filename=archive_name,
        )

        # Progress marker on stdout once the helper has returned.
        print('Done!')
Ejemplo n.º 2
0
    def download_data(self):
        """Fetch the YelpReview data into ``raw_folder``.

        ``self.resources`` is handed to ``download_and_extract_archive``
        together with ``raw_folder`` as the download root; the archive is
        always saved under the fixed name ``yelp_review.zip``.

        NOTE(review): this method performs no existence check of its own,
        so whether an already-present download is skipped depends entirely
        on ``download_and_extract_archive`` -- confirm.
        """
        # The local file name is fixed rather than derived from the resource.
        download_and_extract_archive(
            self.resources,
            download_root=self.raw_folder,
            filename='yelp_review.zip',
        )

        # Progress marker on stdout once the helper has returned.
        print('Done!')
Ejemplo n.º 3
0
    def download_data(self):
        """Fetch the IMDB data into ``raw_folder`` unless it is already there.

        Returns immediately when ``self._check_exists()`` is truthy.
        Otherwise ``raw_folder`` and ``processed_folder`` are created (if
        missing) and ``self.resources`` is passed to
        ``download_and_extract_archive``, using the part of the resource
        path after its last ``'/'`` as the archive file name.
        """
        already_present = self._check_exists()
        if already_present:
            return

        # Make sure both output directories exist before downloading;
        # exist_ok=True keeps this a no-op for directories already present.
        for folder in (self.raw_folder, self.processed_folder):
            os.makedirs(folder, exist_ok=True)

        # Derive the local archive name from the tail of the resource path.
        _, _, archive_name = self.resources.rpartition('/')
        download_and_extract_archive(
            self.resources,
            download_root=self.raw_folder,
            filename=archive_name,
        )

        # Progress marker on stdout once the helper has returned.
        print('Done!')
    def download_data(self):
        """Fetch the CitySearch data into ``raw_folder`` and prune extras.

        ``self.resources`` is passed to ``download_and_extract_archive``,
        using the part of the resource path after its last ``'/'`` as the
        archive file name. Afterwards every ``*.pos`` and ``*.cnk`` file
        directly inside ``<raw_folder>/citysearch_data`` is deleted.

        NOTE(review): this method performs no existence check of its own,
        so whether an already-present download is skipped depends entirely
        on ``download_and_extract_archive`` -- confirm.
        """
        # Derive the local archive name from the tail of the resource path.
        _, _, archive_name = self.resources.rpartition('/')
        download_and_extract_archive(
            self.resources,
            download_root=self.raw_folder,
            filename=archive_name,
        )

        # Collect every *.pos and *.cnk file up front (pos matches first,
        # then cnk), and only then start deleting.
        data_dir = os.path.join(self.raw_folder, 'citysearch_data')
        unwanted = [
            path
            for pattern in ('*.pos', '*.cnk')
            for path in glob.glob(os.path.join(data_dir, pattern))
        ]
        for path in unwanted:
            os.remove(path)

        # Progress marker on stdout once cleanup has finished.
        print('Done!')