def testPrintSeedDBSingleNiche(self):
    """Print ``get_total`` for the "Society/Law" category with ``TF=0``.

    The category seed database is closed even when the query raises, so a
    failing run does not leave the database handle open.
    """
    seed_db_addr = "/Users/superCat/Desktop/PycharmProjectPortable/Seeds/CategorySeedDB.db"
    parameters = {"TF": 0}
    db = CategorySeedSiteDB(seed_db_addr)
    try:
        total = db.get_total("Society/Law", **parameters)
    finally:
        # Release the handle on both the success and the failure path.
        db.close()
    print(total)
    def testeedExport(self):
        """Export seed domains of one niche from the category DB to a seed DB.

        Every sub-category table whose name contains
        "Business/Marketing and Advertising" is read from the
        ``CategorySeedSiteDB`` using the ``CF`` filter. The ``ref_domain`` of
        each returned ``MajesticBacklinkDataStruct`` is then added to the
        target ``SeedSiteDB``.

        Both databases are closed even if the export fails part-way.
        """
        seed_db_addr = "/Users/superCat/Desktop/PycharmProjectPortable/sync/SeedSitesList"
        category_db_addr = "/Users/superCat/Desktop/PycharmProjectPortable/Seeds/CategorySeedDB.db"
        niche = "Business/Marketing and Advertising"
        seeds_needed = 20000
        percentage = 1
        parameters = {
            "CF": 20,
        }

        seed_db = SeedSiteDB("26/10/2015 Marketing CF20", db_addr=seed_db_addr)
        try:
            db = CategorySeedSiteDB(category_db_addr)
            try:
                target_ca = [
                    x for x in db.get_sub_category_tables_name() if niche in x
                ]
                for ca in target_ca:
                    # NOTE(review): the total is queried without ``parameters``
                    # while the read below is filtered - confirm this is
                    # intended.
                    count = db.get_total(ca)
                    # The absolute cap only applies when the whole table is
                    # requested (percentage == 1).
                    if percentage == 1 and count > seeds_needed:
                        count = seeds_needed
                    count = int(percentage * count)
                    if count <= 0:
                        continue
                    # Positional arguments 0 and ``count`` are presumably the
                    # start offset and the number of items - TODO confirm.
                    temp = db.get_from_table(ca,
                                             0,
                                             count,
                                             random_read=False,
                                             filter_dict=parameters)
                    # Build a fresh list per category so that no list object
                    # is shared between successive ``add_sites`` calls.
                    sites = [
                        (item.ref_domain, 0)
                        for item in temp
                        if isinstance(item, MajesticBacklinkDataStruct)
                    ]
                    seed_db.add_sites(sites, skip_check=True)
            finally:
                db.close()
        finally:
            seed_db.close()
 def testPrintSeedDB(self):
     """Print, and optionally log to CSV, ``get_total`` per sub-category.

     Each sub-category table name reported by the category seed DB is
     queried with ``TF=0``. The per-category value and the running total are
     printed and, while ``enable_log`` is true, also written to the CSV log
     file. Any existing log file is removed first.

     ``target_niche`` restricts the run to categories containing that
     substring; the empty string selects every category.

     The database is closed even if a query fails.
     """
     seed_db_addr = "/Users/superCat/Desktop/PycharmProjectPortable/Seeds/CategorySeedDB3.db"
     log_file_path = "/Users/superCat/Desktop/PycharmProjectPortable/Seeds/SeedLog3.csv"
     enable_log = True
     target_niche = ""
     parameters = {"TF": 0}

     def log_row(label, value):
         # Single place for the "log only when enabled" rule.
         if enable_log:
             CsvLogger.log_to_file_path(log_file_path, [
                 (label, str(value)),
             ])

     FileHandler.remove_file_if_exist(log_file_path)
     db = CategorySeedSiteDB(seed_db_addr)
     try:
         categories = db.get_sub_category_tables_name()
         log_row("parameters", parameters)
         total_count = 0
         for item in categories:
             # Skip categories outside the requested niche; an empty niche
             # means "no restriction".
             if target_niche and target_niche not in item:
                 continue
             count = db.get_total(item, **parameters)
             total_count += count
             print(item, "  ", count)
             log_row(item, count)
     finally:
         # The handle was previously never released.
         db.close()
     print("total:", total_count)
     log_row("total", total_count)