def __init__(self):
    """Set up state for the Google reverse image search.

    Reads the page limit from ``cfg.google_img_pages()``, announces the
    section on the console, obtains a web driver from ``cfg.getWebDriver()``
    and starts with empty ``links`` and ``predictions`` lists.
    """
    # The page limit is read before any console output is produced.
    # NOTE(review): presumably the number of result pages to walk - confirm.
    self.max_pages = cfg.google_img_pages()

    console.section('Google Reverse Image Search')
    console.task('Opening Webdriver')
    web_driver = cfg.getWebDriver()
    self.driver = web_driver

    # Result accumulators, filled elsewhere in the class.
    self.links, self.predictions = [], []
def __init__(self):
    """Set up state for the picture age and gender detection.

    Announces the section on the console, obtains a web driver from
    ``cfg.getWebDriver()`` and starts with empty ``ages``, ``males`` and
    ``females`` lists.
    """
    console.section('Picture Age and Gender Detection')
    console.task('Opening Webdriver')
    web_driver = cfg.getWebDriver()
    self.driver = web_driver

    # Three independent accumulators; each gets its own list object.
    self.ages, self.males, self.females = [], [], []
def collectAges(self, img_url):
    """Submit ``img_url`` to pictriev.com and record the age it reports.

    Loads the pictriev start page in ``self.driver`` (creating the driver
    through ``cfg.getWebDriver()`` when it is unset), types the URL into the
    ``urltext`` field, clicks ``submit-url``, waits ``cfg.timeout() * 3``
    seconds and then reads the text of the age gauge.

    Exactly one value is appended to ``self.ages`` per call: the parsed
    integer age, or ``0`` when the gauge element is not matched exactly once
    or its text cannot be parsed as an integer.

    Args:
        img_url: URL of the image to analyse.

    Raises:
        IndexError: if the URL field or the submit button is not on the page.
    """
    if not self.driver:
        self.driver = cfg.getWebDriver()
    console.task('New Image: {0}'.format(img_url.strip()[:90]))
    driver = self.driver
    driver.get("http://www.pictriev.com/?lang=en")

    console.subtask('Inserting Image URL')
    # Named url_field rather than `input` so the builtin is not shadowed.
    url_field = driver.find_elements_by_xpath('//*[@id="urltext"]')[0]
    url_field.clear()
    url_field.send_keys(img_url)
    submit_btn = driver.find_elements_by_xpath('//*[@id="submit-url"]')[0]
    submit_btn.click()

    console.subtask('Searching for Image...')
    # Fixed wait for the page to finish its analysis before reading the gauge.
    time.sleep(cfg.timeout() * 3)

    age_selector = ('#age-gauge > svg:nth-child(1) > text:nth-child(6) > '
                    'tspan:nth-child(1)')
    try:
        matches = driver.find_elements_by_css_selector(age_selector)
    except Exception:
        # One retry of the same lookup. `Exception` instead of a bare
        # `except` so KeyboardInterrupt / SystemExit still propagate.
        matches = driver.find_elements_by_css_selector(age_selector)

    age = 0
    if len(matches) == 1:
        try:
            age = int(matches[0].text)
        except (TypeError, ValueError):
            # Gauge text was empty or not numeric; treat as "no age found".
            age = 0
    self.ages.append(age)
def grabLinks(self):
    """Collect profile image URLs from every profile page in ``self._pl``.

    Opens a web driver via ``cfg.getWebDriver()``, visits each URL in
    ``self._pl`` and reads the ``src`` attribute of every ``<img>`` matched
    by either of two absolute XPaths. The driver window is closed even when
    a page load or lookup raises.

    Returns:
        list: the distinct image ``src`` values found, in arbitrary order.
        Elements without a ``src`` attribute are skipped.
    """
    # Two alternative locations of the profile image; both are tried on
    # every page.
    profile_img_xpaths = (
        # first possibility
        "/html/body/div[1]/div[4]/div[1]/div/div[2]/div[2]/div[2]/div/div[1]/div[1]/div[3]/div/div[2]/div[3]/div/div/div/img",
        # second possibility
        "/html/body/div[1]/div[1]/div[3]/div[1]/div/div/div[1]/div/div/div[1]/div/div/div/a/div/img",
    )

    img_urls = set()
    console.task('Opening Webdriver')
    driver = cfg.getWebDriver()
    try:
        for profile_url in self._pl:
            driver.get(profile_url)
            for xpath in profile_img_xpaths:
                for img in driver.find_elements_by_xpath(xpath):
                    img_src = img.get_attribute("src")
                    # get_attribute yields None when the attribute is
                    # absent; keep only real URLs in the result.
                    if img_src:
                        img_urls.add(img_src)
    finally:
        # Always release the browser window, even on failure.
        driver.close()
    return list(img_urls)
def grabData(self):
    """Scrape profile links and profile image URLs starting at ``self.url``.

    Opens a web driver via ``cfg.getWebDriver()``, loads ``self.url``, waits
    10 seconds so the user can accept the consent dialog in the browser, and
    collects every ``<a class="_2ial">`` on the page. It then follows each
    distinct link on that page whose ``href`` contains ``"&page"`` and
    collects from those pages as well, sleeping one second after each.

    Results are stored on the instance:
        self.profile_list: ``href`` of each matched anchor.
        self.profile_img:  ``src`` of the ``<img>`` nested in that anchor.
    The two lists are appended to together, so they stay index-aligned.

    The driver window is closed even when a page load or lookup raises.
    """
    profile_xpath = "//a[@class='_2ial']"

    def collect(anchors):
        """Append href and nested <img> src of every anchor to the results."""
        for anchor in anchors:
            href = anchor.get_attribute("href")
            img_src = anchor.find_element_by_tag_name("img").get_attribute("src")
            self.profile_list.append(href)
            self.profile_img.append(img_src)

    console.task('Opening Webdriver')
    driver = cfg.getWebDriver()
    try:
        driver.get(self.url)
        self.profile_list = []
        self.profile_img = []
        console.task("Please agree to facebook's stuff in the browser")
        time.sleep(10)

        # get all profile image links
        profile_img_links = driver.find_elements_by_xpath(profile_xpath)
        console.subtask('Collecting Image URLs...(Page 1)')
        if not profile_img_links:
            console.subfailure('No FB Links found')
        else:
            collect(profile_img_links)

        # Gather pagination links in document order, without duplicates.
        pages_links = []
        seen_links = set()
        for anchor in driver.find_elements_by_xpath("//a"):
            link = anchor.get_attribute('href')
            # Anchors without an href yield None, which must not reach the
            # substring test below.
            if not link or "&page" not in link or link in seen_links:
                continue
            seen_links.add(link)
            pages_links.append(link)

        for page in pages_links:
            driver.get(page)
            profile_img_links = driver.find_elements_by_xpath(profile_xpath)
            # Only the final character of the URL is used as the label.
            page_num = page[-1:]
            console.subtask(
                'Collecting Images URLs...(Page {0})'.format(page_num))
            collect(profile_img_links)
            time.sleep(1)
    finally:
        # Always release the browser window, even on failure.
        driver.close()
def grabData(self):
    """Scrape profile links and profile image URLs starting at ``self.url``.

    Opens a web driver via ``cfg.getWebDriver()``, loads ``self.url`` and
    collects every ``<a class="_2ial _8o _8s lfloat _ohe">`` on the page. It
    then follows each distinct link on that page whose ``href`` contains
    ``"&page"`` and collects from those pages as well, sleeping one second
    after each.

    Results are stored on the instance:
        self.profile_list: ``href`` of each matched anchor.
        self.profile_img:  ``src`` of the ``<img>`` nested in that anchor.
    The two lists are appended to together, so they stay index-aligned.

    The driver window is closed even when a page load or lookup raises.
    """
    profile_xpath = "//a[@class='_2ial _8o _8s lfloat _ohe']"

    def collect(anchors):
        """Append href and nested <img> src of every anchor to the results."""
        for anchor in anchors:
            href = anchor.get_attribute("href")
            img_src = anchor.find_element_by_tag_name("img").get_attribute("src")
            self.profile_list.append(href)
            self.profile_img.append(img_src)

    console.task('Opening Webdriver')
    driver = cfg.getWebDriver()
    try:
        driver.get(self.url)
        self.profile_list = []
        self.profile_img = []

        # get all profile image links
        profile_img_links = driver.find_elements_by_xpath(profile_xpath)
        console.subtask('Collecting Image URLs...(Page 1)')
        collect(profile_img_links)

        # Gather pagination links in document order, without duplicates.
        pages_links = []
        seen_links = set()
        for anchor in driver.find_elements_by_xpath("//a"):
            link = anchor.get_attribute('href')
            # Anchors without an href yield None, which must not reach the
            # substring test below.
            if not link or "&page" not in link or link in seen_links:
                continue
            seen_links.add(link)
            pages_links.append(link)

        for page in pages_links:
            driver.get(page)
            profile_img_links = driver.find_elements_by_xpath(profile_xpath)
            # Only the final character of the URL is used as the label.
            page_num = page[-1:]
            console.subtask(
                'Collecting Images URLs...(Page {0})'.format(page_num))
            collect(profile_img_links)
            time.sleep(1)
    finally:
        # Always release the browser window, even on failure.
        driver.close()
def __init__(self):
    """Set up state for the ImageRaider reverse image search.

    Announces the section on the console, obtains a web driver from
    ``cfg.getWebDriver()`` and clears the ``csv_error`` flag.
    """
    console.section('ImageRaider Reverse Image Search')
    console.task('Opening Webdriver')
    web_driver = cfg.getWebDriver()
    self.driver = web_driver

    # NOTE(review): presumably set to True when CSV handling fails - confirm
    # against the code that writes it.
    self.csv_error = False
def __init__(self):
    """Set up state for the Yandex reverse image search.

    Announces the section on the console, obtains a web driver from
    ``cfg.getWebDriver()`` and starts with an empty ``links`` list.
    """
    console.section('Yandex Reverse Image Search')
    console.task('Opening Webdriver')
    web_driver = cfg.getWebDriver()
    self.driver = web_driver

    # Result accumulator, filled elsewhere in the class.
    self.links = list()