Python Entity.siteの例

プログラミング言語: Python

名前空間/パッケージ名: Schemas

クラス/型: Entity

メソッド/関数: site

hotexamples.comのコード掲載数: 2

Python Entity.site - 2件のコード例が見つかりました。すべてオープンソースプロジェクトから抽出されたPythonのSchemas.Entity.siteの実例で、最も評価が高いものを厳選しています。コード例の評価を行っていただくことで、より質の高いコード例が表示されるようになります。

よく使われるメソッド

表示非表示

subcategory(24)

title(21)

address(16)

desc(4)

author(3)

image(3)

site(2)

phone(2)

factual(2)

mpaa_rating(2)

publisher(2)

yrating(1)

original_release_date(1)

publish_date(1)

seattletimes(1)

small(1)

sku_number(1)

vicinity(1)

nytimes(1)

subtitle(1)

tiny(1)

yreviews(1)

titlel(1)

track_length(1)

openTable(1)

nrating(1)

nymag(1)

hoursOfOperation(1)

awardAnnals(1)

bid(1)

cast(1)

cuisine(1)

earliest_air_date(1)

entity_id(1)

googleLocal(1)

hd(1)

imdb_id(1)

nurl(1)

isbn(1)

large(1)

lat(1)

latest_air_date(1)

lng(1)

ngenres(1)

nid(1)

num_seasons(1)

yurl(1)

コード例 #1

ファイルを表示

ファイル: ZagatCrawler.py プロジェクト: Stamped/Stamped

 def _parseRestaurantPage(self, pool, region_name, city_name, restaurant_name, href):
     """Parse a single restaurant page and queue the resulting entity.

     Downloads ``href`` through ``utils.getSoup``, builds an ``Entity`` with
     subcategory "restaurant" from the page's address block, and fills in
     the cuisine, website and preview image when the page provides them.
     The finished entity is put on ``self._output``.

     Args:
         pool: Not used by this method.
         region_name: Region label; only used in the log message.
         city_name: City label; only used in the log message.
         restaurant_name: Stored as the entity title.
         href: Location handed to ``utils.getSoup``; it is also appended to
             ``self.base`` to form the stored ``zurl``.

     Returns:
         None. Nothing is queued when the download fails or when the
         address block is incomplete.
     """
     utils.log("[%s] parsing restaurant '%s.%s.%s' (%s)" % (self, region_name, city_name, restaurant_name, href))

     try:
         soup = utils.getSoup(href)
     except Exception:
         # Catch Exception rather than using a bare except so that
         # KeyboardInterrupt / SystemExit still propagate.
         utils.printException()
         utils.log("[%s] error downloading page %s" % (self, href))
         return

     # parse the address for the current restaurant
     addr = soup.find('div', {'class' : 'address'})
     street = None
     geo = None
     if addr is not None:
         street = addr.find('span', {'class' : 'street'})
         geo = addr.find('span', {'class' : 'geo'})

     if street is None or geo is None:
         # find() returns None for a missing element; dereferencing it
         # would raise AttributeError, so skip pages without a full address.
         utils.log("[%s] error parsing address on page %s" % (self, href))
         return

     address = "%s, %s" % (street.getText().strip(), geo.getText().strip())

     # add the current restaurant to the output for this crawler
     entity = Entity()
     entity.subcategory = "restaurant"
     entity.title   = restaurant_name
     entity.address = address
     entity.sources.zagat = {
         'zurl' : self.base + href,
     }

     # parse cuisine (optional): div -> ul -> li.first, any level may be absent
     header = soup.find('div', {'id' : "block-zagat_restaurants-14"})
     if header is not None:
         header = header.find('ul')
     if header is not None:
         header = header.find('li', {'class' : 'first'})
     if header is not None:
         entity.cuisine = header.getText()

     # parse website (optional): span.website -> a
     site = soup.find('span', {'class' : 'website'})
     if site is not None:
         site = site.find('a')
     if site is not None:
         entity.site = site.get('href')

     # parse preview image (optional): div#content -> div.photo -> img
     img = soup.find('div', {'id' : 'content'})
     if img is not None:
         img = img.find('div', {'class' : 'photo'})
     if img is not None:
         img = img.find('img')
     if img is not None:
         entity.image = img.get('src')

     self._output.put(entity)

コード例 #2

ファイルを表示

ファイル: SeattleTimesCrawler.py プロジェクト: Stamped/Stamped

 def _parseRestaurantPage(self, pool, queue, url, name, base=False):
     """Parse a single restaurant page and queue the resulting entity.

     Downloads ``url`` through ``utils.getSoup`` and reads the title,
     description, address, website and opening hours from the
     ``div#content`` / ``div#edbtext`` section of the page. Entities whose
     (title, address) pair is already in ``self.seen``, or whose title
     contains "(closed)", are dropped; all others are recorded in
     ``self.seen`` and put on ``self._output``.

     Args:
         pool: Not used by this method.
         queue: Not used by this method.
         url: Location handed to ``utils.getSoup``.
         name: Restaurant label; only used in log messages.
         base: Not used by this method.

     Returns:
         None. Nothing is queued when the download fails, when the expected
         page sections are missing, or when the entity is filtered out.
     """
     utils.log('[%s] parsing restaurant page %s (%s)' % (self, name, url))

     try:
         soup = utils.getSoup(url)
     except Exception:
         # Catch Exception rather than using a bare except so that
         # KeyboardInterrupt / SystemExit still propagate.
         utils.log("[%s] error downloading page %s (%s)" % (self, name, url))
         return

     content = soup.find('div', { 'id' : 'content'})

     if content is None:
         return

     heading = content.find('h1')
     details = content.find('div', {'id' : 'edbtext'})

     if heading is None or details is None:
         # find() returns None for a missing element; dereferencing it
         # would raise AttributeError, so skip pages lacking these sections.
         utils.log("[%s] error parsing page %s (%s)" % (self, name, url))
         return

     entity = Entity()
     entity.title = heading.getText()
     entity.subcategory = "restaurant"
     entity.seattletimes = {}

     # The description is optional: only set it when a paragraph exists.
     desc = details.find('p')
     if desc is not None:
         entity.desc = desc.getText()

     details = details.findAll('p', {'class' : 'list'})
     if not details:
         # The address is read from the first "list" paragraph; without it
         # details[0] would raise IndexError.
         utils.log("[%s] error parsing address on page %s (%s)" % (self, name, url))
         return

     # Drop line-break markup and collapse runs of whitespace.
     address = details[0].renderContents().strip().replace('<br />', '')
     address = re.sub('[ \n\t]+', ' ', address)
     entity.address = address

     if len(details) > 1:
         # NOTE(review): details[1] is a <p> element and href is normally an
         # attribute of <a>; confirm whether the link lives in a nested
         # anchor. The lookup is kept exactly as before.
         site = details[1].get('href')
         if site is not None:
             entity.site = site

     if len(details) > 2:
         entity.hoursOfOperation = details[2].getText()

     key = (entity.title, entity.address)
     if key in self.seen or '(closed)' in entity.title.lower():
         return

     self.seen.add(key)
     self._output.put(entity)