Python BeautifulSoup.rstrip Beispiele

Programmiersprache: Python

Namespace / Paketname: BeautifulSoup

Klasse / Typ: BeautifulSoup

Methode / Funktion: rstrip

Beispiele auf hotexamples.com: 2

Python BeautifulSoup.rstrip - 2 Beispiele gefunden. Dies sind die am besten bewerteten Python-Beispiele für BeautifulSoup.BeautifulSoup.rstrip, die aus Open-Source-Projekten extrahiert wurden. Sie können Beispiele bewerten, um die Qualität der Beispiele zu verbessern.

Häufig verwendete Methoden

Anzeigen Verbergen

BeautifulSoup(30)

decompose(30)

first(30)

find_all(30)

findAll(30)

find(30)

fetch(30)

feed(30)

getText(29)

insert(20)

findChildren(19)

body(12)

close(11)

__str__(11)

encode(8)

new_tag(6)

findChild(5)

append(4)

prettify(4)

findSelect(4)

decode(4)

get(4)

__unicode__(3)

goahead(3)

lower(3)

div(3)

findall(3)

pretify(3)

__init__(3)

firstText(2)

pop(2)

data(2)

findNext(2)

read(2)

index(1)

html(1)

query(1)

json(1)

load(1)

re_left(1)

noscript(1)

orig_url(1)

partition(1)

popTag(1)

pretiffy(1)

head(1)

findNextSiblings(1)

group(1)

encodeContents(1)

attrs(1)

Beispiel #1

Datei anzeigen

Datei: crhoy_4spider.py Projekt: Dephe/corpus_inil

 def parse(self, response):
     """Extract title, date and section from an article page.

     Three absolute XPath queries are run against ``response.selector``;
     the first hit of each is reduced to plain text with BeautifulSoup
     (``lxml`` parser).  The section name is then collapsed into one of a
     few broad macro-sections.

     NOTE(review): every ``[0]`` below presumably raises ``IndexError``
     when the corresponding XPath or regex finds nothing -- confirm that
     this is acceptable for pages with a different layout.
     """
     titulo = response.selector.xpath('/html/body/div[1]/div[2]/section/div[4]/article/div[1]/h1').extract()
     fecha = response.selector.xpath('/html/body/div[1]/div[2]/section/div[4]/article/div[1]/div').extract()
     seccion = response.selector.xpath('/html/body/div[1]/div[2]/section/div[4]/article/div[1]/h3[1]/a[2]').extract()
     # Output path with a random numeric suffix; it is not used in the
     # portion of the method visible here.
     pagename = '/home/federico/Desktop/corpus_inil/crawler/crawler/crawlinil/datos_crhoy/' + str(random.randint(1,1000))
     titulo = BeautifulSoup(titulo[0], 'lxml').text
     titulo = titulo.rstrip('\n')
     fecha = BeautifulSoup(fecha[0], 'lxml').text
     # Raw string: same pattern as before, but without relying on Python
     # passing unknown escapes such as "\w" through unchanged.
     fecha = re.findall(r'\w*\s\w*,\s\w*', fecha)[0]
     seccion = BeautifulSoup(seccion[0], 'lxml').text
     # Macro-sections: map fine-grained section names onto broad categories.
     # No target name appears in a later list, so ``elif`` is equivalent to
     # the original chain of independent ``if`` statements.
     if seccion in ['Fútbol', 'Atletismo', 'Baloncesto', 'Tennis', 'Motores', 'Natación', 'Ciclismo', 'Surf', 'Voleibol', 'Otros', 'Destino Rusia']:
         seccion = 'Deportes'
     elif seccion in ['Clima', 'Educación', 'Gobierno', 'Política', 'Salud', 'Transportes', 'Servicios']:
         seccion = 'Nacionales'
     elif seccion in ['Sucesos']:
         seccion = 'Sucesos'
     elif seccion in ['Columnas', 'Especialistas', 'Lector opina', 'Aclaraciones']:
         seccion = 'Opinión'

Beispiel #2

Datei anzeigen

Datei: downloads.py Projekt: PiTiLeZarD/BetaSeries-Scripts

def downloadEpisode(episode):
    """Search for a torrent of *episode* and save the .torrent file locally.

    The search text is "<series name> <episode number>".  The second ``<td>``
    cell of the result page is taken as the hit and the ``href`` of its
    second ``<a>`` element as the torrent link.  When a non-blank link is
    found, a ``model.Download`` row is added to the session and the linked
    file is written into the folder given by the ``download.torrent.folder``
    option.

    Nothing happens when the result page has fewer than two ``<td>`` cells.

    NOTE(review): ``findAll('a')[1]`` and ``re.search(...).group(1)`` will
    raise (IndexError / AttributeError) if the cell has fewer than two
    anchors or the anchor has no ``href`` -- confirm whether that should be
    handled.
    """
    search_text = "%s %s" % (episode.season.serie.name, episode.num)

    url = 'http://thepiratebay.org/search/%s/0/7/0' % urllib.quote(search_text)
    search = urllib2.urlopen(url).read()
    torrents = BeautifulSoup(search).findAll('td')
    if len(torrents) > 1:
        torrent = torrents[1]
        link = BeautifulSoup("<html><body>%s</body></html>" % torrent).findAll('a')[1]
        link = re.search('href="(.*?)"', str(link)).group(1)

        if link.rstrip():
            download = model.Download()
            download.torrentFile = link
            download.episode = episode

            model.Session.add(download)

            target = os.path.join(getOption('download.torrent.folder'), os.path.basename(link))
            # Fetch first so a failed download does not leave an empty file.
            torrent_data = urllib2.urlopen(link).read()
            # .torrent files are binary: write in 'wb' so no newline
            # translation corrupts them, and let ``with`` close the handle
            # even if the write raises.
            with open(target, 'wb') as fp:
                fp.write(torrent_data)