Python BeautifulSoup.__getattr__ Examples

Programming Language: Python

Namespace/Package Name: bs4

Class/Type: BeautifulSoup

Method/Function: __getattr__

Examples at hotexamples.com: 3

Python BeautifulSoup.__getattr__ - 3 examples found. These are the top rated real world Python examples of bs4.BeautifulSoup.__getattr__ extracted from open source projects. You can rate examples to help us improve the quality of examples.

Frequently Used Methods

Show Hide

append(30)

BeautifulSoup(30)

__str__(30)

__init__(11)

attrs(10)

__len__(8)

__repr__(3)

__unicode__(2)

article(2)

__copy__(2)

__getattr__(2)

first(2)

findAllNext(2)

feed(1)

currentTag(1)

fartind(1)

BF(1)

filter_wikilinks(1)

fina_all(1)

fnd_all(1)

h1(1)

replace_with(1)

td(1)

toCSV(1)

copy(1)

alcohol(1)

astype(1)

assign(1)

apply(1)

add_structure(1)

add_shared_term(1)

a(1)

_title(1)

_repr_html_(1)

_find_all(1)

_all_strings(1)

__getitem__(1)

__contains__(1)

NavigableString(1)

Date(1)

wrap(1)

Example #1

Show file

File: download-useragents.py Project: arthaud/python3-pwntools

    l.success()


def loop(xml):
    """Recursively gather user-agent strings from a parsed node tree.

    Each element yielded by iterating ``xml`` is inspected by its ``name``:

    * ``'useragent'`` -- its ``'useragent'`` attribute is stripped of
      surrounding whitespace and added to the module-level ``uas``
      collection.
    * ``'folder'`` -- descended into recursively, unless its
      ``'description'`` attribute is exactly ``'UA List :: About'``.
    * anything else is ignored.

    Nothing is returned; results accumulate in ``uas``.
    """
    for node in xml:
        kind = node.name
        if kind == 'useragent':
            uas.add(node['useragent'].strip())
            continue
        if kind != 'folder':
            continue
        # The "About" folder is deliberately not descended into.
        if node['description'] == 'UA List :: About':
            continue
        loop(node)

# Walk the document already held in `soup` and collect its user agents.
with log.waitfor('Parsing list') as progress:
    loop(soup.useragentswitcher)
    progress.success()

# Download the second list and rebind `soup` to its parsed form.
with log.waitfor('Fetching from http://www.user-agents.org') as progress:
    xml = getxml('http://www.user-agents.org/allagents.xml')
    soup = BeautifulSoup(xml)
    progress.success()

with log.waitfor('Parsing list') as progress:
    # The tag name contains a hyphen, so it cannot be written as plain
    # attribute access (`soup.user-agents` would be a subtraction); the
    # lookup is therefore spelled out through __getattr__.
    for entry in soup.__getattr__('user-agents'):
        if entry.name != 'user-agent':
            continue
        first_string = entry.select('string')[0]
        uas.add(first_string.string.strip())
    progress.success()

total = len(uas)
log.info('Fetched %d user agents' % total)

# One user agent per line; sorting is done on the newline-terminated lines.
lines = sorted(agent + '\n' for agent in uas)
write('useragents.txt', ''.join(lines))

Example #2

Show file


def loop(xml):
    """Recursively gather user-agent strings from a parsed node tree.

    Each element yielded by iterating ``xml`` is inspected by its ``name``:

    * ``'useragent'`` -- its ``'useragent'`` attribute is stripped of
      surrounding whitespace and added to the module-level ``uas``
      collection.
    * ``'folder'`` -- descended into recursively, unless its
      ``'description'`` attribute is exactly ``'UA List :: About'``.
    * anything else is ignored.

    Nothing is returned; results accumulate in ``uas``.
    """
    for node in xml:
        kind = node.name
        if kind == 'useragent':
            uas.add(node['useragent'].strip())
            continue
        if kind != 'folder':
            continue
        # The "About" folder is deliberately not descended into.
        if node['description'] == 'UA List :: About':
            continue
        loop(node)


# Walk the document already held in `soup` and collect its user agents.
with log.waitfor('Parsing list') as progress:
    loop(soup.useragentswitcher)
    progress.success()

# Download the second list and rebind `soup` to its parsed form.
with log.waitfor('Fetching from http://www.user-agents.org') as progress:
    xml = getxml('http://www.user-agents.org/allagents.xml')
    soup = BeautifulSoup(xml)
    progress.success()

with log.waitfor('Parsing list') as progress:
    # The tag name contains a hyphen, so it cannot be written as plain
    # attribute access (`soup.user-agents` would be a subtraction); the
    # lookup is therefore spelled out through __getattr__.
    for entry in soup.__getattr__('user-agents'):
        if entry.name != 'user-agent':
            continue
        first_string = entry.select('string')[0]
        uas.add(first_string.string.strip())
    progress.success()

total = len(uas)
log.info('Fetched %d user agents' % total)

# One user agent per line; sorting is done on the newline-terminated lines.
lines = sorted(agent + '\n' for agent in uas)
write('useragents.txt', ''.join(lines))

Example #3

Show file

<a href="http://example.com/tillie" class="sister" id="link3">Tillie</a>;
and they lived at the bottom of a well.</p>

<p class="story">...</p>
"""

soup = BeautifulSoup(html_doc, "html.parser")

#print(soup.prettify())
# Two equivalent ways to select tags whose name starts with "b":
# a compiled regular expression, and a predicate called with each tag.
for tag in soup.find_all(re.compile("^b")):
    print(tag.name)
for tag in soup.find_all(lambda x: x.name.startswith('b')):
    print(tag.name)

# Parse a fragment containing HTML entities with the html5lib parser and
# print the resulting document.
soup2 = BeautifulSoup("&ldquo;Dammit!&rdquo; he said.", "html5lib")
print(str(soup2))

# Compare three ways of asking whether the soup "has" a `title`, then fetch
# it explicitly through __getattr__, the hook behind `soup.title`.
print('title' in dir(soup))
print(hasattr(soup, 'title'))
print('title' in soup.__dict__)
print(soup.__getattr__('title'))

# The markup must be a *bytes* literal: \xc3\xa9 is the UTF-8 encoding of
# "é".  As a plain str literal on Python 3 it would already be decoded text
# ("SacrÃ© bleu!"), so no encoding detection would take place and the
# expected output noted below would not be produced.  On Python 2 the b
# prefix is a no-op, so this stays backward-compatible.
markup = b"<h1>Sacr\xc3\xa9 bleu!</h1>"
soup = BeautifulSoup(markup, "html5lib")
print(soup.h1)
# <h1>Sacré bleu!</h1>
print(soup.h1.string)
# Sacré bleu!   (u'Sacr\xe9 bleu!' as a repr)
# Encoding detected while decoding the byte input.
print(soup.original_encoding)
print(soup.contains_replacement_characters)
# Passing an encoding to prettify() re-encodes the output in that encoding.
print(soup.prettify("latin-1"))

Python BeautifulSoup.__getattr__ Examples

Python BeautifulSoup.__getattr__ Examples