Example #1
import re

def crawl_web(seed):
    # get_page(), get_all_links(), and Storage are assumed to be defined
    # elsewhere; a sketch of plausible implementations follows this example.
    tocrawl = set([seed])   # frontier of URLs still to visit
    crawled = []            # already-visited URLs (a set would make the lookup O(1))
    database = Storage()
    while tocrawl:
        url = tocrawl.pop()
        if url not in crawled:
            content = get_page(url)
            text = content.get_text()
            text = re.sub(r"[-/']", ' ', text)
            text = re.sub(
                ur'[\u0932\u094b\u0917\u092a\u0930\u093f\u0926\u0943\u0936\u094d\u092f\u0938\u094d\u0925\u093e\u0928\u0915\u0930\u094d\u092e\u091a\u093e\u0930\u0940\u201c\u2013\u2019\u092b\u201d]',
                ' ', text)
            outlinks = get_all_links(content)
            for outlink in outlinks:
                database.add_link(url, outlink)
            punctuation = ".?;,!()|:\""
            for word in text.split():
                word = word.lstrip(punctuation).rstrip(punctuation).lower()
                search = re.search(r"[^a-z0-9]", word)
                if not search and word != "":
                    database.add_word_occurrence(url, word)
            tocrawl.update(outlinks)
            crawled.append(url)
    return database
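
All of the examples call three helpers that are defined elsewhere: get_page(url), get_all_links(content), and Storage. The .get_text() and .title usage suggests the page object is BeautifulSoup-like; under that assumption (requests + BeautifulSoup, with a purely in-memory Storage), a minimal sketch of the helpers might look like this:

import requests
from bs4 import BeautifulSoup
from collections import defaultdict

def get_page(url):
    # Fetch and parse a page; the examples call .get_text() and .title
    # on the result, so return a BeautifulSoup object.
    return BeautifulSoup(requests.get(url, timeout=10).text, "html.parser")

def get_all_links(content):
    # Every href on the page; a real crawler would also resolve relative
    # URLs (urllib.parse.urljoin) and filter out non-HTTP schemes.
    return [a["href"] for a in content.find_all("a", href=True)]

class Storage:
    # In-memory stand-in for whatever store the examples write into.
    def __init__(self):
        self.links = defaultdict(list)   # url -> outgoing links
        self.index = defaultdict(set)    # word -> urls it occurs on
        self.titles = {}                 # url -> page title (Example #2 only)

    def add_link(self, url, outlink):
        self.links[url].append(outlink)

    def add_word_occurrence(self, url, word):
        self.index[word].add(url)

    def add_title(self, url, title):
        self.titles[url] = title

One design note: tocrawl.pop() on a set removes an arbitrary element, so the crawl order is unspecified; a collections.deque popped from the left would give breadth-first order instead.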
Example #2
import re

def crawl_web(seed):
    tocrawl = set([seed])
    crawled = []
    database = Storage()
    while tocrawl:
        url = tocrawl.pop()
        if url not in crawled:
            print(url)   # progress trace
            soup = get_page(url)
            text = soup.get_text()
            text = re.sub(r"[-/']", ' ', text)
            # Strip Devanagari characters plus curly quotes and the en dash
            # (Python 3's re understands \uXXXX escapes in patterns).
            text = re.sub(r'[\u0932\u094b\u0917\u092a\u0930\u093f\u0926\u0943\u0936\u094d\u092f\u0938\u094d\u0925\u093e\u0928\u0915\u0930\u094d\u092e\u091a\u093e\u0930\u0940\u201c\u2013\u2019\u092b\u201d]', ' ', text)
            outlinks = get_all_links(soup)
            # soup.title is None on pages without a <title> tag.
            url_title = str(soup.title.string) if soup.title else ""
            database.add_title(url, url_title)
            for outlink in outlinks:
                database.add_link(url, outlink)
            punctuation = ".?;,!()|:\""
            for word in text.split():
                word = word.lstrip(punctuation).rstrip(punctuation).lower()
                search = re.search(r"[^a-z0-9]", word)
                if not search and word != "":   # != compares values; "is not" tests identity
                    database.add_word_occurrence(url, word)
            tocrawl.update(outlinks)
            crawled.append(url)
    return database
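
With the sketched helpers above in scope, a run might be driven like this (the seed URL is hypothetical, and .titles/.index belong to the sketched Storage, not any real backend; the crawl is unbounded, so real use would cap depth or page count):

db = crawl_web("http://example.com/")           # hypothetical seed URL
print(db.titles.get("http://example.com/"))     # title recorded by add_title
print(sorted(db.index.get("python", set())))    # pages where "python" occurs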
Example #3
import re

def crawl_web(seed):
    tocrawl = set([seed])
    crawled = []
    database = Storage()
    while tocrawl:
        url = tocrawl.pop()
        if url not in crawled:
            print(url)   # progress trace
            content = get_page(url)
            text = content.get_text()
            text = re.sub(r"[-/']", ' ', text)
            outlinks = get_all_links(content)
            for outlink in outlinks:
                database.add_link(url, outlink)
            punctuation = ".?;,!()|:\""
            for word in text.split():
                word = word.lstrip(punctuation).rstrip(punctuation).lower()
                search = re.search(r"[^a-z0-9]", word)
                if not search and word != "":
                    database.add_word_occurrence(url, word)
            tocrawl.update(outlinks)
            crawled.append(url)
    return database
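
The guard above uses != rather than is not: is tests object identity, and an equal string built at runtime is generally a different object, so an identity check against "" only works by accident of CPython's string interning. A quick illustration:

x = "hel"
y = x + "lo"           # built at runtime, not interned
print(y == "hello")    # True: equal by value
print(y is "hello")    # False: distinct objects (SyntaxWarning on Python 3.8+)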