def createGeneralCards(cards, browser, environmentTags, url, cardCategory):
    """Append one card per id-carrying element found on the page at ``url``.

    The page is fetched with ``browser.getContentOfPage(url)`` and searched
    with ``findAll(environmentTags)``. Elements without an ``id`` attribute
    are skipped; every other element yields a card whose link is
    ``url + "#" + id`` and whose title is ``mergeStringContent(element)``.

    Args:
        cards: List that receives the new cards; it is mutated in place.
        browser: Object exposing ``getContentOfPage(url)``, which returns a
            pair whose second item is the page content object.
        environmentTags: Selector forwarded unchanged to ``findAll``.
        url: Address of the page to scan; also the base of every card link.
        cardCategory: Category handed to ``createSanitizedCard`` and appended
            to the summary line printed at the end.

    Returns:
        None. A summary of how many cards were added is printed.
    """
    _, page = browser.getContentOfPage(url)
    countBefore = len(cards)

    for element in page.findAll(environmentTags):
        if "id" not in element.attrs:
            # Without an id there is no fragment to link to.
            continue

        anchoredLink = url + "#" + element.attrs["id"]
        title = mergeStringContent(element)
        cards.append(createSanitizedCard(cardCategory, title, anchoredLink))

    addedCount = len(cards) - countBefore
    print("added " + str(addedCount) + " cards for category : " + cardCategory)
示例#2
0
def createGeneralCards(cards, browser, environmentTags, url, cardCategory):
    """Collect cards for every element of the page that has an ``id``.

    Loads ``url`` through ``browser.getContentOfPage``, looks up the elements
    matching ``environmentTags`` via ``findAll`` and appends to ``cards`` one
    entry per element that carries an ``id`` attribute. Each entry is built
    by ``createSanitizedCard`` from ``cardCategory``, the element's merged
    string content and the link ``url + '#' + id``.

    Args:
        cards: Target list, extended in place.
        browser: Page retriever providing ``getContentOfPage(url)``.
        environmentTags: Selector passed straight to ``findAll``.
        url: Page address, reused as the prefix of each card link.
        cardCategory: Category of the created cards; also printed in the
            final summary line.

    Returns:
        None. The number of added cards is reported on standard output.
    """
    _, document = browser.getContentOfPage(url)
    initialCount = len(cards)

    # Only elements carrying an id can be addressed through a URL fragment.
    linkable = (tag for tag in document.findAll(environmentTags)
                if 'id' in tag.attrs)
    for tag in linkable:
        fragmentLink = url + '#' + tag.attrs['id']
        cards.append(
            createSanitizedCard(cardCategory, mergeStringContent(tag),
                                fragmentLink))

    summary = ("added " + str(len(cards) - initialCount) +
               " cards for category : " + cardCategory)
    print(summary)
from ankiflashcardcreationtools.CrawlTools import ContentRetrieverUsingSelenium, mergeStringContent
from ankiflashcardcreationtools.CardTools import createSanitizedCard, createCSVFile


if __name__ == "__main__":
    # Script entry point: read the index page of the Python 3 tutorial,
    # turn every "reference internal" link inside its "toctree-wrapper" div
    # into a card, and hand the collected cards to createCSVFile.
    print("Make sure Firefox is running !")

    cards = []
    timeout = 1.5  # passed to the retriever; presumably seconds - confirm
    baseUrl = "https://docs.python.org/3/tutorial/"
    startUrl = baseUrl + "index.html"
    cardCategory = "Python 3"

    browser = ContentRetrieverUsingSelenium(timeout)

    try:
        _, content = browser.getContentOfPage(startUrl)
        tocTree = content.find("div", {"class": "toctree-wrapper"})
        if tocTree is None:
            # The find/find_all calls suggest a BeautifulSoup document, whose
            # find() returns None when nothing matches (e.g. the page did not
            # load in time). Fail with a readable message instead of an
            # AttributeError on None in the next statement.
            raise RuntimeError(
                "no div with class 'toctree-wrapper' found on " + startUrl)
        links = tocTree.find_all("a", {"class": "reference internal"})

        for link in links:
            cardTitle = mergeStringContent(link)
            # The href is appended to baseUrl as-is, so it is expected to be
            # relative to the tutorial directory.
            cardLink = baseUrl + link.attrs["href"]
            card = createSanitizedCard(cardCategory, cardTitle, cardLink)
            cards.append(card)
    finally:
        # Always release the browser, even when crawling fails.
        browser.close()

    print("finished collecting " + str(len(cards)))
    createCSVFile("python3", cards)
示例#4
0
    mergeStringContent
from ankiflashcardcreationtools.CardTools import createSanitizedCard,\
    createCSVFile

if __name__ == '__main__':
    # Script entry point: read the index page of the Python 3 tutorial,
    # turn every 'reference internal' link inside its 'toctree-wrapper' div
    # into a card, and hand the collected cards to createCSVFile.
    print("Make sure Firefox is running !")

    cards = []
    timeout = 1.5  # passed to the retriever; presumably seconds - confirm
    baseUrl = 'https://docs.python.org/3/tutorial/'
    startUrl = baseUrl + 'index.html'
    cardCategory = 'Python 3'

    browser = ContentRetrieverUsingSelenium(timeout)

    try:
        _, content = browser.getContentOfPage(startUrl)
        tocTree = content.find('div', {'class': 'toctree-wrapper'})
        if tocTree is None:
            # The find/find_all calls suggest a BeautifulSoup document, whose
            # find() returns None when nothing matches (e.g. the page did not
            # load in time). Fail with a readable message instead of an
            # AttributeError on None in the next statement.
            raise RuntimeError(
                "no div with class 'toctree-wrapper' found on " + startUrl)
        links = tocTree.find_all('a', {'class': 'reference internal'})

        for link in links:
            cardTitle = mergeStringContent(link)
            # The href is appended to baseUrl as-is, so it is expected to be
            # relative to the tutorial directory.
            cardLink = baseUrl + link.attrs['href']
            card = createSanitizedCard(cardCategory, cardTitle, cardLink)
            cards.append(card)
    finally:
        # Always release the browser, even when crawling fails.
        browser.close()

    print("finished collecting " + str(len(cards)))
    createCSVFile("python3", cards)