# Example no. 1
0
# Read the pagination summary of the first search response.
# `responseDict` is expected to be defined earlier in the file.
numTotalPages = responseDict['paginationOutput']['totalPages']
numTotalEntries = responseDict['paginationOutput']['totalEntries']
currPage = responseDict['paginationOutput']['pageNumber']

# DEBUG - print search information.
# str() is applied to every value so the concatenation works whether the
# pagination fields are strings or numbers.
print("Number of Total Pages to Search: " + str(numTotalPages))
print("Number of Total Entries: " + str(numTotalEntries))
print("Current Page: " + str(currPage))

# Loop over subsequent pages in the search, 100 entries per page, up to 10 pages.
# Page 1 has already been fetched, so the counter starts at 1 and the loop
# requests pages 2..lastPage.
maxPages = 10
# The upper bound never changes inside the loop, so compute it once.
lastPage = min(maxPages, int(numTotalPages))
pageNum = 1
while pageNum < lastPage:
    try:
        response = api.next_page()
    except ConnectionError as e:
        # Retrying here without advancing pageNum would loop forever on a
        # persistent failure, so report the error and keep what was collected.
        print(e)
        break

    responseSoup = soup(response.content, 'html.parser')
    responseDict = response.dict()
    newItems = responseSoup.find_all('item')
    items += newItems

    currPage = responseDict['paginationOutput']['pageNumber']
    print("Current Page: " + str(currPage))
    pageNum += 1

# DEBUG
# print(soup.text + "\n")
# totalentries = int(soup.find('totalentries').text)
# print(str(totalentries) + "\n")