Esempio n. 1
0
# Loop over the URLs that were read: for each one, fetch the page, parse it
# and start filling in an Exercise object (name, URL, rating).
for url in urls:
    # Remove newline characters from the URL.
    # Presumably they are left over from reading the URLs line by line --
    # verify against the code that builds `urls`.
    url = url.replace("\n", "")
    # Progress feedback: `url_num` is a running counter that must already be
    # initialised before this loop (its definition is not in this excerpt).
    url_num += 1
    # Python 2 print statement: current index, total number of URLs, and URL.
    print url_num, "/", len(urls), " url: ", url

    # Fetch the page through `browser`, which is created outside this excerpt.
    page = browser.open(url)

    # Parse the response body with BeautifulSoup using the "lxml" parser.
    content = BeautifulSoup(page.read(), "lxml")
    # Not used in the lines visible here; presumably consumed further down.
    guideContent = content.find("div", {"class": "guideContent"})

    # The exercise name is the text of the <h1> inside the element whose id is
    # "exerciseDetails", with newlines removed and outer whitespace stripped.
    # NOTE(review): there is no guard for a missing element or an <h1> without
    # a single string child; either would raise AttributeError here -- confirm
    # that every scraped page has this structure.
    details = content.find(id="exerciseDetails")
    name = details.h1.string.replace("\n", "").strip()
    newExercise = Exercise(name)
    newExercise.set_url(url)

    summary = content.find("span", {"class": "summary"})

    # Use the page's rating unless the <span> that follows the summary span
    # has the text 'Read'; in that case fall back to "N/A".
    # NOTE(review): presumably 'Read' marks pages that have no rating yet --
    # confirm against the site's markup. `summary` is not checked for None.
    if summary.findNext('span').string != 'Read':
        rating = content.find("span", {"class": "rating"}).string
    else:
        rating = "N/A"

    newExercise.set_rating(rating)

    # Container element holding the exercise photo links.
    exercisePhotos = content.find("div", {"class": "exercisePhotos"})

    # Starts empty for every URL; presumably filled by the loop over the
    # photo links that follows.
    imgurls = []

    for photo in exercisePhotos.find_all("a"):