import Queue, issuuPagePub, csv import queueMethod as qm thisPage = issuuPagePub.issuuPagePub('http://issuu.com/jamesleng/docs/jamesleng_portfolio2013') print thisPage._width
myqueue.put("http://issuu.com/wangzigeng/docs/narrator_wang_zigeng_1500dpi") myqueue.put("http://issuu.com/sogkarimi/docs/karimiarchportfolio") myqueue.put("http://issuu.com/b.a.maranda/docs/portfolio_2015") myqueue.put("http://issuu.com/justinoh/docs/20150102_portfolio__compiled_") myqueue.put("http://issuu.com/maithamalmubarak/docs/portfolio2014") myqueue.put("http://issuu.com/yutianwang/docs/portfolio_of_yutian_wang_harvard_ma") myqueue.put("http://issuu.com/lixiangyu/docs/portfolio_b5-") myqueue.put("http://issuu.com/archdekk/docs/portfolio2013") count = 0 while count < 2000: if myqueue.qsize() == 0: break thisurl = myqueue.get() thisPage = issuuPagePub.issuuPagePub(thisurl) if dictPub.has_key(thisurl): continue dictPub[thisurl] = thisPage.getInformation() count += 1 print str(count) + " : " + str(thisPage) print "Queue current size "+ str(myqueue.qsize()) thisPage.setKeywordDict(['portfolio', 'work', 'project', 'sample', 'architect', 'architecture']) thisPage.initRelatedInformation() relatedUrl = thisPage.getRelatedUrl() for index in xrange(len(relatedUrl)): if myqueue.qsize() < 30000 and dictQueue.has_key(relatedUrl[index]) == 0: myqueue.put(relatedUrl[index]) dictQueue[relatedUrl[index]] = 0 with open('C:\Users\walter\Desktop\stat.csv', 'wb') as csvfile:
#downloadPublications.py '''an application to download publication using issuuPagePub class @version0.2.150912 @author:maajor{<mailto:[email protected]>} ''' import issuuPagePub aPage = issuuPagePub.issuuPagePub( 'http://issuu.com/elena_ardighieri/docs/portfolio_2014_3rd_print_opt') #change to the publication url you want print aPage aPage.savePageImages('D:/test//') #change to your own directory
myqueue.put("http://issuu.com/sogkarimi/docs/karimiarchportfolio") myqueue.put("http://issuu.com/b.a.maranda/docs/portfolio_2015") myqueue.put("http://issuu.com/justinoh/docs/20150102_portfolio__compiled_") myqueue.put("http://issuu.com/maithamalmubarak/docs/portfolio2014") myqueue.put( "http://issuu.com/yutianwang/docs/portfolio_of_yutian_wang_harvard_ma") myqueue.put("http://issuu.com/lixiangyu/docs/portfolio_b5-") myqueue.put("http://issuu.com/archdekk/docs/portfolio2013") count = 0 while count < 2000: if myqueue.qsize() == 0: break thisurl = myqueue.get() thisPage = issuuPagePub.issuuPagePub(thisurl) if dictPub.has_key(thisurl): continue dictPub[thisurl] = thisPage.getInformation() count += 1 print str(count) + " : " + str(thisPage) print "Queue current size " + str(myqueue.qsize()) thisPage.setKeywordDict([ 'portfolio', 'work', 'project', 'sample', 'architect', 'architecture' ]) thisPage.initRelatedInformation() relatedUrl = thisPage.getRelatedUrl() for index in xrange(len(relatedUrl)): if myqueue.qsize() < 30000 and dictQueue.has_key( relatedUrl[index]) == 0: myqueue.put(relatedUrl[index])
import Queue, issuuPagePub, csv import queueMethod as qm thisPage = issuuPagePub.issuuPagePub( 'http://issuu.com/jamesleng/docs/jamesleng_portfolio2013') print thisPage._width
#downloadPublications.py '''an application to download publication using issuuPagePub class @version0.2.150912 @author:maajor{<mailto:[email protected]>} ''' import issuuPagePub aPage = issuuPagePub.issuuPagePub('http://issuu.com/elena_ardighieri/docs/portfolio_2014_3rd_print_opt') #change to the publication url you want print aPage aPage.savePageImages('D:/test//') #change to your own directory