# Fragment of a search loop body (enclosing loop/function is not visible here).
# What the statements on the next line do, in order:
#   * set the remaining suggestion / second-leg station form fields in `dict`
#     to '', store `viewstate` under '__VIEWSTATE' and "" under 'pageToken';
#   * POST the form to http://tickets.vueling.com/XmlSearch.aspx via `s.post`;
#   * when the status code is 200 and find_all() yields at least one
#     "basicPriceRoute" hit, set `cleanr2` to the slice of r2.text that starts
#     5 characters before the smallest value yielded by find_all (presumably
#     the first match offset) and ends at the next 'SKYSALES.Util.createObject'
#     searched from that same offset;
#   * otherwise bump `retries`; the max_retries branch prints Start/Ret,
#     resets `cleandone`, advances `Start` by one day and increments `n`;
#   * pass `cleanr2` to write_to_gabi().
# NOTE(review): line breaks and indentation were lost in this fragment, so
#   which `if` the `else:` pairs with, and how deeply `continue` is nested,
#   cannot be determined from here -- confirm against the original script.
# NOTE(review): str.find returns -1 when the marker is missing, which would
#   make the slice end one character before the end of r2.text.
# NOTE(review): `dict` shadows the builtin, and the same find_all() result is
#   recomputed three times; `print` is Python 2 statement syntax.
dict['SelectedSuggestionOrigin1']='' dict['ErroneousWordDestination1']='' dict['SelectedSuggestionDestination1']='' dict['departureStationCode2']='' dict['arrivalStationCode2']='' dict['ErroneousWordOrigin2']='' dict['SelectedSuggestionOrigin2']='' dict['ErroneousWordDestination2']='' dict['SelectedSuggestionDestination2']='' dict['__VIEWSTATE'] = viewstate dict['pageToken'] = "" r2 = s.post('http://tickets.vueling.com/XmlSearch.aspx', data=dict, headers=headers) cleanr2 = "" if r2.status_code == 200: if list(find_all(r2.text, "basicPriceRoute")): cleanr2=r2.text[sorted(list(find_all(r2.text, "basicPriceRoute")))[0]-5:r2.text.find('SKYSALES.Util.createObject', sorted(list(find_all(r2.text, "basicPriceRoute")))[0])] else: retries+=1 if retries>max_retries: print "Start:{0}, Ret:{1}. ".format(str(Start), str(Ret)) cleandone=0 Start=Start + datetime.timedelta(days=1) n+=1 continue write_to_gabi(cleanr2) #try: #cleanr2=r2.text[sorted(list(find_all(r2.text, "basicPriceRoute")))[0]-5:r2.text.find('</tbody>', sorted(list(find_all(r2.text, "basicPriceRoute")))[-1])] #except IndexError :
# Fragment of a search loop body (enclosing loop/function is not visible here).
# What the statements on the next line do, in order:
#   * write r2.text, UTF-8 encoded, to
#     /tmp/output_pages/<sys.argv[0]>_<DST>_<Start>-<Ret>.html and `continue`
#     (the condition guarding this dump is outside this fragment);
#   * format `Start` as dd-mm-YYYY, build a getFlight(cur_date) parser and
#     feed it r2.text;
#   * when `debug_flag` is set, print both dates as dd/mm/YYYY, the number of
#     "marketColumn" hits, the text following each '<span class="price">' tag
#     (20 is the length of that tag) up to the next '<' searched within the
#     following 10 characters, then the parsed rows, `r2` and a separator;
#   * append prP.data to `flightsList`, set `Start` to `Ret`, print "".
# NOTE(review): line breaks and indentation were lost in this fragment; the
#   extent of the `if debug_flag:` body and the nesting of `continue` are
#   assumptions -- confirm against the original script.
# NOTE(review): the debug loop variable `s` has the same name as the object
#   whose `.post` is called elsewhere in this file; if both share a scope,
#   running with debug_flag set would rebind it to an int -- verify.
# NOTE(review): str.find returns -1 when no '<' lies within the 10-character
#   window, which would make the printed slice run almost to the end of the
#   page; sys.argv[0] may contain path separators -- verify the dump path.
fd = codecs.open('/tmp/output_pages/' + sys.argv[0] + '_' + DST + '_' + str(Start) + '-' + str(Ret) + '.html', 'w', encoding='utf-8') fd.write(r2.text) fd.close() continue cur_date = Start.strftime("%d-%m-%Y") prP = getFlight(cur_date) prP.feed(r2.text) if debug_flag: print Start.strftime("%d/%m/%Y") print Ret.strftime("%d/%m/%Y") print len(list(find_all(r2.text, "marketColumn"))) for s in find_all(r2.text, '<span class="price">'): print strip_non_ascii( r2.text[s + 20:r2.text.find('<', s + 20, s + 30)]) print len(prP.data) for t in prP.data: print t print r2 print '-------' flightsList.extend(prP.data) Start = Ret print "" #Out=[] #Inc=[] #for i in flightsList: #if i['direction'] == 4 :
# Fragment of a search loop body (enclosing loop/function is not visible here).
# What the statements on the next line do, in order:
#   * reset `cleandone` to 0 and advance `Start` by one day;
#   * when `debug_flag` is set, write r2.text, UTF-8 encoded, to
#     /tmp/output_pages/<sys.argv[0]>_<DST>_<Start>-<Ret>.html (the file name
#     uses the already-advanced `Start`), then `continue`;
#   * format `Start` as dd-mm-YYYY, build a getFlight(cur_date) parser and
#     feed it r2.text;
#   * when `debug_flag` is set, print both dates as dd/mm/YYYY, the number of
#     "marketColumn" hits, the text following each '<span class="price">' tag
#     (20 is the length of that tag) up to the next '<' searched within the
#     following 10 characters, then the parsed rows, `r2` and a separator;
#   * append prP.data to `flightsList`, set `Start` to `Ret`, print "".
# NOTE(review): line breaks and indentation were lost in this fragment;
#   whether `continue` sits inside or after the `if debug_flag:` dump, and
#   which branch the leading statements belong to, cannot be determined from
#   here -- confirm against the original script.
# NOTE(review): the debug loop variable `s` has the same name as the object
#   whose `.post` is called elsewhere in this file; if both share a scope,
#   running with debug_flag set would rebind it to an int -- verify.
# NOTE(review): str.find returns -1 when no '<' lies within the 10-character
#   window, which would make the printed slice run almost to the end of the
#   page; sys.argv[0] may contain path separators -- verify the dump path.
cleandone=0 Start=Start + datetime.timedelta(days=1) if debug_flag: fd=codecs.open('/tmp/output_pages/'+sys.argv[0]+'_'+DST+'_'+str(Start)+'-'+str(Ret)+'.html', 'w', encoding='utf-8') fd.write(r2.text) fd.close() continue cur_date=Start.strftime("%d-%m-%Y") prP = getFlight(cur_date) prP.feed(r2.text) if debug_flag: print Start.strftime("%d/%m/%Y") print Ret.strftime("%d/%m/%Y") print len(list(find_all(r2.text, "marketColumn"))) for s in find_all(r2.text, '<span class="price">'): print strip_non_ascii(r2.text[s+20:r2.text.find('<', s+20, s+30)]) print len(prP.data) for t in prP.data : print t print r2 print '-------' flightsList.extend(prP.data) Start=Ret print "" #Out=[] #Inc=[] #for i in flightsList: #if i['direction'] == 4 : #Out.append(i) #else:
# Fragment of a search loop body (enclosing loop/function is not visible here).
# What the statements on the next line do, in order:
#   * set the remaining suggestion / second-leg station form fields in `dict`
#     to '', store `viewstate` under '__VIEWSTATE' and "" under 'pageToken';
#   * POST the form to http://tickets.vueling.com/XmlSearch.aspx via `s.post`;
#   * when the status code is 200 and find_all() yields at least one
#     "basicPriceRoute" hit, set `cleanr2` to the slice of r2.text that starts
#     5 characters before the smallest value yielded by find_all (presumably
#     the first match offset) and ends at the next 'SKYSALES.Util.createObject'
#     searched from that same offset;
#   * otherwise bump `retries`; the max_retries branch prints Start/Ret,
#     resets `cleandone`, advances `Start` by one day and increments `n`;
#   * pass `cleanr2` to write_to_gabi().
# NOTE(review): line breaks and indentation were lost in this fragment, so
#   which `if` the `else:` pairs with, and how deeply `continue` is nested,
#   cannot be determined from here -- confirm against the original script.
# NOTE(review): str.find returns -1 when the marker is missing, which would
#   make the slice end one character before the end of r2.text.
# NOTE(review): `dict` shadows the builtin, and the same find_all() result is
#   recomputed three times; `print` is Python 2 statement syntax.
dict['SelectedSuggestionDestination1'] = '' dict['departureStationCode2'] = '' dict['arrivalStationCode2'] = '' dict['ErroneousWordOrigin2'] = '' dict['SelectedSuggestionOrigin2'] = '' dict['ErroneousWordDestination2'] = '' dict['SelectedSuggestionDestination2'] = '' dict['__VIEWSTATE'] = viewstate dict['pageToken'] = "" r2 = s.post('http://tickets.vueling.com/XmlSearch.aspx', data=dict, headers=headers) cleanr2 = "" if r2.status_code == 200: if list(find_all(r2.text, "basicPriceRoute")): cleanr2 = r2.text[ sorted(list(find_all(r2.text, "basicPriceRoute")))[0] - 5:r2.text. find('SKYSALES.Util.createObject', sorted(list(find_all(r2.text, "basicPriceRoute")))[0])] else: retries += 1 if retries > max_retries: print "Start:{0}, Ret:{1}. ".format(str(Start), str(Ret)) cleandone = 0 Start = Start + datetime.timedelta(days=1) n += 1 continue write_to_gabi(cleanr2)