コード例 #1
0
ファイル: elalC_scrape.py プロジェクト: gabik/wizzscrape
    curs.execute(
        "select * FROM flights WHERE direction=%s and dst=%s and date=%s and dep_time=%s and company=%s",
        (i['direction'], DST, str(i['year']) + "-" + str(i['month']) + "-" +
         str(i['day']), '00:00', str(company_id)))
    if (len(curs.fetchall()) > 0):
        curs.execute(
            "DELETE FROM flights WHERE direction=%s and dst=%s and date=%s and dep_time=%s and company=%s",
            (i['direction'], DST, str(i['year']) + "-" + str(i['month']) +
             "-" + str(i['day']), '00:00', str(company_id)))
    curs.execute(
        "INSERT INTO flights (company, scrape_time, direction, dst, price, dep_time, arr_time, date, dur_time) VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s)",
        (str(company_id), str(scrape_time), i['direction'], DST, int(
            i['price']), '00:00', '00:00', str(i['year']) + "-" +
         str(i['month']) + "-" + str(i['day']), get_flight_time(i, DST)))
    curs.execute(
        "INSERT INTO archive_flights (company, scrape_time, direction, dst, price, dep_time, arr_time, date, dur_time) VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s)",
        (str(company_id), str(scrape_time), i['direction'], DST, int(
            i['price']), '00:00', '00:00', str(i['year']) + "-" +
         str(i['month']) + "-" + str(i['day']), get_flight_time(i, DST)))

if cleandone == 1:
    curs.execute(
        "delete from flights where company=%s and dst=%s and date>=%s and date<%s and scrape_time<%s",
        (str(company_id), DST, str(Start_orig.strftime("%Y-%m-%d")),
         str(Stop.strftime("%Y-%m-%d")), str(scrape_time)))
    print "Done!"

db.commit()

print datetime.datetime.now()
コード例 #2
0
ファイル: elal_scrape.py プロジェクト: gabik/wizzscrape
print ""
if debug_flag:
 print "Debug: efore clean_dup: Out, Inc: "
 print flightsList
fl2=up.clean_dup_max(flightsList, 1)
fl3=up.clean_dup_max(flightsList, 2)
fl2.extend(fl3)
if debug_flag:
 print "Debug: After clean_dup: Out, Inc: "
 for i in fl2:
  print i

#db= psycopg2.connect( host="manegerdb.cjjasb6ckbh1.us-east-1.rds.amazonaws.com", database="GabiScrape", user="******", password="******")
curs = db.cursor()
curs.execute("select id from companies where name='elal'")
company_id=curs.fetchone()[0]
for i in fl2:
 curs.execute("select * FROM flights WHERE direction=%s and dst=%s and date=%s and dep_time=%s and company=%s", (i['direction'],DST,str(i['year'])+"-"+str(i['month'])+"-"+str(i['day']), str(i['dep_time']), str(company_id)))
 if (len(curs.fetchall()) > 0):
  curs.execute("DELETE FROM flights WHERE direction=%s and dst=%s and date=%s and dep_time=%s and company=%s", (i['direction'],DST,str(i['year'])+"-"+str(i['month'])+"-"+str(i['day']), str(i['dep_time']), str(company_id)))
 curs.execute("INSERT INTO flights (company, scrape_time, direction, dst, price, dep_time, arr_time, date, dur_time) VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s)", (str(company_id), str(scrape_time), i['direction'], DST, int(i['price']),  str(i['dep_time']),   str(i['arr_time']),  str(i['year'])+"-"+str(i['month'])+"-"+str(i['day']), get_flight_time(i, DST)))
 curs.execute("INSERT INTO archive_flights (company, scrape_time, direction, dst, price, dep_time, arr_time, date, dur_time) VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s)", (str(company_id), str(scrape_time), i['direction'], DST, int(i['price']),  str(i['dep_time']),   str(i['arr_time']),  str(i['year'])+"-"+str(i['month'])+"-"+str(i['day']), get_flight_time(i, DST)))

if cleandone==1:
 curs.execute("delete from flights where company=%s and dst=%s and date>=%s and date<%s and scrape_time<%s", (str(company_id), DST, str(Start_orig.strftime("%Y-%m-%d")), str(Stop.strftime("%Y-%m-%d")), str(scrape_time)))
 print "Done!"

db.commit()

print datetime.datetime.now()