def __init__(self, *args, **kwargs):
    """Set up the instance and stamp a date into the session-id URL.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)
    self.portCitys = dataUtil.get_port_city()

    # NOTE(review): the template stored in custom_settings is overwritten
    # with the formatted URL below; if custom_settings is shared between
    # instances, a second construction would apply % to an already
    # formatted string -- confirm.
    url_template = self.custom_settings['SESSION_ID_URL']

    # Fetching a session needs a date, so use the one ten days from today.
    session_day = date.today() + timedelta(days=10)
    self.custom_settings['SESSION_ID_URL'] = (
        url_template % session_day.strftime('%d-%b-%Y')
    )
def __init__(self, *args, **kwargs):
    """Set up endpoints, request headers and session state for www.9air.com.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    self.start_urls = ['http://www.9air.com/app/GetFlight']
    self.ADT, self.version = 3, 2.0

    # Look up cities by airport.
    self.portCitys = dataUtil.get_port_city()

    # Session bookkeeping.
    self.session_id = ''
    self.session_flag = True

    # Endpoints.
    self.session_url = 'http://www.9air.com/app/Login'
    self.info_url = "http://www.9air.com/app/ChangeFlt"
    self.seat_url = 'http://www.9air.com/app/GetOrder?orderid='

    login_payload = {
        'op': 'lg',
        # Device ID; obtainable by logging in again on the Android client.
        'tck': '',
    }
    self.session_data = login_payload

    request_headers = {
        'android_version': '1.44',
        'Content-Type': 'application/x-www-form-urlencoded',
        'User-Agent': 'Apache-HttpClient/UNAVAILABLE (java 1.4)',
        'Host': 'www.9air.com',
    }
    self.headers = request_headers
    self.timeout = 5

    self.id_pool = [
        'A4FD4D17F0B6513BA4FD4D17F0B6513B0F01AC9B07E4EA18CCD0D90BAEF4076EC16A4AFE5B5FFD0C545F48C19EFEFD54A67C38DFC7165F61',
        'A4FD4D17F0B6513BA4FD4D17F0B6513B0F01AC9B07E4EA18CCD0D90BAEF4076EC7170EB068F5A7DDFEFBFF044B3C77B410C50AD1FDC6EC69',
        'A4FD4D17F0B6513BA4FD4D17F0B6513B0F01AC9B07E4EA18CCD0D90BAEF4076EC7170EB068F5A7DDF2BF7BD5087F7E44FA7BB8676BEFE96D',
        'A4FD4D17F0B6513BA4FD4D17F0B6513B0F01AC9B07E4EA18CCD0D90BAEF4076EC7170EB068F5A7DD72FD095C54E93C2105B8245E0DE6C37A',
        'A4FD4D17F0B6513BA4FD4D17F0B6513B0F01AC9B07E4EA18CCD0D90BAEF4076EC7170EB068F5A7DD5DE024C3ED7EDCC4ADE8F13194EF3C80',
    ]
def __init__(self, *args, **kwargs):
    """Set up the start URL, request headers and session state for wx.flycua.com.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    self.start_urls = [
        'http://wx.flycua.com/wechat/pip/book/flightSearch.json',
    ]
    self.ADT, self.version = 3, 1

    # Look up cities by airport.
    self.portCitys = dataUtil.get_port_city()

    self.session_id = ''
    self.session_flag = True

    # content-length, referer, cache-control and postman-token headers are
    # not set here.
    request_headers = {
        'Host': 'wx.flycua.com',
        'Origin': 'http://wx.flycua.com',
        'User-Agent': (
            'Mozilla/5.0 (Windows NT 6.1; Win64; x64) '
            'AppleWebKit/537.36 (KHTML, like Gecko) '
            'Chrome/71.0.3578.98 Safari/537.36'
        ),
        'isWechat': 'H5',
        'Content-Type': 'application/json',
        'Accept': 'application/json, text/plain, */*',
        'Cookie': 'JSESSIONID=7DB644CF0C5608A8198719E96B1AF8B9',
    }
    self.headers = request_headers
    self.timeout = 5
def __init__(self, *args, **kwargs):
    """Set up the start URL, headers and verification flags for book.evaair.com.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    self.start_urls = [
        'https://book.evaair.com/plnext/EVAOnlineDX/Override.action',
    ]
    self.ADT, self.version = 3, 1.0

    # Look up cities by airport.
    self.portCitys = dataUtil.get_port_city()

    self.session_id = ''
    self.session_flag = True

    # No static 'cookie' header is sent.
    request_headers = {
        'host': 'book.evaair.com',
        'origin': 'https://booking.evaair.com',
        'user-agent': (
            'Mozilla/5.0 (Windows NT 6.1; Win64; x64) '
            'AppleWebKit/537.36 (KHTML, like Gecko) '
            'Chrome/71.0.3578.98 Safari/537.36'
        ),
        'accept': (
            'text/html,application/xhtml+xml,application/xml;q=0.9,'
            'image/webp,image/apng,*/*;q=0.8'
        ),
        'content-type': 'application/x-www-form-urlencoded',
    }
    self.headers = request_headers
    self.timeout = 5

    # Verification state.
    self.js_verify_flag = True
    self.image_verify_flag = False
    self.js_verify_url = 'https://book.evaair.com/iframe.html'
    self.url = ''
def __init__(self, *args, **kwargs):
    """Set up the instance and pick a random cookie for the shared headers.

    A cookie is drawn from ``custom_settings['COOKIE_LIST']`` and written
    into ``custom_settings['HEADERS']['Cookie']``; the choice is printed.
    All arguments are forwarded unchanged to the parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)
    self.portCitys = dataUtil.get_port_city()

    # Swap the cookie globally.
    cookie_pool = self.custom_settings.get('COOKIE_LIST')
    chosen_cookie = random.choice(cookie_pool)
    shared_headers = self.custom_settings.get('HEADERS')
    shared_headers['Cookie'] = 'kuhang_=%s;' % chosen_cookie
    # A single parenthesised argument prints the same text under Python 2.
    print('使用cookie:%s进行访问' % chosen_cookie)
def __init__(self, *args, **kwargs):
    """Set up the start URL and defaults for www.flymango.com.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    self.start_urls = ['https://www.flymango.com/api/availability/search']
    self.ADT, self.version = '3', 1.6

    # Look up cities by airport.
    self.portCitys = dataUtil.get_port_city()
    self.currency = 'ZAR'
def __init__(self, *args, **kwargs):
    """Initialise W6Spider and merge the base payload into each request payload.

    ``custom_settings['BASE_DATA']`` is merged into the GET_SESSION_DATA,
    GET_DATE_DATA and DEFAULT_DATA dictionaries, then the default request
    headers are replaced by the result of ``self.get_headers()``.
    All arguments are forwarded unchanged to the parent initialiser.
    """
    super(W6Spider, self).__init__(*args, **kwargs)

    settings = self.custom_settings
    # Same order as before: session data, date data, then default data.
    for payload_key in ('GET_SESSION_DATA', 'GET_DATE_DATA', 'DEFAULT_DATA'):
        payload = settings[payload_key]
        payload.update(settings.get('BASE_DATA'))

    settings['DEFAULT_REQUEST_HEADERS'] = self.get_headers()
    self.portCitys = dataUtil.get_port_city()
def __init__(self, *args, **kwargs):
    """Set up the start URL and defaults for fly.elal.co.il.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    self.start_urls = [
        'https://fly.elal.co.il/plnext/mobile4LY/MFlexPricerAvailabilityDispatcherPui.action;jsessionid=',
    ]
    self.ADT, self.version = 3, 1.0

    # Look up cities by airport.
    self.port_city = dataUtil.get_port_city()
def __init__(self, name, num=1, proxy=1, local=1):
    """Store the host name, counters and the airport lookup result.

    Args:
        name: stored as ``self.host_name``.
        num: stored as ``self.num``.
        proxy: accepted but not used by this initialiser.
        local: stored as ``self.local``.
    """
    self.host_name = name
    self.num = num
    self.local = local

    self.ADT = 3
    self.now = 0
    self.permins = 0

    # Look up cities by airport.
    self.city_ports = dataUtil.get_port_city()
def __init__(self, *args, **kwargs):
    """Set up the start URL, defaults and flags for prod.open.flyscoot.com.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    self.start_urls = [
        'https://prod.open.flyscoot.com/v1/experience/query/search',
    ]
    self.ADT, self.version = 1, 1.5

    # Look up cities by airport.
    self.port_city = dataUtil.get_port_city()

    self.token_flag = True
    self.proxy_flag = False
def __init__(self):
    """Set up proxy/task state and load the JS filter keywords.

    Reads ``src/js_key.txt`` (a path relative to the current working
    directory) line by line. Each line is appended to ``self.js_list``
    after every pair of backslashes is collapsed to a single one and all
    spaces and newline characters are removed.

    Raises:
        IOError: if the keyword file cannot be opened.
    """
    self.proxy_flag = True
    self.ip = ''

    # Look up cities by airport.
    self.portCitys = dataUtil.get_port_city()

    self.task = []
    self.buffer = []

    # Process the JS filter keywords.
    self.js_list = []
    # Use a context manager so the file handle is closed deterministically,
    # including when reading fails part-way through.
    with open("src/js_key.txt") as key_file:
        for line in key_file:
            line_str = (
                line.replace('\\\\', '\\').replace(' ', '').replace('\n', '')
            )
            self.js_list.append(line_str)
def __init__(self, *args, **kwargs):
    """Set up URLs, proxy state and cookie state for www.spirit.com.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    self.start_urls = ['https://www.spirit.com/Default.aspx?action=search']
    self.ADT, self.version = 4, 1.2

    # Look up cities by airport.
    self.port_city = dataUtil.get_port_city()
    self.get_session_url = "https://www.spirit.com/"

    # Proxy state.
    self.proxy = ''
    self.proxy_flag = True

    # Cookie state.
    self.cookies_flag = True
    self.cookies_str = ''
def __init__(self, *args, **kwargs):
    """Set up the session and search URLs and defaults for book.hop.com.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    base = 'https://book.hop.com/plnext/HOPmobileNG/'
    self.get_session_url = [base + 'Override.action?']
    self.start_url = [
        base + 'MFlexPricerAvailabilityDispatcherPui.action;jsessionid=',
    ]
    self.start_url_data = (
        '?SITE=H01QH01Q&LANGUAGE=GB&COUNTRY_SITE=GB&UIFWK=ANGULAR'
    )
    self.ADT, self.version = 3, 1.3

    # Look up cities by airport.
    self.port_city = dataUtil.get_port_city()
def __init__(self, *args, **kwargs):
    """Set up the start URL, airport/country table and headers for www.eastarjet.com.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    self.start_urls = ['https://www.eastarjet.com/json/dataService']
    self.ADT, self.version = 4, 1.8

    # Look up cities by airport.
    self.port_city = dataUtil.get_port_city()

    # Country per city, used to switch the currency unit. The table is
    # grouped by country; city_dict maps each airport code to its country.
    ports_by_country = (
        ('CN', ('HKG', 'PVG', 'SHE', 'YNJ')),
        ('JP', ('CTS', 'FUK', 'IBR', 'KIX', 'KMI', 'KOJ', 'NRT', 'OKA')),
        ('KR', ('CJJ', 'CJU', 'GMP', 'ICN', 'KUV', 'PUS')),
        ('MY', ('BKI',)),
        ('RU', ('VVO',)),
        ('SE', ('PPS',)),
        ('TH', ('BKK',)),
        ('TW', ('TPE', 'TSA')),
        ('VN', ('DAD', 'HAN')),
    )
    self.city_dict = {}
    for country_code, airport_codes in ports_by_country:
        for airport_code in airport_codes:
            self.city_dict[airport_code] = country_code

    self.headers = {
        'User-Agent': (
            'Mozilla/5.0 (Windows NT 6.1; Win64; x64) '
            'AppleWebKit/537.36 (KHTML, like Gecko) '
            'Chrome/70.0.3538.77 Safari/537.36'
        ),
        'Referer': 'https://www.eastarjet.com/newstar/PGWHC00001',
        'Cookie': '',
    }
    self.session_flag = True
    self.tax_dict = read_tax_json()
def __init__(self, *args, **kwargs):
    """Set up the start URL, defaults and placeholder route for mobile.lionair.co.id.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    self.start_urls = [
        'https://mobile.lionair.co.id/GQWCF_FlightEngine/GQDPMobileBookingService.svc/SearchAirlineFlights',
    ]
    self.ADT, self.version = '3', 1.0

    # Look up cities by airport.
    self.port_city = dataUtil.get_port_city()

    # Simulated parameters.
    self.dep, self.arr = 'HLP', 'BPN'
    self.date = ''
    self.proxy = True
def __init__(self, *args, **kwargs):
    """Set up the search URLs, fare defaults and route placeholders for www.tui.co.uk.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)

    self.first_url = "https://www.tui.co.uk/flight/search?"
    self.second_url = ['https://www.tui.co.uk/flight/ws/selectedflights?']
    self.ADT, self.version = '3', 1.2

    # Look up cities by airport.
    self.portCitys = dataUtil.get_port_city()

    self.currency = 'GBP'
    self.carrier = "BY"
    self.cabin = 'X'
    self.isChange = 1
    self.flag = True

    # Parameter passing: filled in later, empty for now.
    self.dep = ''
    self.arr = ''
    self.date = ''
def __init__(self, host_name='hyn-test', num=1):
    """Record the host name, the ``num`` value and the airport lookup result.

    Args:
        host_name: stored as ``self.host_name``; a falsy value is replaced
            by ``socket.gethostname()``.
        num: stored as ``self.num``.
    """
    # Fall back to this machine's host name when none was supplied.
    self.host_name = host_name or socket.gethostname()
    self.num = num
    self.city_ports = dataUtil.get_port_city()
def __init__(self, *args, **kwargs):
    """Run the parent initialiser, then store the airport lookup result.

    All positional and keyword arguments are forwarded unchanged.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)
    self.portCitys = dataUtil.get_port_city()
def __init__(self, *args, **kwargs):
    """Run the parent initialiser, then store the airport lookup and admin fees.

    ``custom_settings['ADMIN_FEES']`` is set to the result of
    ``pubUtil.get_tax()``. All arguments are forwarded unchanged.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)
    self.portCitys = dataUtil.get_port_city()

    admin_fees = pubUtil.get_tax()
    self.custom_settings['ADMIN_FEES'] = admin_fees
def __init__(self, *args, **kwargs):
    """Initialise TwSpider, then store the airport lookup result.

    All positional and keyword arguments are forwarded unchanged to the
    parent initialiser.
    """
    parent = super(TwSpider, self)
    parent.__init__(*args, **kwargs)
    self.portCitys = dataUtil.get_port_city()
def __init__(self, *args, **kwargs):
    """Run the parent initialiser, then store the airport lookup result.

    All positional and keyword arguments are forwarded unchanged.
    """
    # NOTE(review): passing self.__class__ to super() recurses endlessly as
    # soon as this class is subclassed; naming the class explicitly avoids
    # that.
    own_class = self.__class__
    super(own_class, self).__init__(*args, **kwargs)
    self.port_city = dataUtil.get_port_city()
def __init__(self, *args, **kwargs):
    """Run the parent initialiser and attach a date-string-to-timestamp helper.

    ``self.dt_to_ts`` takes a string in ``'%m/%d/%Y %H:%M'`` format and
    returns ``time.mktime`` of the parsed struct_time. All arguments are
    forwarded unchanged to the parent initialiser.
    """
    # NOTE(review): super(self.__class__, self) recurses endlessly as soon
    # as this class is subclassed; naming the class explicitly avoids that.
    super(self.__class__, self).__init__(*args, **kwargs)
    self.portCitys = dataUtil.get_port_city()

    def _to_timestamp(x):
        parsed = time.strptime(x, '%m/%d/%Y %H:%M')
        return time.mktime(parsed)

    self.dt_to_ts = _to_timestamp