def __init__(self):
    """Set up the base processor state and the rule tables.

    Runs the ``ProcesserBase`` initialiser, creates a fresh
    ``CarSpecification`` and stores two literal tables on the instance:

    * ``seg_rule`` -- 3-tuples of ``(name, regex pattern, int)``.
      NOTE(review): the trailing int is presumably the regex group to
      extract -- confirm against the code that consumes ``seg_rule``.
    * ``rule1`` -- 4-tuples of ``(str, str, float, kind)`` where ``kind``
      is one of ``'str'``, ``'abs'`` or ``'num'``.
      NOTE(review): looks like (item field, specification field, weight,
      comparison mode) -- confirm against the consumer.
    """
    ProcesserBase.__init__(self)
    self.cars = CarSpecification()

    segment_patterns = [
        ("series_num_zh", u"(\d{2,4}).+[年款]?", 1),
        ("logo_zh", u"[\u2E80-\u9FFF]+[版型级]", 0),
        # Disabled rules, kept for reference:
        #("transmission_zh", u"(手动)|(自动)|(手波)|(手自一体)|(无极变速)|(双离合)", 0),
        #("transmission", u"([AM]T)|(A[^T]+T)|CVT|GSG", 0),
        ("engine", u"(\d\.\d?)(?![\d|万])(L|l|T|t|升|TSI|FSI|TFSI)?", 1),
        ("imports_zh", u"(进口)|(国产)|([\u2E80-\u9FFF]+)国", 0),
    ]
    self.seg_rule = segment_patterns

    # NOTE(review): "transmission_zh" is referenced below although its
    # seg_rule entry above is commented out -- verify this is intended.
    match_rules = [
        ("car_type", "pattern_zh", 0.1, 'str'),
        ("car_brand", "brand", 0.2, 'str'),
        ("car_series", "series", 0.2, 'str'),
        ("car_emission", "engine", 0.08, 'abs'),
        ("car_transmission", "transmission_zh", 0.04, 'str'),
        ("car_title", "logo_zh", 0.1, 'str'),
        ("car_title", "pattern_zh", 0.13, 'str'),
        ("car_title", "series_num_zh", 0.1, 'str'),
        ("car_description", "pattern_zh", 0.023, 'str'),
        ("car_birth", "producted_year", 0.03, 'str'),
        ("purchase_price_refer", "indicative_price", 0.024, 'num'),
    ]
    self.rule1 = match_rules
def __init__(self, item):
    """Store *item* and prepare per-instance state.

    Args:
        item: The object to keep on the instance as ``self.item``; its
            type is not visible from this block.
    """
    # Keep a reference to the caller-supplied item.
    self.item = item
    # Each instance gets its own CarSpecification object.
    self.cars = CarSpecification()
    # No result yet; starts as None until something assigns it.
    self.seg_rs = None