コード例 #1
0
    def parse_offender(self, response):
        """Fill in the person record from an offender detail page and save it.

        The record is taken from ``response.meta['person']``, populated with
        the values found in the page's ``<td headers="...">`` cells (plus the
        photo link when ``Helpers.pictureAvailable`` accepts it), printed,
        and then passed to ``Helpers.save_predator_to_database``.

        Args:
            response: Page response exposing ``xpath()`` and a ``meta``
                mapping that holds the partially filled record under the
                ``'person'`` key.
        """

        def cell_text(headers_id):
            # Concatenate every text node of the <td> cell(s) whose
            # ``headers`` attribute equals ``headers_id``; yields '' when
            # nothing matches.
            query = '//td[@headers="%s"]/text()' % headers_id
            return ''.join(response.xpath(query).extract())

        predator = response.meta['person']

        # One entry per description cell, each with its text nodes joined.
        predator['Crimes'] = [
            ''.join(cell.xpath('text()').extract())
            for cell in response.xpath('//td[@headers="descriptionColHdr"]')
        ]

        # 'ImageLink' is only set when the helper accepts the extracted src
        # list; otherwise the key is left untouched.
        image = response.xpath('//div[@class="photoBox"]/img/@src').extract()
        if Helpers.pictureAvailable(image):
            predator['ImageLink'] = ''.join(image)

        predator['DOB'] = cell_text('dobColHdr')
        predator['Gender'] = cell_text('genderColHdr')

        # NOTE(review): 'heigthColHdr' / 'weigthColHdr' are spelled exactly as
        # in the original code; presumably they mirror the page markup --
        # confirm before "correcting" them.
        tallness = cell_text('heigthColHdr')
        predator['Tallness'] = tallness
        predator['Height'] = Helpers.heightToInches(tallness)

        predator['Weight'] = cell_text('weigthColHdr')
        predator['EyeColor'] = cell_text('eyecolorColHdr')
        predator['HairColor'] = cell_text('haircolorColHdr')
        predator['Ethnicity'] = cell_text('ethnicityColHdr')
        predator['Address'] = Helpers.fixAddress(cell_text('lastKnwnAddrColHdr'))

        # Parenthesised single-argument form prints identically under the
        # Python 2 print statement and the Python 3 print function.
        print(predator)
        Helpers.save_predator_to_database(predator)