Пример #1
0
    def parse(self, response):
        """Build one ``StarnewsItem`` from an article page and yield it.

        Each field is filled independently on a best-effort basis: when a
        field cannot be populated, a short diagnostic is printed and the item
        is still yielded without that field.

        Fields set:
            title:   first match of ``h1.kbwc-title::text``.
            content: first match of ``div.knc-content``.
            url:     ``response.url``.
            name:    last ``/``-separated segment of the URL, cut at its
                     first ``.``.
            thumb:   ``response.meta.get('url')`` (``None`` when absent) --
                     presumably a thumbnail URL supplied by the request that
                     scheduled this callback; confirm against the caller.

        Args:
            response: the downloaded page; must expose ``url`` and ``meta``
                and be accepted by ``Selector``.

        Yields:
            The populated ``StarnewsItem``.
        """
        thumb_url = response.meta.get('url')

        item = StarnewsItem()

        # ``except Exception`` (not a bare ``except``) keeps every field
        # best-effort while letting KeyboardInterrupt / SystemExit /
        # GeneratorExit propagate instead of being silently swallowed.
        try:
            item['title'] = Selector(response).css(
                'h1.kbwc-title::text').extract()[0]
        except Exception:
            print("Loi Title")

        try:
            item['content'] = Selector(response).css(
                'div.knc-content').extract()[0]
        except Exception:
            print("Loi Content")

        try:
            item['url'] = response.url
        except Exception:
            print("Loi URL")

        try:
            item['name'] = response.url.split('/')[-1].split('.')[0]
        except Exception:
            print("Loi name")

        try:
            item['thumb'] = thumb_url
        except Exception:
            print("Loi thumb")

        # The yield is deliberately outside any try block: closing the
        # generator raises GeneratorExit at this point, and that must not be
        # reported as an item-population error.
        yield item
Пример #2
0
    def parse(self, response):
        """Build one ``StarnewsItem`` (with tags and category) and yield it.

        Each field is filled independently on a best-effort basis: when a
        field cannot be populated, a short diagnostic is printed and the item
        is still yielded without that field.

        Fields set:
            title:    first match of ``h1.kbwc-title::text``.
            content:  first match of ``div.knc-content``.
            url:      ``response.url``.
            name:     last ``/``-separated segment of the URL, cut at its
                      first ``.``.
            thumb:    ``response.meta.get('url')`` (``None`` when absent) --
                      presumably a thumbnail URL supplied by the request that
                      scheduled this callback; confirm against the caller.
            tags:     every match of ``li.kli a::text`` (possibly empty).
            category: ``["Music", <first match of
                      "ul.kbws-list li.active a::text">]``.

        Args:
            response: the downloaded page; must expose ``url``, ``meta`` and
                ``css`` and be accepted by ``Selector``.

        Yields:
            The populated ``StarnewsItem``.
        """
        thumb_url = response.meta.get('url')

        item = StarnewsItem()

        # ``except Exception`` (not a bare ``except``) keeps every field
        # best-effort while letting KeyboardInterrupt / SystemExit /
        # GeneratorExit propagate instead of being silently swallowed.
        try:
            item['title'] = Selector(response).css(
                'h1.kbwc-title::text').extract()[0]
        except Exception:
            print("Loi Title")

        try:
            item['content'] = Selector(response).css(
                'div.knc-content').extract()[0]
        except Exception:
            print("Loi Content")

        try:
            item['url'] = response.url
        except Exception:
            print("Loi URL")

        try:
            item['name'] = response.url.split('/')[-1].split('.')[0]
        except Exception:
            print("Loi name")

        try:
            item['thumb'] = thumb_url
        except Exception:
            print("Loi thumb")

        try:
            item['tags'] = response.css('li.kli a::text').extract()
        except Exception:
            print("Loi tags")

        try:
            active_category = response.css(
                "ul.kbws-list li.active a::text").extract()[0]
            item['category'] = ["Music", active_category]
        except Exception:
            # The original printed "Loi thumb" here (copy-paste slip), which
            # made category failures indistinguishable from thumb failures.
            print("Loi category")

        # The yield is deliberately outside any try block: closing the
        # generator raises GeneratorExit at this point, and that must not be
        # reported as an item-population error.
        yield item