def __init__(self, url: str, data: str, content_type: str):
    """Set up the importer for a single fetched page.

    The markup in ``data`` is parsed with BeautifulSoup's "lxml" parser,
    the parent initialiser is run, and then ``preparse()`` and
    ``get_images()`` are called before the text parser is created.

    Args:
        url: Stored unchanged on the instance as ``self.url``.
        data: Markup handed to ``BeautifulSoup``.
        content_type: Accepted for interface compatibility; not read here.
    """
    self.url = url
    self.ignore_unparsed = False

    # The soup is attached before the parent initialiser and the
    # preparse/get_images calls run, exactly as in the original ordering.
    parsed_markup = BeautifulSoup(data, "lxml")
    self.soup = parsed_markup

    super().__init__()

    self.preparse()
    self.get_images()
    self.text_parser = RecipeParser()
def __init__(self, url, data, content_type):
    """Set up the importer for a single fetched page.

    ``data`` is parsed with ``BeautifulSoup.BeautifulSoup`` using the
    ``XHTML_ENTITIES`` setting for ``convertEntities``. The
    ``InteractiveImporter`` initialiser is then run, followed by
    ``preparse()`` and ``get_images()``, and finally the text parser is
    created.

    url -- stored unchanged on the instance as ``self.url``
    data -- markup handed to ``BeautifulSoup.BeautifulSoup``
    content_type -- accepted for interface compatibility; not read here
    """
    self.url = url
    self.ignore_unparsed = False

    # The soup is attached before the parent initialiser and the
    # preparse/get_images calls run, exactly as in the original ordering.
    entity_setting = BeautifulSoup.BeautifulStoneSoup.XHTML_ENTITIES
    self.soup = BeautifulSoup.BeautifulSoup(
        data,
        convertEntities=entity_setting,
    )

    InteractiveImporter.__init__(self)

    self.preparse()
    self.get_images()
    self.text_parser = RecipeParser()
def __init__(
    self,
    custom_parser=None,
    tags=DEFAULT_TAGS,
    tag_labels=DEFAULT_TAG_LABELS,
    modal=True,
    title=_('Import recipe'),
):
    """Initialise importer state, build the window, then run the
    ``ConvenientImporter`` initialiser.

    custom_parser -- parser to use; when falsy a fresh ``RecipeParser``
        is created instead
    tags -- stored as ``self.tags``
    tag_labels -- mapping of tag -> label, stored as
        ``self.labels_by_tag``; its inverse (label -> tag) is kept in
        ``self.tags_by_label``
    modal -- stored as ``self.modal``
    title -- stored as ``self.title``
    """
    self.title = title
    self.parser = custom_parser if custom_parser else RecipeParser()

    # Keep both directions of the tag <-> label mapping. The reverse map
    # is seeded with the special "new recipe" label before the supplied
    # labels are added, so a supplied label equal to NEW_REC_TEXT wins.
    self.labels_by_tag = tag_labels
    self.tags_by_label = {self.NEW_REC_TEXT: 'newrec'}
    self.tags_by_label.update(
        {label: tag for tag, label in self.labels_by_tag.items()}
    )
    self.tags = tags

    self.setup_window()
    self.setup_action_area()

    # Bookkeeping for markup, anchors and labelling starts out empty.
    self.markup_marks = {}
    self.markup_partners = {}
    self.anchors = []
    self.midno = 0  # an ID counter for markup marks we insert
    self.labelled = []
    self.label_counts = {}

    self.modal = modal  # If we're in an embedded gtk mainloop...
    ConvenientImporter.__init__(self)