示例#1
0
 def __init__(self, url: str, data: str, content_type: str) -> None:
     """Build the parser state for one page of markup.

     Stores ``url``, parses ``data`` with ``BeautifulSoup(data, "lxml")``,
     runs the base-class initializer, then calls ``preparse()`` and
     ``get_images()`` before creating the ``RecipeParser`` kept in
     ``self.text_parser``.

     Args:
         url: Stored unchanged as ``self.url``.
         data: Markup handed to ``BeautifulSoup``.
         content_type: Accepted but not read anywhere in this method.
     """
     self.ignore_unparsed = False
     self.url = url
     # NOTE(review): disabled assignment kept from the original; confirm
     # whether it can simply be deleted.
     #self.name = 'Web Parser'
     # The soup is created before the base initializer and the preparse /
     # image steps run.
     # NOTE(review): presumably those steps read self.soup -- confirm before
     # reordering anything here.
     self.soup = BeautifulSoup(data, "lxml")
     super().__init__()
     # NOTE(review): disabled alternative to self.text_parser below; confirm
     # whether it is still needed.
     #self.generic_parser = RecipeParser()
     self.preparse()
     self.get_images()
     # Assigned last, after preparse() and get_images() have already run.
     self.text_parser = RecipeParser()
示例#2
0
 def __init__(self, url, data, content_type):
     """Build the parser state for one page of markup.

     Stores ``url``, parses ``data`` into ``self.soup``, runs
     ``InteractiveImporter.__init__``, then calls ``preparse()`` and
     ``get_images()`` before creating the ``RecipeParser`` kept in
     ``self.text_parser``.

     Args:
         url: Stored unchanged as ``self.url``.
         data: Markup handed to ``BeautifulSoup.BeautifulSoup``.
         content_type: Accepted but not read anywhere in this method.
     """
     self.ignore_unparsed = False
     self.url = url
     # NOTE(review): disabled assignment kept from the original; confirm
     # whether it can simply be deleted.
     #self.name = 'Web Parser'
     # NOTE(review): the module-style call and the convertEntities keyword
     # look like the legacy BeautifulSoup 3 API -- confirm which version this
     # file imports before touching this call.
     self.soup = BeautifulSoup.BeautifulSoup(
         data,
         convertEntities=BeautifulSoup.BeautifulStoneSoup.XHTML_ENTITIES,
     )
     # Base initializer is invoked explicitly on the class, after self.soup
     # has been set.
     InteractiveImporter.__init__(self)
     # NOTE(review): disabled alternative to self.text_parser below; confirm
     # whether it is still needed.
     #self.generic_parser = RecipeParser()
     self.preparse()
     self.get_images()
     # Assigned last, after preparse() and get_images() have already run.
     self.text_parser = RecipeParser()
示例#3
0
 def __init__(
     self,
     custom_parser=None,
     tags=DEFAULT_TAGS,
     tag_labels=DEFAULT_TAG_LABELS,
     modal=True,
     title=_('Import recipe'),
 ):
     """Set up the parser, tag/label lookups, window and markup bookkeeping.

     Args:
         custom_parser: Parser to use; when falsy, a new ``RecipeParser``
             is created instead.
         tags: Stored unchanged as ``self.tags``.
         tag_labels: Mapping of tag -> label. Stored as
             ``self.labels_by_tag`` and inverted into ``self.tags_by_label``.
         modal: Stored unchanged as ``self.modal``.
         title: Stored unchanged as ``self.title``.
     """
     self.title = title
     self.parser = custom_parser if custom_parser else RecipeParser()

     # Forward (tag -> label) and reverse (label -> tag) lookups. The reverse
     # table starts with the NEW_REC_TEXT entry and is then filled from the
     # forward one.
     self.labels_by_tag = tag_labels
     self.tags_by_label = {self.NEW_REC_TEXT: 'newrec'}
     self.tags_by_label.update(
         (label, tag) for tag, label in self.labels_by_tag.items()
     )
     self.tags = tags

     # Window construction runs once the attributes above are in place.
     self.setup_window()
     self.setup_action_area()

     # Markup bookkeeping, all starting out empty.
     self.markup_marks = {}
     self.markup_partners = {}
     self.anchors = []
     self.midno = 0  # running ID counter for the markup marks we insert
     self.labelled = []
     self.label_counts = {}

     # Original author's note: matters if we're in an embedded gtk mainloop.
     self.modal = modal

     # The base initializer runs last, after all of the state above exists.
     ConvenientImporter.__init__(self)