Пример #1
0
 def extra(self, page):
     """
     Return a dictionary of extra information.

     The section of ``page`` delimited by ``TAG_EXTRA[0]`` / ``TAG_EXTRA[1]``
     is split into rows on ``TAG_EXTRA_SEP``; each row is expected to look
     like ``key: value`` once its tags are removed.

     Rows are split on the FIRST colon only, so values that themselves
     contain ``:`` (times, URLs, ...) are kept whole. Rows without any colon
     are skipped instead of aborting the whole scan.

     Scraping is best-effort: if a helper raises, the entries collected so
     far are returned (an empty dict when nothing was collected or when the
     opening marker is not present in ``page``).
     """
     dic_extra = {}
     try:
         if page.find(TAG_EXTRA[0]) > -1:
             extra_html = Utils.text_between(page, TAG_EXTRA[0], TAG_EXTRA[1], True)
             extra_rows = Utils.split_html_tag(Utils.remove_spaces(extra_html), TAG_EXTRA_SEP)
             for row in extra_rows:
                 key, colon, value = Utils.remove_tags(row).partition(":")
                 if not colon:
                     # Not a "key: value" row; ignore it and keep going.
                     continue
                 dic_extra[Utils.remove_spaces(key)] = Utils.remove_spaces(value)
     except Exception:
         # Deliberately best-effort, but let KeyboardInterrupt / SystemExit
         # propagate (a bare ``except:`` would trap those as well).
         pass
     return dic_extra
Пример #2
0
 def synonyms(self, page):
     """
     Collect the synonyms listed on the page.

     Returns a list of ``Word`` objects, one for each
     ``TAG_SYNONYMS_DELIMITER`` opening marker found inside the section
     bounded by ``TAG_SYNONYMS[0]`` / ``TAG_SYNONYMS[1]``. The list is empty
     when the section's opening marker does not occur in ``page``.
     """
     if page.find(TAG_SYNONYMS[0]) == -1:
         return []

     found = []
     remaining = Utils.text_between(page, TAG_SYNONYMS[0], TAG_SYNONYMS[1], True)
     delim = TAG_SYNONYMS_DELIMITER
     while remaining.find(delim[0]) != -1:
         raw_synonym = Utils.text_between(remaining, delim[0], delim[1], True)
         found.append(Word(Utils.remove_spaces(raw_synonym)))
         # Strip the first occurrence of each marker so the loop advances
         # past the entry that was just consumed.
         remaining = remaining.replace(delim[0], "", 1).replace(delim[1], "", 1)
     return found
Пример #3
0
 def scrape_extra(self, page):
     """
     Return a dictionary of extra information.

     The section of ``page`` delimited by the ``TAG_EXTRA`` markers is split
     into rows on ``TAG_EXTRA_SEP``; each row is expected to look like
     ``key: value`` once its tags are removed.

     Rows are split on the FIRST colon only, so values that themselves
     contain ``:`` (times, URLs, ...) are kept whole. Rows without any colon
     are skipped instead of aborting the whole scan.

     Scraping is best-effort: if a helper raises, the entries collected so
     far are returned (an empty dict when nothing was collected or when the
     opening marker is not present in ``page``).
     """
     dict_extra = {}
     try:
         if page.find(TAG_EXTRA[0]) > -1:
             html = Utils.text_between(page, *TAG_EXTRA, force_html=True)
             extra_rows = Utils.split_html_tag(Utils.remove_spaces(html),
                                               TAG_EXTRA_SEP)
             for row in extra_rows:
                 key, colon, value = Utils.remove_tags(row).partition(":")
                 if not colon:
                     # Not a "key: value" row; ignore it and keep going.
                     continue
                 dict_extra[Utils.remove_spaces(key)] = Utils.remove_spaces(value)
     except Exception:
         # Deliberately best-effort, but let KeyboardInterrupt / SystemExit
         # propagate (a bare ``except:`` would trap those as well).
         pass
     return dict_extra
Пример #4
0
 def meaning(self, page):
     """
     Extract the meaning section of the page.

     Takes the fragment of ``page`` between ``TAG_MEANING[0]`` and
     ``TAG_MEANING[1]``, then passes it through ``Utils.remove_tags`` and
     ``Utils.remove_spaces`` (in that order) and returns the result.
     """
     fragment = Utils.text_between(page, TAG_MEANING[0], TAG_MEANING[1], True)
     without_tags = Utils.remove_tags(fragment)
     return Utils.remove_spaces(without_tags)