Python register_xpath_extensions示例

编程语言: Python

命名空间/包名称: talon.quotations

方法/功能: register_xpath_extensions

hotexamples.com的示例: 9

Python register_xpath_extensions - 已找到 9 个示例。以下是从开源项目中提取的、评价最高的 talon.quotations.register_xpath_extensions 真实 Python 示例。您可以为这些示例评分，以帮助我们提高示例质量。

示例#1

显示文件

# -*- coding: utf-8 -*-
import re
import cgi

from talon.quotations import (register_xpath_extensions, extract_from_html,
                              extract_from_plain)  # noqa
# Executed at import time, before the remaining imports below.
# NOTE(review): presumably registers talon's custom XPath functions so the
# imported extract_* helpers work — confirm against talon.quotations.
register_xpath_extensions()

from HTMLParser import HTMLParser


# http://stackoverflow.com/questions/753052/strip-html-from-strings-in-python
class MLStripper(HTMLParser):
    """HTMLParser subclass that tracks whether it is inside a tag to strip.

    Only the constructor and the start/end tag handlers are visible in this
    excerpt; ``fed`` is initialised here but not used by the code shown.
    """

    # Lowercase tag names that switch the parser into strip mode.
    strippedTags = ["title", "script", "style"]

    def __init__(self):
        """Call ``reset()`` and initialise ``fed`` and the strip-mode flag."""
        # NOTE(review): HTMLParser.__init__ is not invoked; only reset() is.
        self.reset()
        self.fed = []
        self.strip_tag_contents_mode = False

    def handle_starttag(self, tag, attrs):
        """Enter strip mode when ``tag`` (lowercased) is in ``strippedTags``.

        ``attrs`` is accepted but not used.
        """
        # Strip the contents of a tag when it's
        # in strippedTags. We can do this because
        # HTMLParser won't try to parse the inner
        # contents of a tag.
        if tag.lower() in MLStripper.strippedTags:
            self.strip_tag_contents_mode = True

    def handle_endtag(self, tag):
        """Leave strip mode whenever an end tag is seen."""
        # NOTE(review): the flag is cleared for ANY closing tag, not only
        # for tags listed in strippedTags — confirm this is intended.
        self.strip_tag_contents_mode = False

示例#2

显示文件

def init(path_to_models=None):
    """Initialise the package.

    Always calls ``register_xpath_extensions()``. When ``ML_ENABLED`` is
    truthy, it additionally calls ``signature.initialize(path_to_models)``.

    Args:
        path_to_models: Forwarded unchanged to ``signature.initialize``.
    """
    register_xpath_extensions()
    # Nothing more to do when the ML-based signature support is switched off.
    if not ML_ENABLED:
        return
    signature.initialize(path_to_models)

示例#3

显示文件

文件： html.py 项目： 0xcd03/inbox

# -*- coding: utf-8 -*-
import re
import cgi
from HTMLParser import HTMLParser, HTMLParseError
from talon.quotations import (register_xpath_extensions, extract_from_html,
                              extract_from_plain)  # noqa
# Executed at import time, before the remaining import below.
# NOTE(review): presumably registers talon's custom XPath functions so the
# imported extract_* helpers work — confirm against talon.quotations.
register_xpath_extensions()

from inbox.log import get_logger

# Public names exported by this module. extract_from_html and
# extract_from_plain are the talon.quotations functions imported above;
# strip_tags and plaintext2html are not visible in this excerpt.
__all__ = ['strip_tags', 'plaintext2html', 'extract_from_html',
           'extract_from_plain']


# http://stackoverflow.com/questions/753052/strip-html-from-strings-in-python
class MLStripper(HTMLParser):
    """HTMLParser subclass that tracks whether it is inside a tag to strip.

    Only the constructor and the start-tag handler are visible in this
    excerpt; ``fed`` is initialised here but not used by the code shown.
    """

    # Lowercase tag names that switch the parser into strip mode.
    strippedTags = ["title", "script", "style"]

    def __init__(self):
        """Call ``reset()`` and initialise ``fed`` and the strip-mode flag."""
        # NOTE(review): HTMLParser.__init__ is not invoked; only reset() is.
        self.reset()
        self.fed = []
        self.strip_tag_contents_mode = False

    def handle_starttag(self, tag, attrs):
        """Enter strip mode when ``tag`` (lowercased) is in ``strippedTags``.

        ``attrs`` is accepted but not used.
        """
        # Strip the contents of a tag when it's
        # in strippedTags. We can do this because
        # HTMLParser won't try to parse the inner
        # contents of a tag.
        if tag.lower() in MLStripper.strippedTags:
            self.strip_tag_contents_mode = True

示例#4

显示文件

文件： __init__.py 项目： phroa/talon

def init():
    """Initialise the package by calling ``register_xpath_extensions()``."""
    register_xpath_extensions()

示例#5

显示文件

文件： __init__.py 项目： kalekseev/talon

def init():
    """Initialise the package.

    Always calls ``register_xpath_extensions()``. When ``ML_ENABLED`` is
    truthy, it additionally calls ``signature.initialize()``.
    """
    register_xpath_extensions()
    # Skip signature initialisation when ML support is disabled.
    if not ML_ENABLED:
        return
    signature.initialize()

示例#6

显示文件

文件： __init__.py 项目： benauthor/talon

def init():
    """Initialise the package.

    Calls ``register_xpath_extensions()`` and then, unconditionally,
    ``signature.initialize()``.
    """
    register_xpath_extensions()
    signature.initialize()

示例#7

显示文件

文件： __init__.py 项目： digideskio/talon

def init():
    """Initialise the package.

    ``register_xpath_extensions()`` is always called;
    ``signature.initialize()`` is called only when ``ML_ENABLED`` is truthy.
    """
    register_xpath_extensions()
    # Early exit: signature initialisation is gated on the ML flag.
    if not ML_ENABLED:
        return
    signature.initialize()

示例#8

显示文件

文件： __init__.py 项目： zendesk/talon

def init():
    """Initialise the package.

    Calls ``register_xpath_extensions()`` and then, unconditionally,
    ``signature.initialize()``.
    """
    register_xpath_extensions()
    signature.initialize()

示例#9

显示文件

文件： __init__.py 项目： neutrinity/talon

def init():
    """Initialise the package by calling ``register_xpath_extensions()``."""
    register_xpath_extensions()