Python text_after_line_numbers示例

编程语言: Python

命名空间/包名称: utils.sunlight_utils

方法/功能: text_after_line_numbers

hotexamples.com的示例: 10

Python text_after_line_numbers - 共找到 10 个示例。以下是从开源项目中提取的、评分最高的 utils.sunlight_utils.text_after_line_numbers 真实 Python 用法示例。您可以为示例评分，以帮助我们提高示例质量。

示例#1

显示文件

def az_text_extractor(mimetype, doc_source):
    """Return the text of a document, choosing the strategy by MIME type.

    When ``mimetype`` is ``'text/html'`` the source is parsed with
    ``lxml.html`` and the text content of the first ``div`` whose ``class``
    attribute is ``Section2`` is returned; the ``[0]`` lookup fails if no
    such element is found.  Any other MIME type is converted with
    ``pdfdata_to_text`` and the result is passed through
    ``text_after_line_numbers``.
    """
    if mimetype != 'text/html':
        # Everything that is not HTML is handed to the PDF converter.
        return text_after_line_numbers(pdfdata_to_text(doc_source))

    tree = lxml.html.fromstring(doc_source)
    sections = tree.xpath('//div[@class="Section2"]')
    return sections[0].text_content()

示例#2

显示文件

def fl_text_extractor(doc_source):
    """Return the text of an HTML document.

    If the document contains a ``<pre>`` element, the text content of the
    first one is encoded to ASCII (unencodable characters replaced) and
    passed through ``text_after_line_numbers``.  Otherwise the text content
    of the second ``<td>`` of every table row is joined with newlines.
    """
    tree = lxml.html.fromstring(doc_source)
    pre_nodes = tree.xpath('//pre')

    if not pre_nodes:
        # No <pre> block: fall back to the second cell of each table row.
        cells = tree.xpath('//tr/td[2]')
        return '\n'.join(cell.text_content() for cell in cells)

    ascii_text = pre_nodes[0].text_content().encode('ascii', 'replace')
    return text_after_line_numbers(ascii_text)

示例#3

显示文件

def ar_text_extractor(doc_source):
    """Convert ``doc_source`` with ``pdfdata_to_text`` and return the result
    of ``text_after_line_numbers`` applied to that text."""
    raw_text = pdfdata_to_text(doc_source)
    return text_after_line_numbers(raw_text)

示例#4

显示文件

def in_text_extractor(doc_source):
    """Convert ``doc_source`` with ``pdfdata_to_text`` and return the result
    of ``text_after_line_numbers`` applied to that text."""
    return text_after_line_numbers(pdfdata_to_text(doc_source))

示例#5

显示文件

def ia_text_extractor(doc_source):
    """Return the text of the first ``<pre>`` element of an HTML document
    after two passes of ``text_after_line_numbers``.

    The ``[0]`` lookup fails if the document has no ``<pre>`` element.
    """
    tree = lxml.html.fromstring(doc_source)
    first_pre = tree.xpath('//pre')[0]

    # The text carries two sets of line numbers, so strip twice.
    stripped_once = text_after_line_numbers(first_pre.text_content())
    return text_after_line_numbers(stripped_once)

示例#6

显示文件

def ak_text_extractor(doc_source):
    """Return the text of the first ``<pre>`` element of an HTML document,
    passed through ``text_after_line_numbers``.

    The ``[0]`` lookup fails if the document has no ``<pre>`` element.
    """
    tree = lxml.html.fromstring(doc_source)
    pre_text = tree.xpath('//pre')[0].text_content()
    return text_after_line_numbers(pre_text)

示例#7

显示文件

def wi_text_extractor(mimetype, url, data):
    """Return extracted text for PDF documents, ``None`` for anything else.

    A document counts as a PDF when ``mimetype`` is ``'application/pdf'`` or
    ``url`` ends with ``'.pdf'``.  PDF data is converted with
    ``pdfdata_to_text`` and passed through ``text_after_line_numbers``.
    """
    # The URL suffix is only consulted when the MIME type is not PDF.
    if mimetype != 'application/pdf' and not url.endswith('.pdf'):
        return None
    return text_after_line_numbers(pdfdata_to_text(data))

示例#8

显示文件

def ut_text_extractor(mimetype, data):
    """Return extracted text when ``mimetype`` is ``'application/pdf'``,
    otherwise ``None``.

    PDF data is converted with ``pdfdata_to_text`` and passed through
    ``text_after_line_numbers``.
    """
    if mimetype != 'application/pdf':
        return None
    return text_after_line_numbers(pdfdata_to_text(data))

示例#9

显示文件

def mo_text_extractor(doc_source):
    """Convert ``doc_source`` with ``pdfdata_to_text``, pass the text through
    ``text_after_line_numbers`` and return it encoded as ASCII, dropping
    characters that cannot be encoded."""
    stripped = text_after_line_numbers(pdfdata_to_text(doc_source))
    return stripped.encode('ascii', 'ignore')

示例#10

显示文件

def hi_text_extractor(mimetype, doc_source):
    """Return extracted text when ``mimetype`` is ``'application/pdf'``,
    otherwise ``None``.

    PDF data is converted with ``pdfdata_to_text`` and passed through
    ``text_after_line_numbers``.
    """
    if mimetype != 'application/pdf':
        return None
    return text_after_line_numbers(pdfdata_to_text(doc_source))