Ejemplos de tostring en Python

Lenguaje de programación: Python

Namespace/Package Name: lxml_linux_64.html

Método / Función: tostring

Ejemplos en hotexamples.com: 3

Python tostring - 3 ejemplos encontrados. Estos son los ejemplos en Python del mundo real mejor valorados de lxml_linux_64.html.tostring extraídos de proyectos de código abierto. Puedes valorar ejemplos para ayudarnos a mejorar la calidad de los ejemplos.

Ejemplo n.º 1

Mostrar archivo

def htm2txt(inf):
    """Extract the text content of the ``id="contents"`` element of a page.

    The first element matching the XPath is serialized back to markup,
    ``<br>`` and ``<p>`` tags are replaced by newlines, the markup is passed
    through ``unescape``, runs of consecutive newlines are collapsed to a
    single newline, and the result is re-parsed so that ``text_content()``
    can be returned.

    Args:
        inf: HTML source, handed unchanged to ``html.document_fromstring``.

    Returns:
        The ``text_content()`` of the re-parsed markup.

    Raises:
        IndexError: if no element with ``id="contents"`` is found.
    """
    doc = html.document_fromstring(inf)
    matches = doc.xpath('//*[@id="contents"]')
    markup = html.tostring(matches[0], False)
    # lxml's tostring() returns bytes unless an encoding is requested, so on
    # Python 3 the str-based replace() calls below would raise TypeError.
    # The default serialization is ASCII, which makes this decode lossless.
    # On Python 2 the result is already ``str`` and is left untouched.
    if not isinstance(markup, str):
        markup = markup.decode('ascii')
    markup = markup.replace('<br>', '\n')
    markup = markup.replace('<p>', '\n')
    # NOTE(review): ``unescape`` is defined or imported elsewhere in the
    # file; presumably it decodes HTML entities -- confirm.
    markup = unescape(markup)
    # Collapse every run of two or more newlines into a single newline.
    markup = re.sub('\n{2,}', '\n', markup)
    return html.document_fromstring(markup).text_content()

Ejemplo n.º 2

Mostrar archivo

Archivo: www.ranwen.net.py Proyecto: anselmorenato/litebook-project

def htm2txt(inf):
    """Extract the text content of the article row of a page.

    The first node matching the nested-table XPath under ``id="bgdiv"`` is
    serialized back to markup, ``<br>`` and ``<p>`` tags are replaced by
    newlines, ``&#160;`` character references are replaced by plain spaces,
    runs of consecutive newlines are collapsed to a single newline, and the
    result is re-parsed so that ``text_content()`` can be returned.

    Args:
        inf: HTML source, handed unchanged to ``html.document_fromstring``.

    Returns:
        The ``text_content()`` of the re-parsed markup.

    Raises:
        IndexError: if the XPath matches nothing.
    """
    doc = html.document_fromstring(inf)
    rows = doc.xpath(
        '//*[@id="bgdiv"]/table[2]/tbody/tr[1]/td/table/tbody/tr')
    markup = html.tostring(rows[0], False)
    # lxml's tostring() returns bytes unless an encoding is requested, so on
    # Python 3 the str-based replace() calls below would raise TypeError.
    # The default serialization is ASCII, which makes this decode lossless.
    # On Python 2 the result is already ``str`` and is left untouched.
    if not isinstance(markup, str):
        markup = markup.decode('ascii')
    markup = markup.replace('<br>', '\n')
    markup = markup.replace('<p>', '\n')
    markup = markup.replace('&#160;', ' ')
    # Collapse every run of two or more newlines into a single newline.
    markup = re.sub('\n{2,}', '\n', markup)
    return html.document_fromstring(markup).text_content()

Ejemplo n.º 3

Mostrar archivo

def htm2txt(inf):
    """Extract the text content of the ``id="content"`` element of a page.

    The first element matching the XPath is serialized back to markup,
    ``<br>`` and ``<p>`` tags are replaced by newlines, ``&#160;`` character
    references are replaced by plain spaces, runs of consecutive newlines
    are collapsed to a single newline, and the result is re-parsed so that
    ``text_content()`` can be returned.

    Args:
        inf: HTML source, handed unchanged to ``html.document_fromstring``.

    Returns:
        The ``text_content()`` of the re-parsed markup.

    Raises:
        IndexError: if no element with ``id="content"`` is found.
    """
    doc = html.document_fromstring(inf)
    # An earlier revision selected
    # '//*[@id="bgdiv"]/table[2]/tbody/tr[1]/td/table/tbody/tr' instead.
    matches = doc.xpath('//*[@id="content"]')
    markup = html.tostring(matches[0], False)
    # lxml's tostring() returns bytes unless an encoding is requested, so on
    # Python 3 the str-based replace() calls below would raise TypeError.
    # The default serialization is ASCII, which makes this decode lossless.
    # On Python 2 the result is already ``str`` and is left untouched.
    if not isinstance(markup, str):
        markup = markup.decode('ascii')
    markup = markup.replace('<br>', '\n')
    markup = markup.replace('<p>', '\n')
    markup = markup.replace('&#160;', ' ')
    # Collapse every run of two or more newlines into a single newline.
    markup = re.sub('\n{2,}', '\n', markup)
    return html.document_fromstring(markup).text_content()