Python Library.BookParagraph Exemples

Langage de programmation: Python

Class/Type: Library

Méthode/Fonction: BookParagraph

Exemples sur hotexamples.com : 3

Python Library.BookParagraph - 3 exemples trouvés. Voici les exemples réels les mieux notés de Library.BookParagraph, issus du paquet mpi4py et extraits de projets open source. Vous pouvez noter les exemples pour nous aider à en améliorer la qualité.

Méthodes fréquemment utilisées

Afficher Cacher

BookContent(3)

BookChapter(3)

BookParagraph(3)

read_book_collection(2)

Animation(2)

DP2DOptimizer(2)

Book(2)

alive(2)

DIYSearch(2)

Actor(1)

processData(1)

rand(1)

send(1)

response(1)

run_command(1)

send_help_message(1)

send_start_message(1)

set_patrons(1)

isPalindrome(1)

DeleteBook(1)

give_text(1)

DisjointSet(1)

Dijkstra(1)

AddBook(1)

CreateLibrary(1)

ConversationAsset(1)

Common(1)

BookInquery(1)

BellmanFord(1)

BH1750FVI(1)

AddRead(1)

xmas(1)

Méthodes fréquemment utilisées

BookContent (3)

BookChapter (3)

BookParagraph (3)

read_book_collection (2)

Animation (2)

DP2DOptimizer (2)

Book (2)

alive (2)

DIYSearch (2)

Actor (1)

Méthodes fréquemment utilisées

processData (1)

rand (1)

send (1)

response (1)

run_command (1)

send_help_message (1)

send_start_message (1)

set_patrons (1)

isPalindrome (1)

DeleteBook (1)

give_text (1)

DisjointSet (1)

Dijkstra (1)

AddBook (1)

CreateLibrary (1)

ConversationAsset (1)

Common (1)

BookInquery (1)

BellmanFord (1)

BH1750FVI (1)

Méthodes fréquemment utilisées

give_text (1)

DisjointSet (1)

Dijkstra (1)

AddBook (1)

CreateLibrary (1)

ConversationAsset (1)

Common (1)

BookInquery (1)

BellmanFord (1)

BH1750FVI (1)

AddRead (1)

xmas (1)

Méthodes fréquemment utilisées

AddRead (1)

xmas (1)

Exemple #1

0

Afficher le fichier

def _getGutenbergSpiegelChapters(pages): chapters = [] for page in pages: soup = BeautifulSoup(page) chapter = Library.BookChapter() titleElement = soup.find('div', attrs={'id': 'gutenb'}).find('h3') if titleElement != None: chapter.Title = ''.join(titleElement.strings) paragraphElements = soup.find('div', attrs={ 'id': 'gutenb' }).find_all('p') for paragraphElement in paragraphElements: paragraph = Library.BookParagraph() paragraphString = ''.join(paragraphElement.strings) if paragraphString != None: sentences = paragraphString.replace('!', '.').replace( '?', '.').split('.') paragraph.Sentences = [ s.strip() for s in sentences if s.strip() != '' ] if len(paragraph.Sentences) != 0: chapter.Paragraphs.append(paragraph) if len(chapter.Paragraphs) != 0 and chapter.Title != None: chapters.append(chapter) return chapters

Exemple #2

0

Afficher le fichier

def _getLowereadBookChapters(pages):
    """Split a sequence of Loweread HTML pages into chapters.

    The pages are treated as one continuous stream. Inside each page's
    content element, a ``<div>`` holding a single non-blank string starts a
    new chapter with that string as its title, and every ``<p>`` with
    non-blank text is added to the current chapter as a paragraph whose
    sentences come from splitting the text on ``.``, ``!`` and ``?``.

    Args:
        pages: Iterable of HTML documents in reading order.

    Returns:
        A list of ``Library.BookChapter`` objects, each with at least one
        paragraph. Text found before the first heading ends up in a chapter
        whose title is the empty string.
    """
    chapters = []
    currentChapter = Library.BookChapter()
    currentChapter.Title = ''
    currentChapter.Paragraphs = []

    # Compiled once instead of once per page. The pattern also matches other
    # tag names containing "p" or "div"; those are ignored by the name
    # checks below.
    blockTagPattern = re.compile('p|div')

    for page in pages:
        soup = BeautifulSoup(page)
        readBookElement = soup.find('td', attrs={'class': 'tb_read_book'})
        if readBookElement is None:
            continue

        # Pages lacking the nested content elements are skipped in the same
        # way as pages lacking the outer cell, rather than raising
        # AttributeError on ``None.find``.
        wrapperElement = readBookElement.find(
            'div', attrs={'class': 'MsoNormal'})
        if wrapperElement is None:
            continue
        pageContentElement = wrapperElement.find(
            'p', attrs={'class': 'MsoNormal'})
        if pageContentElement is None:
            continue

        for child in pageContentElement.find_all(blockTagPattern):
            if child.name == 'div':
                heading = child.string
                if heading is not None and heading.strip() != '':
                    # A heading closes the chapter collected so far; empty
                    # chapters are dropped.
                    if currentChapter.Paragraphs:
                        chapters.append(currentChapter)
                    currentChapter = Library.BookChapter()
                    currentChapter.Title = heading
                    # Give every chapter its own list, as is done for the
                    # initial chapter above.
                    currentChapter.Paragraphs = []
            elif child.name == 'p':
                paragraphString = ''.join(child.strings)
                if paragraphString.strip() == '':
                    continue
                # NOTE(review): only the platform's line separator is
                # replaced, so '\n' inside a paragraph survives on
                # platforms where os.linesep is '\r\n'.
                paragraphString = paragraphString.replace(os.linesep, ' ')
                sentences = paragraphString.replace('!', '.').replace(
                    '?', '.').split('.')
                stripped = (s.strip() for s in sentences)

                paragraph = Library.BookParagraph()
                paragraph.Sentences = [s for s in stripped if s != '']
                if paragraph.Sentences:
                    currentChapter.Paragraphs.append(paragraph)

    # Flush the chapter still being collected when the input ends;
    # previously it was never appended, so the last chapter was lost.
    if currentChapter.Paragraphs:
        chapters.append(currentChapter)
    return chapters

Exemple #3

0

Afficher le fichier

def _getReadcentralBookChapter(path):
    """Fetch one chapter page from www.readcentral.com and parse it.

    The chapter title is the stripped string of the first ``<div>`` nested
    in the ``pagehead`` element. Each ``<p>`` of the chapter content area is
    turned into a paragraph via ``getEnSentencesFromParagraphString``;
    paragraphs without any sentence are discarded.

    Args:
        path: Path of the chapter page, passed to
            ``HtmlDownloader.DownloadHtml`` together with the host name.

    Returns:
        A ``Library.BookChapter`` with ``Title`` and ``Paragraphs`` set.
    """
    chapter = Library.BookChapter()
    chapter.Paragraphs = []

    soup = BeautifulSoup(
        HtmlDownloader.DownloadHtml('www.readcentral.com', path))

    headerElement = soup.find('div', attrs={'id': 'pagehead'})
    chapter.Title = headerElement.div.string.strip()

    contentArea = soup.find(
        'div', attrs={'id': 'ctl00_contents_book_chapter_content_area'})
    for element in contentArea.find_all('p'):
        # The joined text is always a str, so it is passed on as is.
        text = ''.join(element.strings)
        paragraph = Library.BookParagraph()
        paragraph.Sentences = getEnSentencesFromParagraphString(text)
        if len(paragraph.Sentences) == 0:
            continue
        chapter.Paragraphs.append(paragraph)
    return chapter