Python Document.length Examples

Programming Language: Python

Namespace/Package Name: xml.dom.minidom

Class/Type: Document

Method/Function: length

Examples at hotexamples.com: 2

Python Document.length - 2 examples found. These are the top rated real world Python examples of xml.dom.minidom.Document.length extracted from open source projects. You can rate examples to help us improve the quality of examples.

Frequently Used Methods

Show Hide

Document(30)

unlink(30)

toprettyxml(30)

getElementsByTagName(30)

createTextNode(30)

createElement(30)

createComment(30)

createCDATASection(30)

toxml(30)

writexml(30)

appendChild(30)

createProcessingInstruction(16)

createElementNS(12)

setAttribute(11)

createAttribute(9)

__init__(8)

insertBefore(6)

encoding(4)

importNode(3)

cloneNode(2)

replaceChild(2)

aChild(2)

cE(2)

cT(2)

saveXML(2)

version(1)

save(1)

getElementsByName(1)

removeChild(1)

ownerDocument(1)

normalize(1)

nodeName(1)

length(1)

getElementsByTagNameNS(1)

createElemen(1)

createAttributeNS(1)

add_table(1)

add_paragraph(1)

writexml_1(1)

Example #1

Show file

File: Preprocessor.py Project: wxyyxc1992/datascience-practice-handbook

    def preprocessing(self):
        '''
        :function 执行数据预处理操作
        :return:
        '''
        print (u'载入数据......')

        # 打开文件读入数据
        with codecs.open(trainfile, 'r', 'utf-8') as f:
            docs = f.readlines()

        print (u"载入完成,准备生成字典对象和统计文本数据...")

        # 记录某个词的下标
        items_idx = 0

        # 读取文档的每一行
        for line in docs:
            if line != "":
                tmp = line.strip().split()
                # 生成一个文档对象
                doc = Document()

                # 遍历所有的词汇
                for item in tmp:

                    # 判断是否已经包含了该词汇
                    if self.word2id.has_key(item):

                        # 如果已经包含则直接添加
                        doc.words.append(self.word2id[item])
                    else:

                        # 否则将该词汇的下标设置为items_idx
                        self.word2id[item] = items_idx

                        # 将该单词下标添加到文档列表
                        doc.words.append(items_idx)

                        # 单词下标加1
                        items_idx += 1

                # 设置文档长度
                doc.length = len(tmp)

                self.docs.append(doc)
            else:
                pass
        self.docs_count = len(self.docs)

        self.words_count = len(self.word2id)

        print (u"共有%s个文档" % self.docs_count)

        self.cachewordidmap()

        print (u"词与序号对应关系已保存到%s" % wordidmapfile)

Example #2

Show file

    def preprocessing(self):
        '''
        :function 执行数据预处理操作
        :return:
        '''
        print(u'载入数据......')

        # 打开文件读入数据
        with codecs.open(trainfile, 'r', 'utf-8') as f:
            docs = f.readlines()

        print(u"载入完成,准备生成字典对象和统计文本数据...")

        # 记录某个词的下标
        items_idx = 0

        # 读取文档的每一行
        for line in docs:
            if line != "":
                tmp = line.strip().split()
                # 生成一个文档对象
                doc = Document()

                # 遍历所有的词汇
                for item in tmp:

                    # 判断是否已经包含了该词汇
                    if self.word2id.has_key(item):

                        # 如果已经包含则直接添加
                        doc.words.append(self.word2id[item])
                    else:

                        # 否则将该词汇的下标设置为items_idx
                        self.word2id[item] = items_idx

                        # 将该单词下标添加到文档列表
                        doc.words.append(items_idx)

                        # 单词下标加1
                        items_idx += 1

                # 设置文档长度
                doc.length = len(tmp)

                self.docs.append(doc)
            else:
                pass
        self.docs_count = len(self.docs)

        self.words_count = len(self.word2id)

        print(u"共有%s个文档" % self.docs_count)

        self.cachewordidmap()

        print(u"词与序号对应关系已保存到%s" % wordidmapfile)