Пример #1
0
                for fname in os.listdir(foldername):
                    try:
                        # Reset the per-file state: no keyword has matched yet, and
                        # there is one zeroed hit counter per entry of display_keywords.
                        changeflag = 0
                        # TODO: to be changed to keywords with weights
                        kw_instance = [0] * len(display_keywords)

                        # Open the .docx file
                        # NOTE(review): this branch is disabled by the constant `if 0`.
                        # It reads `docpath`/`filename`, whereas the active plain-text
                        # branch below uses `foldername`/`fname` -- confirm those names
                        # exist before re-enabling it. `Document` is presumably the
                        # python-docx loader; verify against the file's imports.
                        if 0:
                            document = Document(os.path.join(
                                docpath, filename))
                            # Paragraph list consumed by the (also disabled) paragraph scan.
                            paragraphs = document.paragraphs

                        # Plain-text path (the active branch): scan the file line by
                        # line and count, per keyword, how many lines contain it.
                        if 1:
                            # Lowercase the keywords once per file, not once per line.
                            lowered_keywords = [
                                word.lower() for word in display_keywords
                            ]
                            # The context manager closes the handle even if reading
                            # raises; previously the file was never closed, leaking
                            # one open handle per file in the folder.
                            # NOTE(review): no encoding is passed, so the platform
                            # default is used -- confirm that suits the input files.
                            with open(os.path.join(foldername, fname)) as document:
                                for line in document:  # to extract the whole text
                                    haystack = line.strip().lower()
                                    for i, needle in enumerate(lowered_keywords):
                                        # Case-insensitive substring match; a line
                                        # counts at most once per keyword.
                                        if needle in haystack:
                                            kw_instance[i] += 1
                                            # Flag that this file matched a keyword.
                                            changeflag = 1

                        # Search returns true if found
                        if 0:
                            for par in paragraphs:  # to extract the whole text
                                i = 0
                                for word in display_keywords:
                                    if word.lower() in par.text.lower():
                                        kw_instance[i] = kw_instance[i] + 1