def __init__(self, path: str, stopwords: YaseeStopWords = None):
    """Set up the stop-word container and the report file.

    Args:
        path: Passed unchanged to ``YaseeReportFile``.
        stopwords: Stop-word container to use. When omitted (``None``) a
            ``YaseeStopWords()`` built with no arguments is used instead.
    """
    # Identity check: ``== None`` would dispatch to any custom ``__eq__``
    # defined on the argument instead of testing for "argument omitted".
    self.ysw = YaseeStopWords() if stopwords is None else stopwords
    self.report_file = YaseeReportFile(path)
def __init__(
    self,
    path: str,
    stopwords: "YaseeStopWords | frozenset | None" = None,
):
    """Initialise the analysis, defaulting to the UCIWC stop-word list.

    Args:
        path: Forwarded to ``YaseeAnalysisClass.__init__``.
        stopwords: One of
            * ``None`` -- use ``YaseeStopWords(UCIWC_DEFAULTSTOPWORDS, True)``;
            * a ``frozenset`` -- start from that same UCIWC container and
              add the given words to it;
            * anything else -- forwarded to the base initialiser unchanged.
    """
    # The annotation is quoted because ``A or B`` in an annotation is an
    # ordinary expression that evaluates to just ``A``.
    if stopwords is None or isinstance(stopwords, frozenset):
        # NOTE(review): the positional ``True`` is presumably the
        # ``replace`` flag of YaseeStopWords -- confirm against its signature.
        YaseeAnalysisClass.__init__(
            self, path, YaseeStopWords(UCIWC_DEFAULTSTOPWORDS, True))
        if stopwords is not None:
            # Relies on the base initialiser having stored the container
            # as ``self._ysw``.
            self._ysw.addStopwords(stopwords)
    else:
        YaseeAnalysisClass.__init__(self, path, stopwords)
def __init__(
    self,
    path: str,
    stopwords: "YaseeStopWords | frozenset | None" = None,
):
    """Set up the stop-word container and the report file.

    Args:
        path: Passed unchanged to ``YaseeReportFile``.
        stopwords: ``None`` to use ``YaseeStopWords()`` built with no
            arguments, an existing ``YaseeStopWords`` to use as-is, or a
            ``frozenset`` that is handed to ``YaseeStopWords(...)``.

    Raises:
        TypeError: If ``stopwords`` is none of the supported types.
            Previously such a value fell through every branch and left
            ``_ysw`` unset, which only surfaced later as an
            ``AttributeError``.
    """
    # The annotation is quoted because ``A or B`` in an annotation is an
    # ordinary expression that evaluates to just ``A``.
    if stopwords is None:
        self._ysw = YaseeStopWords()
    elif isinstance(stopwords, YaseeStopWords):
        # isinstance (not ``type(...) ==``) so subclasses are accepted too.
        self._ysw = stopwords
    elif isinstance(stopwords, frozenset):
        self._ysw = YaseeStopWords(stopwords)
    else:
        raise TypeError(
            "stopwords must be a YaseeStopWords, a frozenset or None, "
            f"not {type(stopwords).__name__}"
        )
    self._report_file = YaseeReportFile(path)
class YaseeAnalysisClass:
    """Pairs a report file with the stop-word container used to analyse it."""

    def __init__(self, path: str, stopwords: YaseeStopWords = None):
        """Set up the stop-word container and the report file.

        Args:
            path: Passed unchanged to ``YaseeReportFile``.
            stopwords: Stop-word container to use. When omitted (``None``)
                a ``YaseeStopWords()`` built with no arguments is used.
        """
        # Identity check: ``== None`` would dispatch to any custom
        # ``__eq__`` on the argument instead of testing for "omitted".
        self.ysw = YaseeStopWords() if stopwords is None else stopwords
        self.report_file = YaseeReportFile(path)

    def addStopWords(self, additional_words: str or iter):
        """Forward ``additional_words`` to the container's ``addStopwords``.

        NOTE(review): the annotation ``str or iter`` evaluates to plain
        ``str``; the intent appears to be "one word or an iterable of
        words". Spelling that out needs a ``typing`` import, so it is left
        unchanged here.
        """
        self.ysw.addStopwords(additional_words)
def __init__(self, path: str, stopwords: YaseeStopWords = None):
    """Initialise the analysis, defaulting to the UCIWC stop-word list.

    Args:
        path: Forwarded to ``YaseeAnalysisClass.__init__``.
        stopwords: Stop-word container to use. When omitted (``None``),
            ``YaseeStopWords(UCIWC_DEFAULTSTOPWORDS, True)`` is used.
    """
    # Identity check instead of ``== None``; resolving the default first
    # leaves a single call to the base initialiser.
    if stopwords is None:
        # NOTE(review): the positional ``True`` is presumably the
        # ``replace`` flag of YaseeStopWords -- confirm against its signature.
        stopwords = YaseeStopWords(UCIWC_DEFAULTSTOPWORDS, True)
    YaseeAnalysisClass.__init__(self, path, stopwords)
def test_addStopWords(self):
    """addStopwords accepts both an iterable of words and a single word."""
    ysw = YaseeStopWords(stopwords=frozenset(("UCI", )), replace=True)

    # A tuple of words: each element is expected to be added.
    ysw.addStopwords(("UCLA", "UCSD"))
    # assertEqual reports both sets on failure, unlike assertTrue(a == b).
    self.assertEqual(ysw.getStopwords(),
                     frozenset(("UCI", "UCLA", "UCSD")))

    # A bare string is expected to be added as one word.
    ysw.addStopwords("UCSB")
    self.assertEqual(ysw.getStopwords(),
                     frozenset(("UCI", "UCLA", "UCSD", "UCSB")))
class YaseeAnalysisClass:
    """Pairs a report file with the stop-word container used to analyse it."""

    # Two-argument combiners kept as plain class attributes. Call them via
    # the class (``YaseeAnalysisClass.combine_as_lines(a, b)``); looked up on
    # an instance they bind like methods and the instance becomes ``x``.
    combine_as_lines = lambda x, y: f"{x}\n{y}"
    combine_as_entry = lambda x, y: f"{x}: {y}"

    def __init__(
        self,
        path: str,
        stopwords: "YaseeStopWords | frozenset | None" = None,
    ):
        """Set up the stop-word container and the report file.

        Args:
            path: Passed unchanged to ``YaseeReportFile``.
            stopwords: ``None`` to use ``YaseeStopWords()`` built with no
                arguments, an existing ``YaseeStopWords`` to use as-is, or
                a ``frozenset`` that is handed to ``YaseeStopWords(...)``.

        Raises:
            TypeError: If ``stopwords`` is none of the supported types.
                Previously such a value fell through every branch and left
                ``_ysw`` unset, which only surfaced later as an
                ``AttributeError``.
        """
        # The annotation is quoted because ``A or B`` in an annotation is
        # an ordinary expression that evaluates to just ``A``.
        if stopwords is None:
            self._ysw = YaseeStopWords()
        elif isinstance(stopwords, YaseeStopWords):
            # isinstance (not ``type(...) ==``) so subclasses are accepted.
            self._ysw = stopwords
        elif isinstance(stopwords, frozenset):
            self._ysw = YaseeStopWords(stopwords)
        else:
            raise TypeError(
                "stopwords must be a YaseeStopWords, a frozenset or None, "
                f"not {type(stopwords).__name__}"
            )
        self._report_file = YaseeReportFile(path)

    def addStopWords(self, additional_words: str or iter):
        """Forward ``additional_words`` to the container's ``addStopwords``.

        NOTE(review): the annotation ``str or iter`` evaluates to plain
        ``str``; the intent appears to be "one word or an iterable of
        words". Spelling that out needs a ``typing`` import, so it is left
        unchanged here.
        """
        self._ysw.addStopwords(additional_words)

    def getStopWords(self) -> frozenset:
        """Return whatever the container's ``getStopwords()`` returns."""
        return self._ysw.getStopwords()

    def getReportFile(self) -> "YaseeReportFile":
        """Return the ``YaseeReportFile`` created in ``__init__``."""
        return self._report_file
import pandas intermediate = pandas.ExcelFile("../reports/report.xlsx") file = intermediate.parse(intermediate.sheet_names[0]) columns = file """ import YaseeReportFile from collections import defaultdict from wordcloud import WordCloud from matplotlib import pyplot import numpy from YaseeStopWords import YaseeStopWords ysw = YaseeStopWords() words_toStrip = { "nan", "to", "the", "and", "a", "of", "her", "we", "she", "for", "about", "him", "his", "want", "wanted", "so", "student", "in", "on", "had", "an", "some", "as", "be", "what", "through", "make", "with", "not", "at", "is", "it", "from", "also", "out", "would", "which", "where", "for", "those", "this", "how", "that", "was", "he", "could", "them" } report_file = YaseeReportFile.YaseeReportFile("../test/report.xlsx") entries = report_file.extractColumn("WQ19", "VisitNotes") phrase_freq_dict = defaultdict(int) word_freq_dict = defaultdict(int) for entry in entries: words = str(entry).split()
def test_replace_init(self):
    """With replace=True only the supplied words are stop words."""
    ysw = YaseeStopWords(stopwords=frozenset(("UCI", )), replace=True)
    # assertIn / assertNotIn name the member and container on failure,
    # where assertTrue / assertFalse would only report a bare boolean.
    self.assertNotIn("a", ysw)
    self.assertIn("UCI", ysw)
def test_default_init(self):
    """A container built with no arguments contains the word "a"."""
    ysw = YaseeStopWords()
    # assertIn names the member and container on failure.
    self.assertIn("a", ysw)
def test_getStopWords(self):
    """getStopwords returns exactly the words supplied with replace=True."""
    supplied = frozenset(("UCI", ))
    ysw = YaseeStopWords(stopwords=supplied, replace=True)
    # assertEqual reports both sets on failure, unlike assertTrue(a == b).
    self.assertEqual(ysw.getStopwords(), frozenset(("UCI", )))
def test_addon_init(self):
    """Without replace, supplied words are added alongside the word "a"."""
    ysw = YaseeStopWords(stopwords=frozenset(("UCI", )))
    # assertIn names the member and container on failure.
    self.assertIn("a", ysw)
    self.assertIn("UCI", ysw)