def read_emails(self, path):
    # Collect all regular files in the directory
    files = [f for f in listdir(path) if isfile(join(path, f))]
    # Drop the macOS Finder metadata file if present
    try:
        files.remove('.DS_Store')
    except ValueError:
        pass
    reader = WordListCorpusReader(path, files)
    cleaner = Cleaner()
    emails = []
    # Create an Email object out of each email file and append it to the list
    for file_id in reader.fileids():
        with open(join(path, file_id), 'r') as current_file:
            cleaned_contents = cleaner.clean_file(current_file.read())
        split_email_header, split_email_body, split_email_file_id = self.divide(
            cleaned_contents, file_id)
        emails.append(
            Email(split_email_header, split_email_body, split_email_file_id))
    # Return the list of Email objects
    return emails
def get_text(self):
    words = self.plainTextEdit.toPlainText()
    cleaner = Cleaner()
    cleaned_comments = cleaner.edit_bulk_comments(words)
    for item in cleaned_comments:
        self.textEdit.append(item)
def decide(self):
    # Default message to broadcast in case anything is required
    print('------------', 'AGENT: ', self.name, '---------------')
    self.message = {}
    self.action = action.idle()

    # Conditions to find the grid size
    if self.grid_size < 0:
        FindGridSizeMind.run(self)
    if self.grid_size > 0:
        # Minds run in inverse order of precedence: the most important ones
        # last (for any classes that affect actions).

        # Keeps the current state of the map and the age
        # (number of cycles since update) of each cell.
        MappingMind.run(self)

        # Places a value on each cell by how long ago it was explored and
        # cubes it (older cells are exponentially more expensive); if other
        # agents are closer, a penalty is applied. Each cell's value is then
        # summed with its neighbours' (how much the robot wants to go there),
        # and the robot targets the closest most expensive cell.
        GreedyExplore.run(self)

        # If there is a cell to clean, checks whether other bots able to
        # clean it are closer; if so, abandons the cleaning.
        Cleaner.run(self)

        # Resolves a face-to-face argument by forcing the next two moves to
        # be a turn and a forward to the right, if possible.
        # Follower.run(self)
        Plunger.run(self)

        # Goes to the specified self.target_position via the fewest possible
        # moves, prioritising x first, then y.
        GoToPosition.run(self)
    return self.validate_actions()
def test_cleaner_birthday_Invalid_3_response2(self):
    clean = Cleaner()
    test_data = "23-11-99"
    expected_result = "The year needs to be in the full format eg: 2009"
    actual_result = clean.Clean_Birthday(test_data)[1]
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + str(expected_result))

def test_cleaner_birthday_Invalid_3_response1(self):
    clean = Cleaner()
    test_data = "hello-break-me"
    expected_result = None
    actual_result = clean.Clean_Birthday(test_data)[0]
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + str(expected_result))

def test_cleaner_birthday_valid_2(self):
    clean = Cleaner()
    test_data = "25-11-1991"
    expected_result = "25-11-1991"
    actual_result = clean.Clean_Birthday(test_data)[0]
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + str(expected_result))

def test_cleaner_age_invalid(self):
    clean = Cleaner()
    test_data = "nine"
    expected_result = None
    actual_result = clean.Clean_Age(test_data)[0]
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + str(expected_result))

def test_cleaner_age_valid_Int(self):
    clean = Cleaner()
    test_data = 99
    expected_result = 99
    actual_result = clean.Clean_Age(test_data)[0]
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + str(expected_result))
def __init__(self, dirPath, binsNum):
    self.binsNum = binsNum
    self.dirPath = dirPath
    self.m_estimate = 2
    self.loadStructure()
    try:
        self.df = pd.read_csv(self.dirPath + "/train.csv")
    except IOError:
        tkMessageBox.showerror(
            "Naive Bayes Classifier - Error",
            "There is a problem with opening " + self.dirPath + "/train.csv")
    self.cleaner = Cleaner(self)
    # Maps attribute + value + classification to its m-estimate probability
    self.naiveBases = {}
    self.cProb = {}
    for _, record in self.df.iterrows():
        recordDic = record.to_dict()
        for attribute in recordDic:
            value = recordDic[attribute]
            c = recordDic["class"]
            # n_c: records with this attribute value and this class;
            # n: records with this class
            n_c = len(self.df.loc[((self.df[attribute] == value)
                                   & (self.df["class"] == c))].index)
            n = len(self.df.loc[(self.df["class"] == c)].index)
            m = self.m_estimate
            M = len(self.structure[attribute])
            p = float(1) / M  # uniform prior over the attribute's M values
            # m-estimate smoothing: (n_c + m*p) / (n + m)
            naiveBase = float(n_c + m * p) / (n + m)
            self.naiveBases[attribute + str(value) + c] = naiveBase
    # Prior probability of each class
    for c in self.structure["class"]:
        self.cProb[c] = float(
            len(self.df.loc[(self.df["class"] == c)].index)) / len(
                self.df.index)
    tkMessageBox.showinfo("Naive Bayes Classifier - Success",
                          "Building classifier using train-set is done!")
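The dictionaries built above (per-class priors in cProb, per-attribute m-estimates in naiveBases) are everything a naive Bayes prediction needs. Below is a minimal sketch of how a record could be classified with them; the function name and the fallback of 1.0 for attribute values never seen in training are assumptions, not part of the original code.

def classify_record(classifier, record):
    # Hypothetical sketch, not project code: pick the class c maximising
    # P(c) * product over attributes of P(attribute=value | c).
    best_class, best_score = None, -1.0
    for c in classifier.structure["class"]:
        score = classifier.cProb[c]  # class prior P(c)
        for attribute, value in record.items():
            if attribute == "class":
                continue
            # m-estimate P(attribute=value | c); unseen values fall back to
            # 1.0 here (an assumption) so they do not zero out the product
            score *= classifier.naiveBases.get(attribute + str(value) + c, 1.0)
        if score > best_score:
            best_class, best_score = c, score
    return best_class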
def run(self):
    # AUTHENTICATION
    if self.auth():
        print(self.DASH)
        print('Reddit Authentication Successful.\nWelcome, {}'.format(
            self.REDDIT_USERNAME))
        # Pick a subreddit at random from the pool
        r = random.randint(0, len(self.SUBREDDITS) - 1)
        subreddit = self.getSubreddit(self.SUBREDDITS[r])
        # Get posts from the chosen subreddit
        posts = self.getSubInfo(subreddit)
        print(self.DASH)
        print("Starting uploads...")
        print(self.DASH)
        self.postToIG(posts)
        print('Uploaded {} posts'.format(self.COUNT))
        print('Starting cleaner...')
        Cleaner.clean()
def test_cleaner_bmi(self):
    clean = Cleaner()
    test_data = 'normal'
    expected_result = 'Normal'
    actual_result = clean.clean_bmi(test_data)
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + expected_result)

def test_cleaner_bmi_3(self):
    clean = Cleaner()
    test_data = 'overweight'
    expected_result = 'Overweight'
    actual_result = clean.clean_bmi(test_data)
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + expected_result)

def test_cleaner_bmi_4(self):
    clean = Cleaner()
    test_data = 'OBEsity'
    expected_result = 'Obesity'
    actual_result = clean.clean_bmi(test_data)
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + expected_result)

def test_cleaner_gender_4(self):
    clean = Cleaner()
    test_data = 'f'
    expected_result = 'F'
    actual_result = clean.clean_gender(test_data)
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + expected_result)

def test_cleaner_bmi_2(self):
    clean = Cleaner()
    test_data = 'UNDERWEIGHT'
    expected_result = 'Underweight'
    actual_result = clean.clean_bmi(test_data)
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + expected_result)

def test_cleaner_empid_2(self):
    clean = Cleaner()
    test_data = 'a102'
    expected_result = 'A102'
    actual_result = clean.clean_empid(test_data)
    self.assertEqual(actual_result, expected_result,
                     "actual_result should equal " + expected_result)
def __init__(self, cfg_params):
    """Constructor."""
    Cleaner.__init__(self, cfg_params)
    self.cfg_params = cfg_params
    # Initialise client-server parameters
    CliServerParams(self)
def execute(self):
    from pandas import read_csv, merge
    from os.path import join
    from Cleaner import Cleaner

    # Load the training data and join in the per-store metadata
    train = read_csv(join(self.directory, 'train.csv'))
    store = read_csv(join(self.directory, 'store.csv'))
    train = merge(train, store, how='left', on='Store')
    train = Cleaner(train)
    train.extractDate()
    self.trainingSet = train.data
class ThreadScraper:
    def __init__(self, url):
        self.res_dict = {
            'Title': [],
            'Content': [],
            'Title + Content': [],
            'URL': [],
            'ID': []
        }
        self.url = url
        self.sg = SearchGenerator(self.url)
        self.search_terms = np.asarray(self.sg.extract_keywords())
        self.df = ''
        self.cleaner = Cleaner()

    def get_submissions(self, term):
        submissions = self.sg.get_reddit().subreddit(
            str(self.sg.get_subreddit())).search(term[0],
                                                 time_filter='year',
                                                 syntax='plain')
        for sub in submissions:
            title = sub.title
            content = sub.selftext
            url = sub.url
            sub_id = sub.id
            # Keep only text posts: skip images, short or link-only bodies,
            # and submissions already collected
            if (not url.endswith(('.jpg', '.png', '.gif'))
                    and len(content) > 50 and 'http' not in content
                    and sub_id not in self.res_dict['ID']):
                self.res_dict['Title'].append(
                    self.cleaner.clean_text(title).split())
                self.res_dict['Content'].append(
                    self.cleaner.clean_text(content).split())
                self.res_dict['Title + Content'].append(
                    self.cleaner.clean_text(title + ' ' + content).split())
                self.res_dict['URL'].append(url)
                self.res_dict['ID'].append(sub_id)

    def export_submission(self):
        # Fetch submissions for all search terms in parallel
        with concurrent.futures.ThreadPoolExecutor(8) as executor:
            executor.map(self.get_submissions, self.search_terms)
        df = pd.DataFrame(self.res_dict)
        df.dropna(inplace=True)
        # Renumber the rows after dropping NaNs
        df.reset_index(drop=True, inplace=True)
        self.df = df
        if not os.path.exists('data'):
            os.makedirs('data')
        print("Writing to CSV")
        df.to_csv('data/results.csv')
        print("Done...")
        return df
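A minimal usage sketch for ThreadScraper, with a hypothetical thread URL; export_submission fans the search terms out over eight worker threads, then writes data/results.csv:

scraper = ThreadScraper('https://www.reddit.com/r/somesub/comments/abc123/')  # hypothetical URL
df = scraper.export_submission()  # scrapes, writes data/results.csv, returns the DataFrame
print(df[['Title', 'URL']].head())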
def __init__(self, queryFile, queryJSON):
    # Initialize the cleaner object
    self._cleaner = Cleaner(" ", " ")
    # txt file in which all queries are stored
    self._qFile = queryFile
    # json file to store the queries after cleaning
    self._qJson = queryJSON
    # list to store raw queries
    self._queryList = list()
    # dict to store refined queries
    self._queryDict = dict()
    # stop-word list
    self._stopList = list()
    # query ID, initialized to 1
    self._qID = 1
def get_recommendations(self):
    cleaner = Cleaner()
    sg = SearchGenerator(self.url)
    words = self.dictionary.doc2bow(sg.get_cleancontent().split())
    print("Top words identified: ")
    for word in words:
        print("{} {}".format(word[0], self.dictionary[word[0]]))
    # Rank all documents by similarity to the query vector
    query_vector = self.lda[words]
    sims = self.get_similarity(self.lda, query_vector)
    sims = sorted(enumerate(sims), key=lambda item: -item[1])
    idx = 0
    pids = []
    result = 10
    recommendation = []
    page_ids = self.df['ID'].to_list()
    print("\nCheck out the links below:")
    # Collect the top 10 unique pages (guard against running past sims)
    while result > 0 and idx < len(sims):
        pageid = page_ids[sims[idx][0]]
        if pageid not in pids:
            pids.append(pageid)
            url = self.df[self.df['ID'] == pageid]['URL'].values[0]
            print("{}".format(url))
            recommendation.append(url)
            result -= 1
        idx += 1
    return recommendation
def __init__(self, localDownloadQueue="PendingDownloadQueue"):
    Base.__init__(self)
    self.download_queue = localDownloadQueue
    self.ftp_sync = FileSyncer()
    self.move_file_into_processing()
    # Run extraction and cleaning over the freshly synced directory
    Extractor(self.local_directory_to_sync)
    Cleaner(self.local_directory_to_sync)
class Content:
    def __init__(self, df, url):
        self.df = df
        self.url = url
        self.cleaner = Cleaner()

    def clean_frame(self):
        # Clean and tokenise every cell of the Title and Content columns
        # (applymap applies per cell; apply would pass whole columns)
        self.df = self.df[['Title', 'Content']].applymap(
            lambda x: self.cleaner.clean_text(x).split())
class Validator(object):
    clean = Cleaner()

    def val_empid(self, data):
        # Employee ID: one letter followed by three digits, e.g. 'A102'
        data = self.clean.clean_empid(data)
        if len(data) != 4 or not data[0].isalpha():
            return False
        return data[1:].isdigit()

    def val_gender(self, data):
        data = self.clean.clean_gender(data)
        return data == "M" or data == "F"

    def val_age(self, data):
        self.clean.clean_age(data)
        return True

    def Validate_Sales(self, Given_Sales):
        # Sales must contain a three-digit number
        pattern = re.compile(r'\d{3}')
        return bool(pattern.match(Given_Sales))

    def val_bmi(self, data):
        data = self.clean.clean_bmi(data)
        return data in ('Normal', 'Overweight', 'Obesity', 'Underweight')

    def Validate_Salary(self, Given_Salary):
        # Salary must start with a two- or three-digit number
        pattern = re.compile(r'[0-9]{2,3}')
        return bool(pattern.match(Given_Salary))

    def val_birthday(self, data):
        self.clean.clean_birthday(data)
        return True
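A minimal usage sketch for Validator, assuming the Cleaner behaviour exercised by the tests above (upper-casing IDs, genders, and BMI categories):

v = Validator()
v.val_empid('a102')    # True: cleaned to 'A102', one letter then three digits
v.val_gender('f')      # True: cleaned to 'F'
v.val_bmi('OBEsity')   # True: cleaned to 'Obesity'
v.val_empid('12AB')    # False: does not start with a letter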
def get_important_words(self, emails, path=None):
    cleaner = Cleaner()
    complete_email_text = ''
    for email in emails:
        email_header = cleaner.delete_tags(email.header)
        email_body = cleaner.delete_tags(email.body)
        topic_line = re.findall(r'Topic.*\n', email_header)[0]
        topic_line = topic_line[6:].strip()
        complete_email_text = (complete_email_text + topic_line + '\n' +
                               email_body + '\n')

    # Clean the text: collapse newlines and runs of whitespace
    complete_email_text = re.sub('\n', ' ', complete_email_text)
    complete_email_text = re.sub(r'\s', ' ', complete_email_text)
    complete_email_text = re.sub(' +', ' ', complete_email_text)
    complete_email_text = tb(complete_email_text)

    # Score every word by TF-IDF and sort from highest to lowest
    bloblist = [complete_email_text]
    words = []
    for blob in bloblist:
        scores = {word: self.tfidf(word, blob, bloblist)
                  for word in blob.words}
        sorted_words = sorted(scores.items(), key=lambda x: x[1],
                              reverse=True)
        for word, score in sorted_words:
            words.append(word)

    # Delete stop-words
    words = self.delete_stopwords(words)
    if path is not None:
        with open(path, 'w') as current_file:
            for word in words:
                current_file.write('{}\n'.format(word))
    return words
def __init__(self):
    self.grid_size = -1
    self.message = {}
    self.action = action.idle()
    self.observation = []
    self.position = (-1, -1)
    self.colour = 'none'
    self.orientation = 'none'
    self.dirt = 'none'
    self.name = 'none'

    # MESSAGES: load the message buffer
    self.messages = []

    # Initialise each mind in turn
    FindGridSizeMind.__init__(self)
    # Mapping map, max bandwidth of 80
    MappingMind.__init__(self)
    GreedyExplore.__init__(self)
    Cleaner.__init__(self)
    GoToPosition.__init__(self)
    Plunger.__init__(self)
def buildTreesAndDics(self, text):
    tic = time()
    for i in range(self.max_len):
        # Flatten the (i+1)-gram lists of every sentence into one list
        n_gram_list = sum(
            map(lambda x: Cleaner.n_gram(x, i + 1), text), [])
        self.len_dict[i + 1] = len(n_gram_list)
        if i >= 1:
            self.vocabulary.extend(list(set(n_gram_list)))
        # Insert every n-gram into both the prefix and the suffix tree
        for word in n_gram_list:
            self.prefixTree.insert(word, i + 1)
            self.suffixTree.insert(word, i + 1)
        sys.stdout.write('build tree done %d/%d\r' % (i, self.max_len))
    print('build tree done! %.2fs' % (time() - tic))
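For reference, a plausible sketch of what Cleaner.n_gram is assumed to compute here; the project's real implementation is not shown in this section:

def n_gram(sentence, n):
    # All contiguous character n-grams of a sentence,
    # e.g. n_gram('abcd', 2) -> ['ab', 'bc', 'cd']
    return [sentence[i:i + n] for i in range(len(sentence) - n + 1)]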
def readline(raw_line, buf):
    '''Load data into the 'fields' and 'types' buffers to be transformed later.'''
    line = raw_line.strip()
    if line.startswith('#fields'):
        fields = raw_line.split('\t')
        fields[-1] = fields[-1].rstrip()
        fields = Cleaner.replace(fields)
        buf['fields'] = fields
    if line.startswith('#types'):
        types = raw_line.split('\t')
        types[-1] = types[-1].rstrip()
        buf['types'] = types
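A minimal usage sketch with made-up Zeek/Bro-style header lines (tab-separated); Cleaner.replace is applied to the fields, so only the types buffer is shown verbatim:

buf = {}
readline('#fields\tts\tuid\tid.orig_h\n', buf)  # hypothetical header line
readline('#types\ttime\tstring\taddr\n', buf)   # hypothetical header line
# buf['types'] == ['#types', 'time', 'string', 'addr']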
def buildTreesAndDics(self, text):
    tic = time()
    pbar = tqdm(range(self.max_len))
    for i in pbar:
        pbar.set_description("buildTreesAndDics, %d-gram" % (i + 1))
        # Flatten the (i+1)-gram lists of every sentence into one list
        n_gram_list = sum(map(lambda x: Cleaner.n_gram(x, i + 1), text), [])
        self.len_dict[i + 1] = len(n_gram_list)
        if i >= 1:
            self.vocabulary.extend(list(set(n_gram_list)))
        # Insert every n-gram into both the prefix and the suffix tree
        for word in n_gram_list:
            self.prefixTree.insert(word, i + 1)
            self.suffixTree.insert(word, i + 1)
    print("build tree done! %.2fs" % (time() - tic))
def __init__(self, rfpath, max_len=4):
    self.prefixTree = Trie()
    self.suffixTree = Trie(direction='suffix')
    self.vocabulary = []
    self.len_dict = dict()
    # Counting words of n characters requires (n+1)-grams
    self.max_len = max_len + 1
    text = Cleaner.preprocess_text(rfpath)
    self.buildTreesAndDics(text)
    self.prefixTree.set_entropy()
    self.suffixTree.set_entropy()
    self.words = dict()
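A hypothetical usage sketch; the class name WordDiscoverer and the corpus path are assumptions, since this section only shows the constructor and tree-building method:

wd = WordDiscoverer('corpus.txt', max_len=4)  # hypothetical name; internally builds up to 5-grams
print(wd.len_dict)  # number of n-grams found for each length 1..5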