예제 #1
0
 def test_id3_ut10(self, tn=10):
     """
     Tests information gain of Temperature in the examples and target_attribute PlayTennis.
     """        
     print('\n============ ID3 UT {} ======================='.format(tn))
     examples, colnames = bin_id3.parse_csv_file_into_examples('play_tennis.csv')
     avt = bin_id3.construct_attrib_values_from_examples(examples, colnames[1:])
     g   = bin_id3.gain(examples, 'PlayTennis', 'Temperature', avt)
     gt  = 0.029222565658954647
     err = 0.0001
     print('gain(Temperature)={}'.format(g))
     assert abs(g - gt) <= err
     print('\n============ ID3 UT {} passed ================'.format(tn))
예제 #2
0
 def test_id3_ut19(self, tn=19):
     """
     Let S = 
     1) {'Day': 'D1',  'Outlook': 'Sunny', 'Temperature': 'Hot', 'Humidity': 'High', 'Wind': 'Weak', 'PlayTennis': 'No'}
     2) {'Day': 'D2',  'Outlook': 'Sunny', 'Temperature': 'Hot', 'Humidity': 'High', 'Wind': 'Strong', 'PlayTennis': 'No'}
     3) {'Day': 'D8',  'Outlook': 'Sunny', 'Temperature': 'Mild', 'Humidity': 'High', 'Wind': 'Weak', 'PlayTennis': 'No'}
     4) {'Day': 'D9',  'Outlook': 'Sunny', 'Temperature': 'Cool', 'Humidity': 'Normal', 'Wind': 'Weak', 'PlayTennis': 'Yes'}
     5) {'Day': 'D11', 'Outlook': 'Sunny', 'Temperature': 'Mild', 'Humidity': 'Normal', 'Wind': 'Strong', 'PlayTennis': 'Yes'}
     Compute 
     1) Entropy(S);
     2) Gain(Temperature);
     3) Gain(Humidity);
     4) Gain(Wind);
     """
     print('\n============ ID3 UT {} ======================='.format(tn))
     examples, colnames = bin_id3.parse_csv_file_into_examples('play_tennis.csv')
     outlook_sunny_examples = bin_id3.find_examples_given_attrib_val(examples, 'Outlook', 'Sunny')
     avt = bin_id3.construct_attrib_values_from_examples(examples, colnames[1:])
     H   = bin_id3.entropy(outlook_sunny_examples, 'PlayTennis', avt)
     gH  = 0.9709505944546686
     err = 0.0001
     print('Entropy(S)={}'.format(H))
     assert abs(H - gH) <= err
     g   = bin_id3.gain(outlook_sunny_examples, 'PlayTennis', 'Temperature', avt)
     gt  = 0.5709505944546686
     err = 0.0001
     print('gain(Temperature)={}'.format(g))
     assert abs(g-gt) <= err
     g   = bin_id3.gain(outlook_sunny_examples, 'PlayTennis', 'Humidity', avt)
     gt  = 0.9709505944546686
     err = 0.0001
     print('gain(Humidity)={}'.format(g))
     assert abs(g-gt) <= err
     g   = bin_id3.gain(outlook_sunny_examples, 'PlayTennis', 'Wind', avt)
     gt  = 0.01997309402197489
     err = 0.0001
     print('gain(Wind)={}'.format(g))
     assert abs(g-gt) <= err
     print('\n============ ID3 UT {} passed ================'.format(tn))
예제 #3
0
 def test_id3_ut09(self, tn=9):
     """
     Tests information gain of Outlook in the examples and target_attribute PlayTennis.
     """        
     print('\n============ ID3 UT {} ======================='.format(tn))
     examples, colnames = bin_id3.parse_csv_file_into_examples('play_tennis.csv')
     avt = bin_id3.construct_attrib_values_from_examples(examples, colnames[1:])
     g   = bin_id3.gain(examples, 'PlayTennis', 'Outlook', avt)
     gt  = 0.2467498197744391
     err = 0.0001
     print('gain(Outlook)={}'.format(g))
     assert abs(g - gt) <= err
     print('\n============ ID3 UT {} passed ================'.format(tn))
예제 #4
0
 def test_id3_ut08(self, tn=8):
     """
     Tests information gain of Humidity in the examples and target_attribute PlayTennis.
     """        
     print('\n============ ID3 UT {} ======================='.format(tn))
     examples, colnames = bin_id3.parse_csv_file_into_examples('play_tennis.csv')
     avt = bin_id3.construct_attrib_values_from_examples(examples, colnames[1:])
     g   = bin_id3.gain(examples, 'PlayTennis', 'Humidity', avt)
     gt  = 0.15183550136234136
     err = 0.0001
     print('gain(Humidity)={}'.format(g))
     assert abs(g - gt) <= err
     print('\n============ ID3 UT {} passed ================'.format(tn))
예제 #5
0
 def test_id3_ut17(self, tn=17):
     """
     Find all examples with Outlook=Overcast and compute info gain of Wind.
     """
     print('\n============ ID3 UT {} ======================='.format(tn))
     examples, colnames = bin_id3.parse_csv_file_into_examples('play_tennis.csv')
     outlook_over_examples = bin_id3.find_examples_given_attrib_val(examples, 'Outlook', 'Overcast')
     avt = bin_id3.construct_attrib_values_from_examples(examples, colnames[1:])        
     g   = bin_id3.gain(outlook_over_examples, 'PlayTennis', 'Wind', avt)
     gt  = 0.0
     err = 0.0001
     print('gain(Wind)={}'.format(g))
     assert abs(g - gt) <= err
     print('\n============ ID3 UT {} passed ================'.format(tn))
예제 #6
0
 def test_id3_ut12(self, tn=12):
     """
     Find all examples with Outlook=Sunny and compute info gain of Temperature.
     """
     print('\n============ ID3 UT {} ======================='.format(tn))
     examples, colnames = bin_id3.parse_csv_file_into_examples('play_tennis.csv')
     outlook_sunny_examples = bin_id3.find_examples_given_attrib_val(examples, 'Outlook', 'Sunny')
     avt = bin_id3.construct_attrib_values_from_examples(examples, colnames[1:])
     g   = bin_id3.gain(outlook_sunny_examples, 'PlayTennis', 'Temperature', avt)
     gt  = 0.5709505944546686
     err = 0.0001
     print('gain(Temperature)={}'.format(g))
     assert abs(g - gt) <= err
     print('\n============ ID3 UT {} passed ================'.format(tn))
예제 #7
0
 def test_id3_ut07(self, tn=7):
     """
     Computes information gain of Wind in the examples and target_attribute PlayTennis.
     """
     print('\n============ ID3 UT {} ======================='.format(tn))
     examples, colnames = bin_id3.parse_csv_file_into_examples('play_tennis.csv')
     avt = bin_id3.construct_attrib_values_from_examples(examples, colnames[1:])
     # print('bin_id3: avt={}'.format(avt))
     g   = bin_id3.gain(examples, 'PlayTennis', 'Wind', avt)
     gt  = 0.04812703040826927
     err = 0.0001
     print('gain(Wind)={}'.format(g))
     assert abs(g - gt) <= err
     print('\n============ ID3 UT {} passed ================'.format(tn))