# fix random seed to ensure reproducibility
random.seed(42)

# parse command line arguments
parser = argparse.ArgumentParser(
    description='rule extraction by label counting')
parser.add_argument('-q',
                    '--quiet',
                    action="store_true",
                    help='disables info output')
parser.add_argument('config_file', help='the config file to use')
parser.add_argument('config_name', help='the name of the configuration')
args = parser.parse_args()

# read config file
config = util.parse_config_file(args.config_file, args.config_name)

# dictionary for the confidence values extracted from the data set
# maps from rule type to a list containing rules and their confidence
rules = {}
for rule_type in util.rule_types:
    rules[rule_type] = []

if not args.quiet:
    print("Looking for rules involving two concepts...")

# first look for simple rules involving only two concepts
# like "first_concept IMPLIES second_concept" and "first_concept IS DIFFERENT FROM second_concept"
for first_concept in config["concepts"]:
    if not args.quiet:
        print(first_concept)
Пример #2
0
# -*- coding: utf-8 -*-
"""
Analyzes the given data set and prints out its characteristics.

1st argument: config file, 2nd argument: config_name

Created on Thu Feb  8 09:33:14 2018

@author: lbechberger
"""

import util, sys

config = util.parse_config_file(sys.argv[1], sys.argv[2])
util.data_set_characteristics(config["training_vectors"], config["validation_vectors"], config["test_vectors"], config["concepts"])