예제 #1
0
    def __init__(self, args):
        """Set up logging and the processing tools, then initialise the base class.

        Args:
            args: Passed unchanged to the superclass initialiser.
        """
        # create logger
        self.logger = logging.getLogger(__name__)
        self.logger.setLevel(logging.DEBUG)

        # logging.getLogger(__name__) hands back the same logger object on
        # every call, so the console handler is attached only while the logger
        # has no handler yet. Without this guard every additional instance
        # would add one more handler and each message would be emitted once
        # per instance created so far.
        if not self.logger.handlers:
            # console handler that lets everything from DEBUG upwards through
            ch = logging.StreamHandler()
            ch.setLevel(logging.DEBUG)
            ch.setFormatter(logging.Formatter(
                '%(asctime)s - %(name)s - %(levelname)s - %(message)s'))
            self.logger.addHandler(ch)

        # Values are passed as arguments so that logging performs the
        # %-interpolation itself (and only when the record is emitted).
        self.logger.debug("Starting Collector process in %s", os.getcwd())
        self.logger.debug("Gevent Version %s", gevent.__version__)

        #TODO: move output file name to config
        #fname = "./NetFlow.%s.bin"%str(time.time()*100000)

        #WARN: might want to remove this after testing
        #self.out = open(fname,"wb")

        # create tool instances
        self.interface = Interface()
        self.parse = Parse()
        self.describe = Describe()
        self.standardize = Standardize()
        self.transform = Transform()
        self.partition = Partition()

        self.q = Queue()
        self.inWindow = False

        self.score = Score()
        #TODO: move csv name to config
        self.csv = CSV("output.csv")

        # The base-class initialiser runs last, after all attributes exist.
        return super(Collector, self).__init__(args)
예제 #2
0
파일: pair_plot.py 프로젝트: floblanc/dslr
from loader import FileLoader
from describe import Describe


class Pair_Plot():
    """Shows a pair plot of a dataset, coloured by the "Hogwarts House" column."""

    def pair_plot(self, data, desc):
        """Display a pair plot of ``data`` without its "Index" column.

        The plot is produced with ``sns.pairplot`` using "Hogwarts House" as
        the hue and shown with ``plt.show()``. If anything in that sequence
        raises, a message is printed and the process exits with status 1.

        Args:
            data: Table exposing a pandas-style ``drop`` method and containing
                "Index" and "Hogwarts House" columns (presumably a pandas
                DataFrame -- confirm against the loader). It is not modified.
            desc: Unused; kept so existing callers keep working.

        Raises:
            SystemExit: With code 1 when dropping the column or plotting fails.
        """
        # Local import so the method does not rely on a file-level import.
        import sys

        try:
            # Work on a copy: dropping in place would alter the caller's data
            # and make a second call with the same object fail, because the
            # "Index" column would already be gone.
            plot_data = data.drop("Index", axis=1)
            sns.pairplot(plot_data, hue="Hogwarts House", markers=".")
            plt.show()
        except Exception as e:
            print("Pair plot failed : {}".format(e))
            # sys.exit instead of the interactive-only exit() helper, and a
            # non-zero status so the failure is visible to the calling shell.
            sys.exit(1)


if __name__ == '__main__':
    # Script entry point: pair_plot.py [dataset]
    # With no argument the bundled training set is plotted; with one argument
    # that file is plotted instead; more arguments are rejected.

    # Local import: only this entry point needs os.
    import os

    if len(sys.argv) > 2:
        print("There is too much arguments.")
    else:
        dataset = "datasets/dataset_train.csv"
        if len(sys.argv) == 2:
            dataset = sys.argv[1]

        # Resolve the dataset against sys.path[0] (normally the directory of
        # the running script). os.path.join keeps relative names anchored
        # there, while an absolute path given on the command line is used
        # as-is instead of being glued behind the directory.
        path = os.path.join(sys.path[0], dataset)

        loader = FileLoader()
        data = loader.load(path)

        describer = Describe()
        result = describer.describe(data)

        pair_plotter = Pair_Plot()
        pair_plotter.pair_plot(data, result)