Ejemplo n.º 1
0
    def getNonMonitoredTarget(webpageTrainSource):
        """Return the webpage stored in ``config.LARGEST_WEBPAGE``.

        While ``config.BUILD_ALL_WEBPAGES`` is truthy, the target is first
        loaded: the first element of
        ``Datastore.getWebpagesWangTor([101], 1, 2)`` is appended to
        ``config.ALL_WEBPAGES`` and stored in ``config.LARGEST_WEBPAGE``,
        and the flag is set to ``False`` so later calls skip the load.

        ``webpageTrainSource`` is accepted but not used by this function.
        """
        # Target already prepared by an earlier call: hand back the cached one.
        if not config.BUILD_ALL_WEBPAGES:
            return config.LARGEST_WEBPAGE

        # NOTE(review): 101 looks like a webpage id and (1, 2) a trace range,
        # judging by how getWebpagesWangTor is called elsewhere -- confirm.
        target = Datastore.getWebpagesWangTor([101], 1, 2)[0]

        config.ALL_WEBPAGES.append(target)
        config.BUILD_ALL_WEBPAGES = False
        config.LARGEST_WEBPAGE = target

        return config.LARGEST_WEBPAGE
                    elif config.DATA_SOURCE == 1 or config.DATA_SOURCE == 2:
                        webpageTrain = Datastore.getWebpagesHerrmann(
                            [webpageId], seed - config.NUM_TRAINING_TRACES,
                            seed)
                        webpageTest = Datastore.getWebpagesHerrmann(
                            [webpageId], seed,
                            seed + config.NUM_TESTING_TRACES)
                    elif config.DATA_SOURCE == 5:
                        if not unMonitoredWebpageIdsObj.__contains__(
                                webpageId):
                            # this block of code can be applied to either a closed or open-world
                            if config.COVARIATE_SHIFT == 0:  # Normal case
                                # monitored webpage so we take instances for training and testing as we do regularly
                                webpageTrain = Datastore.getWebpagesWangTor(
                                    [webpageId],
                                    seed - config.NUM_TRAINING_TRACES, seed)
                                webpageTest = Datastore.getWebpagesWangTor(
                                    [webpageId], seed,
                                    seed + config.NUM_TESTING_TRACES)
                            else:
                                # span time training/testing
                                # monitored webpage so we take instances for training and testing as we do regularly
                                webpageTrain = Datastore.getWebpagesWangTor(
                                    [webpageId], 0, config.NUM_TRAINING_TRACES)
                                webpageTest = Datastore.getWebpagesWangTor(
                                    [webpageId], config.NUM_TRAINING_TRACES +
                                    config.COVARIATE_SHIFT,
                                    config.NUM_TRAINING_TRACES +
                                    config.COVARIATE_SHIFT +
                                    config.NUM_TESTING_TRACES)
Ejemplo n.º 3
0
                        elif config.DATA_SOURCE == 1 or config.DATA_SOURCE == 2:
                            webpageTrain = Datastore.getWebpagesHerrmann(
                                [webpageId], seed - config.NUM_TRAINING_TRACES,
                                seed)
                            webpageTest = Datastore.getWebpagesHerrmann(
                                [webpageId], seed,
                                seed + config.NUM_TESTING_TRACES)
                        elif config.DATA_SOURCE == 5:
                            if not unMonitoredWebpageIdsObj.__contains__(
                                    webpageId):
                                # this block of code can be applied to either a closed or open-world
                                if config.COVARIATE_SHIFT == 0:  # Normal case
                                    # monitored webpage so we take instances for training and testing as we do regularly
                                    webpageTrain = Datastore.getWebpagesWangTor(
                                        [webpageId],
                                        seed - config.NUM_TRAINING_TRACES,
                                        seed)
                                    webpageTest = Datastore.getWebpagesWangTor(
                                        [webpageId], seed,
                                        seed + config.NUM_TESTING_TRACES)
                                else:
                                    # span time training/testing
                                    # monitored webpage so we take instances for training and testing as we do regularly
                                    #webpageTrain = Datastore.getWebpagesWangTor( [webpageId], 0, config.NUM_TRAINING_TRACES )
                                    #webpageTest  = Datastore.getWebpagesWangTor( [webpageId], config.NUM_TRAINING_TRACES+config.COVARIATE_SHIFT, config.NUM_TRAINING_TRACES+config.COVARIATE_SHIFT+config.NUM_TESTING_TRACES )

                                    endSlideTrain = config.START_SLIDE_TRAIN + config.NUM_TRAINING_TRACES
                                    webpageTrain = Datastore.getWebpagesWangTor(
                                        [webpageId], config.START_SLIDE_TRAIN,
                                        endSlideTrain)
                                    webpageTest = Datastore.getWebpagesWangTor(