示例#1
0
def algorithm1_mod(train1, train2):
    """
    - Performs algorithm 1 described in 'Mining Railway Delay Dependencies in
    Large-Scale Real-World Delay Data' (Flier, Gelashvili, Graffagnino,
    Nunkesser).
    - train1 and train2 must be numpy arrays containing delay times of the
    trains. There can be no missing values, and train1[d], train2[d] must be
    delay data from the same day d. Implicitly train1 and train2 must be of
    equal length.
    - This is a modified version of algorithm1 as described in section 5
    of 'Mining Railway Delay Dependencies in Large-Scale Real-World Delay Data'
    (Flier, Gelashvili, Graffagnino, Nunkesser).
    """

    train1, train2 = train_sorting.sort_two_non_dec(train1, train2)
    train1 = train_sorting.append(train1, float('inf'))
    train2 = train_sorting.append(train2, float(0))

    #set max number of exceptional points
    rbar = 0.025*(len(train1))

    #Locals
    exceptional = Queue.PriorityQueue(maxsize=int(math.floor(rbar)))
    s_i = train_sorting.difference(train1, train2)
    k = 0 #pylint:disable=invalid-name
    k_star = 0
    s = s_i[0]#pylint:disable=invalid-name
    s_star = 0
    l = 0 #pylint:disable=invalid-name
    e_star = 0 # maximal delay
    sol = False

    #The algorithm:
    for i in range(len(train1)):
        if s_i[i] > s:
            if exceptional.full():
                sol = True
                #cannot extend current solution to train1[i], train2[i]
                if k > k_star:
                    #update best solution
                    k_star = k
                    s_star = s
                    e_star = train1[i - 1]

                #initialize new solution
                s = s_i[exceptional.get()] #pylint:disable=invalid-name
                
                #find first point in new interval
                while train1[l] < s and l < len(train1):
                    l += 1 #pylint:disable=invalid-name
                k = i - l + 1
            else:
                exceptional.put(i, s_i[i])
                k += 1
        else:
            k += 1
    if sol:
        return (k_star, s_star, e_star)
    else:
        return algorithm1(train1, train2)
示例#2
0
def algorithm1(train1, train2):
    """
    - Performs algorithm 1 described in 'Mining Railway Delay Dependencies in
    Large-Scale Real-World Delay Data' (Flier, Gelashvili, Graffagnino,
    Nunkesser).
    - train1 and train2 must be numpy arrays containing delay times of the
    trains. There can be no missing values, and train1[d], train2[d] must be
    delay data from the same day d. Implicitly train1 and train2 must be of
    equal length.
    """

    train1, train2 = train_sorting.sort_two_non_dec(train1, train2)
    train1 = train_sorting.append(train1, float('inf'))
    train2 = train_sorting.append(train2, float(0))

    #Locals
    diff = train_sorting.difference(train1, train2)
    points = 0
    points_star = 0
    bft = diff[0] #buffertime
    bft_star = 0
    lpi = 0 #last point index
    md_star = 0 # maximal delay

    #The algorithm:
    for i in range(len(train1)):
        if diff[i] > bft:
            if points > points_star:
                #update best solution
                points_star = points
                bft_star = bft
                md_star = train1[i-1]

            bft = diff[i]
            notdone = True
            while notdone:
                if (train1[lpi] < bft and
                    lpi < len(train1)):
                    lpi += 1
                else:
                    notdone = False
            points = i - lpi + 1
        else:
            points += 1

    return (points_star, bft_star, md_star)
示例#3
0
def algorithm2(train1, train2, minwidth=60):
    """
    - Performs algorithm 2 described in 'Mining Railway Delay Dependencies in
    Large-Scale Real-World Delay Data' (Flier, Gelashvili, Graffagnino,
    Nunkesser).
    - Optional parameter minwidth describes the minimum requiered headway
    between trains using the same infrastructure, varies from station to
    station.
    - train1 and train2 must be numpy arrays containing delay times of the
    trains. There can be no missing values, and train1[d], train2[d] must be
    delay data from the same day d. Implicitly train1 and train2 must be of
    equal length.
    """
    train1, train2 = train_sorting.sort_two_non_dec(train1, train2)
    train1 = train_sorting.append(train1, float('inf'))
    train2 = train_sorting.append(train2, 0)

    #Locals
    intercepts = sorted(train_sorting.difference(train1, train2))
    points = 0
    points_star = 0
    left = 0
    leftstar = 0
    right = 0
    rightstar = 0
    fai = 0 #index of first point above stripe

    #The algorithm
    for j in range(1, len(intercepts)):
        left = intercepts[j-1]
        right = intercepts[j]
        if right - left >= minwidth:

            while train1[fai] < left:
                fai += 1

            points = j - fai
            if points > points_star:
                #update best solution
                points_star = points
                leftstar = left
                rightstar = right

    return (points_star, leftstar, rightstar)