Beispiel #1
0
            result = np.concatenate((result, col), axis=1)

    return result


avg_window_size = 3
btc_window_size = 4
avg = [10, 22, 30, 42, 50, 62, 70, 82, 90, 102]
btc = [110, 123, 130, 143, 150, 163, 170, 183, 190, 203]
trend = [212, 224, 232, 244, 252, 264, 272, 284, 292, 304]

df = DataFrame({'btc': btc,
                'trend': trend})
print(btc)

avg_diff = data_misc.difference(avg, 1)
avg_supervised = data_misc.timeseries_to_supervised(avg_diff, avg_window_size)
print(avg_supervised)

btc_supervised = supervised_diff_dt(df, btc_window_size)

# We pair the avg_supervised column with the weight_supervised
cut_beginning = [avg_window_size, btc_window_size]
cut_beginning = max(cut_beginning)

avg_supervised = avg_supervised.values[cut_beginning:, :]
btc_supervised = btc_supervised[cut_beginning:, :]

# Concatenate with numpy
supervised = np.concatenate((btc_supervised, avg_supervised), axis=1)
Beispiel #2
0
from Util import misc

window_size = 5  # 15
path = 'C:/tmp/bitcoin/'
input_file = 'bitcoin_usd_bitcoin_block_chain_trend_by_day.csv'
series = read_csv(path + input_file, header=0, sep=',', nrows=1438)
series = series.iloc[::-1]

for i in range(0, 30):
    corr = series['Avg'].autocorr(lag=i)
    print('Corr: %.2f Lang: %i' % (corr, i))

avg = series['Avg']
avg_values = avg.values
# Stationary Data
diff_values = data_misc.difference(avg_values, 1)
avg_values = diff_values
print("Diff values")

supervised = data_misc.timeseries_to_supervised(avg_values, window_size)
# print(raw_values)
supervised = supervised.values[window_size:, :]
# supervised = list(range(1, 101))

size_supervised = len(supervised)
split_train_val = int(size_supervised * 0.60)
split_val_test = int(size_supervised * 0.20)

train = supervised[0:split_train_val]
val = supervised[split_train_val:split_train_val + split_val_test]
test = supervised[split_train_val + split_val_test:]
    return rmse, predictions


print('main_passangers.py, stationary.')
series = read_csv('../data/airline-passengers.csv', header=0, sep='\t')

date = series['Date'].values
date = numpy.delete(date, (0), axis=0)

raw_values = series['Passangers'].values

size_raw_values = len(raw_values)
split = int(size_raw_values * 0.80)  # 0.80
print('raw_values:' + str(len(raw_values)))

diff_values = data_misc.difference(raw_values, 1)
print('Diff:' + str(len(diff_values)))

print('Raw values total size: %i, Train size: %i, Test size: %i ' %
      (size_raw_values, split, size_raw_values - split))

supervised = data_misc.timeseries_to_supervised(diff_values, 1)

supervised_values = supervised.values
# supervised_values = supervised_values[1:, :]

# raw_values = numpy.delete(raw_values, (-1), axis=0)

print('Supervised:' + str(len(supervised_values)))
print('Raw values:' + str(len(raw_values)))