Пример #1
0
def get_col(stop_file, col):
    """Return the ``col`` entry of the data loaded from ``stop_file``.

    Only the requested column is asked for from ``get_data`` (through its
    ``cols`` argument); the loaded result is then indexed by the same name.
    """
    wanted = [col]
    return get_data(stop_file, cols=wanted)[col]
Пример #2
0
def get_miss(stop_file):
    """Return the ``'miss'`` entry of the data loaded from ``stop_file``.

    ``get_data`` is asked for just that one column, and the result is
    indexed by the same key.
    """
    column = 'miss'
    loaded = get_data(stop_file, cols=[column])
    return loaded[column]
# TODO: fitting the stopping time to a distribution seems harder; better to look at the miss sequence instead

import matplotlib.pyplot as plt
from fitter import Fitter
from scipy.stats import normaltest

from collatz.v1.misc import get_fullpath, get_data, logmsg

# Exploratory script: inspect the distribution of the 'stop' column of the
# stop-data CSV, test it for normality, and try fitting candidate
# distributions to a random sample of it.

# NOTE(review): get_fullpath presumably resolves the project-relative path to
# an absolute one -- confirm against collatz.v1.misc.
STOP_FILE = get_fullpath('data/collatz-stop-100.csv')
# Load the data and keep only its 'stop' entry.
stop = get_data(STOP_FILE)['stop']
# Density-normalised histogram with 100 bins; plt.show() displays the figure
# (and typically blocks until the window is closed in interactive backends).
plt.hist(stop, density=True, bins=100)
plt.show()

# normaltest returns (statistic, p-value); only the p-value is used here.
_, pvalue = normaltest(stop)
# The p-value is reported with 20 decimal places via the format string.
logmsg('Normality test p-value = %.20f', pvalue)

# Fit candidate distributions to a 300000-element random sample of the data,
# passing timeout=60 to Fitter.
# NOTE(review): `stop` is presumably a pandas Series; if so, sample(300000)
# draws without replacement and raises when fewer rows are available --
# confirm the data file is always large enough.
f = Fitter(stop.sample(300000), timeout=60)
f.fit()
# Report the fit results (see the fitter documentation for the exact output).
f.summary()