Ejemplos de Paint.GetDataFromDataframe en Python

Lenguaje de programación: Python

Namespace/Package Name: class_paint

Clase / Tipo: Paint

Método / Función: GetDataFromDataframe

Ejemplos en hotexamples.com: 3

Python Paint.GetDataFromDataframe: 3 ejemplos encontrados. Estos son los ejemplos reales en Python mejor valorados de class_paint.Paint.GetDataFromDataframe, extraídos de proyectos de código abierto. Puedes valorar los ejemplos para ayudarnos a mejorar su calidad.

Métodos usados con frecuencia

Mostrar / Ocultar

Paint(4)

GetDataFromDataframe(3)

GetDataFromExcel(1)

bar(1)

box(1)

heat(1)

histo(1)

joint(1)

xyplot(1)

Ejemplo n.º 1

Mostrar archivo

def predict():
    """Chart the accuracy of several regressors against a random baseline.

    Calls the ridge, lasso, linear, SVM and random methods of ``Predict`` in
    that order, collects their results into one long-format DataFrame
    (columns ``algorithm``, ``accuracy``, ``kind``) and saves a bar chart
    drawn by ``Paint.bar``.

    NOTE(review): each ``Predict`` method is assumed to return exactly two
    values, ordered (train accuracy, test accuracy); the label and kind
    columns are built on that assumption -- confirm against ``Predict``.
    """
    predictor = Predict()
    # The method names double as the labels shown on the chart.
    algorithms = ('ridge', 'lasso', 'linear', 'SVM', 'random')
    labels = []
    scores = []
    for name in algorithms:
        labels += [name] * 2  # one label per score of the assumed pair
        scores += getattr(predictor, name)()
    kinds = ['train_accuracy', 'test_accuracy'] * len(algorithms)
    frame = pd.DataFrame({
        'algorithm': labels,
        'accuracy': scores,
        'kind': kinds,
    })
    painter = Paint()
    painter.GetDataFromDataframe(frame)
    plt.figure(figsize=(8, 8))
    painter.bar('algorithm', 'accuracy', 'kind')
    plt.savefig('图13：各种回归算法及随机数预测准确率柱状图')

Ejemplo n.º 2

Mostrar archivo

def wash():
    """Run the first cleaning pass over the data and export the result.

    Loads ``data.db`` through ``Wash``, runs the per-feature cleaning steps,
    removes duplicate rows, saves a price/location figure, then calls
    ``GetDistance(2)`` and ``Select`` before writing ``RawData.xls``.
    """
    washer = Wash()
    washer.GetDataFromDatabase('data.db')
    # Per the original author's note, these steps convert each feature to its
    # proper data type and filter out extreme outliers.
    cleaning_steps = (
        washer.UnitPriceWash,
        washer.StructureWash,
        washer.StoreyWash,
        washer.SizeWash,
        washer.AgeWash,
        washer.DecorateWash,
        washer.XYWash,
    )
    for run_step in cleaning_steps:
        run_step()

    # Rows sharing all four of these columns count as duplicates.
    listings = washer.df
    duplicate_keys = ['unit_price', 'structure', 'storey', 'size']
    listings.drop_duplicates(duplicate_keys, inplace=True)

    # Price-versus-location plot; the original note says it is used to
    # locate the city centre.
    painter = Paint()
    painter.GetDataFromDataframe(listings)
    plt.figure(figsize=(8, 8))
    painter.xyplot()
    plt.savefig('图1：上海二手房价格与地段示意图')

    # Original note: K-means finds two price centroids and each home's
    # average distance to them is computed.
    washer.GetDistance(2)
    washer.Select()
    # Re-read washer.df here: the calls above may have rebound it.
    washer.df.to_excel('RawData.xls')

Ejemplo n.º 3

Mostrar archivo

Archivo: main.py Proyecto: sikadeer/CS902-FINAL-project

def norm():
    """Normalise the preliminarily cleaned data and compare the methods.

    Reads ``RawData.xls``, applies max-min, log and z-score normalisation to
    every numeric feature, saves one 2x2 histogram figure for the raw data
    and one per normalisation method, then keeps the log-normalised values
    under the original column names and writes ``Washed Data.xls``.

    NOTE(review): the original comments say each histogram also reports
    skewness and kurtosis; the ``x``/``y`` arguments passed to
    ``Paint.histo`` are presumably the position of that annotation --
    confirm against ``Paint.histo``.
    """
    features = ['unit_price', 'size', 'age', 'distance']
    methods = ('MaxMinNorm', 'LogNorm', 'ZscoreNorm')

    washer = Wash()
    washer.GetDataFromExcel('RawData.xls')
    for feature in features:
        washer.MaxMinNorm(feature)
        washer.LogNorm(feature)
        washer.ZscoreNorm(feature)
    frame = washer.df
    painter = Paint()
    painter.GetDataFromDataframe(frame)

    # One entry per saved figure:
    #   (column prefix, (x, y) per feature in `features` order,
    #    figure title, output file name)
    # An empty prefix selects the raw, un-normalised columns.
    figures = [
        ('',
         [(75000, 0.00002), (120, 0.012), (25, 0.06), (55, 0.08)],
         'Histogram of Raw Data',
         '图2：未归一化的数据直方图'),
        ('MaxMinNorm',
         [(0.6, 2.5), (0.6, 2.5), (0.6, 2.5), (0.6, 8)],
         'Histogram of Max-Min Normalization',
         '图3：max-min归一化的直方图'),
        ('LogNorm',
         [(0.65, 2), (0.65, 2), (0.65, 4), (0.65, 4)],
         'Histogram of Log Normalization',
         '图4：Log归一化的直方图'),
        ('ZscoreNorm',
         [(0.65, 2), (0.65, 2), (0.65, 2), (0.65, 6)],
         'Histogram of Zscore Normalization',
         '图5：ZscoreNorm归一化的直方图'),
    ]
    for prefix, anchors, title, filename in figures:
        plt.figure(figsize=(8, 8))
        # Subplot codes 221..224 fill the 2x2 grid in feature order.
        panels = enumerate(zip(features, anchors), start=221)
        for slot, (feature, (x_pos, y_pos)) in panels:
            plt.subplot(slot)
            painter.histo(prefix + feature, bins=30, x=x_pos, y=y_pos)
        plt.suptitle(title)
        plt.savefig(filename)

    # Per the original note, log normalisation was chosen after comparing
    # the figures: its values replace the raw columns.
    for feature in features:
        frame[feature] = frame['LogNorm' + feature]

    # Drop every intermediate normalised column.
    helper_columns = [
        method + feature
        for feature in features
        for method in methods
    ]
    frame.drop(helper_columns, axis=1, inplace=True)
    frame.to_excel('Washed Data.xls')  # store the normalised data in Excel
    print('数据归一化部分已完成')