Python get_iris示例，brightics.function.test_data.get_iris Python示例

示例#1

0

显示文件

文件： manipulation_test.py 项目： eastshine94/studio

 def test1(self):
     df = get_iris()
     out_df = sort(df,
                   input_cols=['species', 'petal_length'],
                   is_asc=['desc', 'asc'])['out_table']
     print(df)
     print(out_df)

示例#2

0

显示文件

 def test_validation(self):
     df = get_iris()
     with self.assertRaises(BrighticsFunctionException) as bfe:
         out_df = sort(df, input_cols=[], is_asc=['desc'])['out_table']
         
     test_errors = bfe.exception.errors
     self.assertTrue({'0033': ['input_cols']} in test_errors)

示例#3

0

显示文件

 def test_groupby1(self):
     df = get_iris()
     train_out = xgb_regression_train(
         df,
         feature_cols=['sepal_length', 'sepal_width', 'petal_length'],
         label_col='petal_width',
         group_by=['species'])
     predict_out = xgb_regression_predict(df, train_out['model'])
     print(predict_out['out_table'][['petal_width', 'prediction']])

示例#4

0

显示文件

 def test3(self):
     # df = df_iris.copy().query(''' species != 'setosa' ''')
     df = get_iris()
     print(df)
     out = add_expression_column_if(
         df, 'encoded_species',
         ['''species == 'setosa' ''', '''species == 'virginica' '''],
         ['1.0', '2.0'], '0.0')['out_table']
     print(out['encoded_species'][48:102])

示例#5

0

显示文件

文件： one_hot_encoder_test.py 项目： shovsj/studio

def get_iris_randomgroup():
    df = get_iris()
    random_group1 = []
    random_group2 = []
    random_group2_map = {1: 'A', 2: 'B'}
    for i in range(len(df)):
        random_group1.append(random.randint(1, 2))
        random_group2.append(random_group2_map[random.randint(1, 2)])
    df['random_group1'] = random_group1
    df['random_group2'] = random_group2
    return df

示例#6

0

显示文件

    def groupby1(self):
        df = get_iris()
        random_group = []
        for i in range(len(df)):
            random_group.append(random.randint(1, 2))
        df['random_group'] = random_group

        train_out = svm_classification_train(df,
                                             feature_cols=[
                                                 'sepal_length', 'sepal_width',
                                                 'petal_length', 'petal_width'
                                             ],
                                             label_col='species',
                                             group_by=['random_group'])
        predict_out = svm_classification_predict(df, train_out['model'])
        print(predict_out['out_table'][['species', 'prediction']])

示例#7

0

显示文件

    def test1(self):
        iris = get_iris()

        df_splitted = split_data(iris, 0.7, 0.3)
        train_df = df_splitted['train_table']
        test_df = df_splitted['test_table']

        train_out = svm_classification_train(train_df,
                                             feature_cols=[
                                                 'sepal_length', 'sepal_width',
                                                 'petal_length', 'petal_width'
                                             ],
                                             label_col='species')
        # print(train_out['model']['svc_model'])

        predict_out = svm_classification_predict(test_df, train_out['model'])
        print(predict_out['out_table'][['species', 'prediction']])

示例#8

0

显示文件

文件： classification_test.py 项目： shovsj/studio

    def test_predict_thresholds(self):
        iris = get_iris()

        df_splitted = split_data(table=iris, train_ratio=0.7, test_ratio=0.3)
        train_df = df_splitted['train_table']
        test_df = df_splitted['test_table']

        train_out = svm_classification_train(table=train_df,
                                             feature_cols=[
                                                 'sepal_length', 'sepal_width',
                                                 'petal_length', 'petal_width'
                                             ],
                                             label_col='species')
        # print(train_out['model']['svc_model'])

        predict_out = svm_classification_predict(table=test_df,
                                                 model=train_out['model'],
                                                 thresholds=[0.1, 0.2, 0.3])
        print(predict_out['out_table'][['species', 'prediction']])

示例#9

0

显示文件

 def setUp(self):
     print("*** Chi-square Test of Independence UnitTest Start ***")
     self.iris = get_iris()

示例#10

0

显示文件

 def setUp(self):
     print("*** SQL UnitTest Start ***")
     df_iris = get_iris()

示例#11

0

显示文件

    
    Unless required by applicable law or agreed to in writing, software
    distributed under the License is distributed on an "AS IS" BASIS,
    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    See the License for the specific language governing permissions and
    limitations under the License.
"""

import unittest
import pandas as pd
import numpy as np
from brightics.function.test_data import get_iris
from brightics.function.transform import sql_execute
from brightics.common.repr import strip_margin

df_iris = get_iris()


class SQLTest(unittest.TestCase):
    def test_percentile(self):
        query = strip_margin('''
        | SELECT percentile(sepal_length, 25) FROM #{DF(0)}
        |''')

        result_df = sql_execute(df_iris, query)['out_table']
        print(result_df)
        self.assertEqual(5.1, result_df.values[0][0],
                         'The percentile is not correct.')

    def test_array(self):
        query = strip_margin('''

示例#12

0

显示文件

 def kmeans_groupby1(self):
     df = get_iris()
     train_out = kmeans_train_predict(df, input_cols=['sepal_length', 'sepal_width', 'petal_length', 'petal_width'], group_by=['species'])
     predict_out = kmeans_predict(df, train_out['model'])
     print(predict_out['out_table'])

示例#13

0

显示文件

文件： manipulation_test.py 项目： eastshine94/studio

 def test2(self):
     df = get_iris()
     out_df = sort(df, input_cols=[], is_asc=['desc'])['out_table']
     print(df)
     print(out_df)