Пример #1
0
def main():
    sf = ss.Select(Sequence = True, Random = False, Cross = False) #初始化选择器,选择你需要的流程
    sf.ImportDF(df,label = 'nextbuy') #导入数据集以及目标标签
    sf.ImportLossFunction(score, direction = 'ascend') #导入评价函数以及优化方向
    sf.InitialNonTrainableFeatures(['buy','nextbuy','o_date','a_date','PredictDays','user_id']) #初始化不能用的特征
    sf.InitialFeatures(['age_x', 'sex_x', 'user_lv_cd_x', 'buycnt', 'daybeforelastbuy_o_ave']) #初始化其实特征组合
    sf.GenerateCol() #生成特征库 (具体该函数变量请参考根目录下的readme)
    sf.SetSample(1, samplemode = 1) #初始化抽样比例和随机过程
    sf.SetTimeLimit(100) #设置算法运行最长时间,以分钟为单位
    sf.clf = lgbm.LGBMRegressor(random_state=1, num_leaves =6, n_estimators=1000, max_depth=3, learning_rate = 0.2, n_jobs=8) #设定回归模型
    sf.SetLogFile('record.log') #初始化日志文件
    sf.run(validate) #输入检验函数并开始运行
Пример #2
0
def seq(df, f, notusable, clf):
    sf = sequence_selection.Select(Sequence=True, Random=True,
                                   Cross=True)  #初始化选择器,选择你需要的流程
    sf.ImportDF(df, label='buy')  #导入数据集以及目标标签
    sf.ImportLossFunction(score1, direction='ascend')  #导入评价函数以及优化方向
    #sf.ImportCrossMethod(CrossMethod)
    sf.InitialNonTrainableFeatures(notusable)  #初始化不能用的特征
    sf.InitialFeatures(f)
    sf.GenerateCol()  #生成特征库 (具体该函数变量请参考根目录下的readme)
    #    sf.SetTimeLimit(120) #设置算法运行最长时间,以分钟为单位
    sf.clf = clf
    sf.SetLogFile('record_seq8.log')  #初始化日志文件
    return sf.run(validate)  #输入检验函数并开始运行
Пример #3
0
def main():
    sf = ss.Select(Sequence = True, Random = True, Cross = False) #select the way you want to process searching
    sf.ImportDF(prepareData(),label = 'is_trade')
    sf.ImportLossFunction(modelscore,direction = 'descend')
    sf.ImportCrossMethod(CrossMethod)
    sf.InitialNonTrainableFeatures(['used','instance_id', 'item_property_list', 'context_id', 'context_timestamp', 'predict_category_property', 'is_trade'])
    sf.InitialFeatures(['item_category_list', 'item_price_level','item_sales_level','item_collected_level', 'item_pv_level','day'])
    sf.GenerateCol(key = 'mean', selectstep = 2)
    sf.SetSample(0.1, samplemode = 0, samplestate = 0)
#    sf.SetFeaturesLimit(5)
    sf.SetTimeLimit(1)
    sf.clf = lgbm.LGBMClassifier(random_state=1, num_leaves = 6, n_estimators=5000, max_depth=3, learning_rate = 0.05, n_jobs=8)
    sf.SetLogFile('recordml.log')
    sf.run(validation)
def main():
    sf = ss.Select(Sequence=True, Random=False, Cross=True)
    sf.ImportDF(prepareData(), label='Survived')
    sf.ImportLossFunction(modelscore, direction='ascend')
    sf.ImportCrossMethod(CrossMethod)
    sf.InitialNonTrainableFeatures(['Survived'])
    sf.InitialFeatures([])
    sf.GenerateCol()
    sf.SetSample(0.5, samplemode=0, samplestate=0)
    sf.AddPotentialFeatures(['Pclass'])
    sf.clf = LogisticRegression()
    sf.SetLogFile('record2.log')
    #    sf.SetFeaturesLimit(5)
    sf.SetTimeLimit(0.2)
    sf.run(validation)
Пример #5
0
def main():
    sf = ss.Select(Sequence=True, Random=False, Cross=False)  #初始化选择器,选择你需要的流程
    sf.ImportDF(prepareData(), label='buy')  #导入数据集以及目标标签
    sf.ImportLossFunction(score1, direction='ascend')  #导入评价函数以及优化方向
    sf.ImportCrossMethod(CrossMethod)
    sf.InitialNonTrainableFeatures(['USRID', 'FLAG'])  #初始化不能用的特征
    combine_col = ['V1', 'V2', 'V3', 'V4', 'V5', 'V6', 'V7', 'V8', 'V9']  #,
    # 'V10', 'V11', 'V12', 'V13', 'V14', 'V15', 'V16', 'V17', 'V18', 'V19',
    # 'V20', 'V21', 'V22', 'V23', 'V24', 'V25', 'V26', 'V27', 'V28', 'V29',
    # 'V30']
    sf.InitialFeatures(combine_col)  #初始化其实特征组合
    sf.GenerateCol()  #生成特征库 (具体该函数变量请参考根目录下的readme)
    sf.SetSample(1, samplemode=1)  #初始化抽样比例和随机过程
    sf.SetTimeLimit(100)  #设置算法运行最长时间,以分钟为单位
    sf.clf = lgb.LGBMClassifier(random_state=1,
                                num_leaves=6,
                                n_estimators=1000,
                                max_depth=3,
                                learning_rate=0.2,
                                n_jobs=8)  #设定回归模型
    sf.SetLogFile('record.log')  #初始化日志文件
    sf.run(validate)  #输入检验函数并开始运行