Пример #1
0
    def test_titanic(self):
        query = 'READ "../data/train.csv" (separator = ",", header = 0) AND\
        REPLACE (missing="NaN", strategy="mode") AND SPLIT (train = .8, test = 0.2) AND\
        AND ENCODE (strategy = "regular") AND\
        CLASSIFY (predictors = [1,3,4,5,6,7,8,9,10,11,12], label = 2, algorithm = forest)'

        assert execute(query, verbose=None) is not None
Пример #2
0
    def test_auto(self):
        query = 'READ "../data/auto.csv" (separator = "\s+", header = None) AND\
         REPLACE (missing = "?", strategy = "mode") AND\
          SPLIT (train = .8, test = .2) AND \
          REGRESS (predictors = [2,3,4,5,6,7,8], label = 1, algorithm = lasso)'

        assert execute(query, verbose=None) is not None
Пример #3
0
    def test_chronic(self):
        query = 'READ "../data/chronic.csv" (separator = ",", header = None) AND\
        REPLACE (missing="?", strategy = "mode") AND ENCODE (strategy = "regular") \
        AND SPLIT (train = .8, test = 0.2) AND CLASSIFY \
        (predictors = [1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24],\
         label = 25, algorithm = logistic)'

        assert execute(query, verbose=None) is not None
Пример #4
0
 def test_persistence_preprocessing(self):
     result = execute(
         'READ "../data/census.csv" (separator=",", header = 0, types = [1:numeric, 2:string]) AND\
         REPLACE (strategy = "mode", missing = "NaN", persist = "replace.csv" ) and\
         ENCODE (strategy = "regular", persist = "encode.csv" ) and\
         SPLIT (train = .8, test = 0.2, persist = [test:test.csv, train:train.csv])')
     assert os.path.isfile('replace.csv')
     os.remove('replace.csv')
     assert os.path.isfile('encode.csv')
     os.remove('encode.csv')
     assert os.path.isfile('test.csv')
     os.remove('test.csv')
     assert os.path.isfile('train.csv')
     os.remove('train.csv')
Пример #5
0
def test():
    return execute(query, verbose=None)
Пример #6
0
import sml
from sml import execute

query1 = 'LOAD auto.sml AND\
  REGRESS (predictors = [2,3,4,5,6,7,8], label = 1, algorithm = simple)'

execute(query1, verbose=True)
Пример #7
0
from sml import execute

query = 'READ "data/auto.csv" (separator = "\s+", header = None)'
execute(query, verbose=False)

query = 'READ "data/auto.csv" (separator = "\s+", header = None)'
execute(query, verbose=True)

#TODO: Fix header Bug
#query = 'READ "data/auto.csv" (separator = "\s+", header = [test1,test2,test3,test4,test5,test6,test6,test7,test8,test9])'
#execute(query, verbose=True)
Пример #8
0
 def test_wine(self):
     query = 'READ "../data/wine.csv" (separator = ";", header = 0) AND SPLIT (train = .8, test = 0.2) AND CLASSIFY (predictors = [1,2,3,4,5,6,7,8,9,10,11], label = 12, algorithm = knn)'
     assert execute(query, verbose=None) is not None
Пример #9
0
 def test_spam(self):
     query = 'READ "../data/spam.csv" AND SPLIT (train = .8, test = 0.2) AND CLASSIFY (predictors = [1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56], label = 58, algorithm = bayes)'
     assert execute(query, verbose=None) is not None
Пример #10
0
 def test_seeds(self):
     query = 'READ "../data/seeds.csv" (separator = "\s+", header = 0) AND SPLIT (train = .8, test = .2, validation = .0) and REPLACE (missing="NaN", strategy="mode") AND CLUSTER (predictors = [1,2,3,4,5,6,7], label = 8, algorithm = kmeans)'
     assert execute(query, verbose=None) is not None
Пример #11
0
    def test_iris(self):
        query = 'READ "../data/iris.csv" AND \
         SPLIT (train = .8, test = 0.2) AND \
         CLASSIFY (predictors = [1,2,3,4], label = 5, algorithm = svm)'

        assert execute(query, verbose=None) is not None
Пример #12
0
    def test_computer(self):
        query = 'READ "../data/computer.csv" (separator = ",", header = 0) AND \
        SPLIT (train = .8, test = .2, validation = .0) AND ENCODE (strategy = "regular")\
         AND REGRESS (predictors = [1,2,3,4,5,6,7,8,9], label = 10, algorithm = ridge)'

        assert execute(query, verbose=None) is not None
Пример #13
0
 def test_census(self):
     query = 'READ "../data/census.csv" (separator=",", header = 0, types = [1:numeric, 2:string]) AND REPLACE (missing = "NaN", strategy = "mode") and ENCODE (strategy = "regular") and SPLIT (train = .8, test = 0.2) and CLASSIFY (predictors=[1,2,3,4,5 , 6,7, 8, 9, 10 ,11 ,12, 13,14], label = 15, algorithm = logistic)'
     assert execute(query, verbose=None) is not None
Пример #14
0
 def test_boston(self):
     query = 'READ "../data/boston.csv" (separator = "\s+", header = 0) AND SPLIT (train = .8, test = .2, validation = .0) AND REGRESS (predictors = [1,2,3,4,5,6,7,8,9,10,11,12,13], label = 14, algorithm = elastic)'
     assert execute(query, verbose=None) is not None