Example #1
 def setup_class(self):
     self.API = veritable.connect(TEST_API_KEY, TEST_BASE_URL,
                                  **connect_kwargs)
     self.t = self.API.create_table()
     self.t.batch_upload_rows([{
         '_id': 'row1',
         'cat': 'a',
         'ct': 0,
         'real': 1.02394,
         'bool': True
     }, {
         '_id': 'row2',
         'cat': 'b',
         'ct': 0,
         'real': 0.92131,
         'bool': False
     }, {
         '_id': 'row3',
         'cat': 'c',
         'ct': 1,
         'real': 1.82812,
         'bool': True
     }, {
         '_id': 'row4',
         'cat': 'c',
         'ct': 1,
         'real': 0.81271,
         'bool': True
     }, {
         '_id': 'row5',
         'cat': 'd',
         'ct': 2,
         'real': 1.14561,
         'bool': False
     }, {
         '_id': 'row6',
         'cat': 'a',
         'ct': 5,
         'real': 1.03412,
         'bool': False
     }])
     self.schema = {
         'cat': {
             'type': 'categorical'
         },
         'ct': {
             'type': 'count'
         },
         'real': {
             'type': 'real'
         },
         'bool': {
             'type': 'boolean'
         }
     }
     self.a = self.t.create_analysis(self.schema,
                                     analysis_id="a1",
                                     force=True)
     self.a.wait()
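Once a fixture like this has run, the analysis can be queried the same way the later examples on this page do, by passing a row with the target column set to None. A minimal sketch of such a test (not from the actual test suite; the asserted behaviour is an assumption):

 def test_predict_missing_real(self):
     # Hypothetical test: ask the analysis to fill in the 'real' column.
     # None marks the value to be predicted, as in the predict examples below.
     row = {'cat': 'a', 'ct': 0, 'real': None, 'bool': True}
     prediction = self.a.predict(row)
     # Assumption: the returned prediction exposes the filled-in value by
     # column name, as the other examples on this page do.
     assert prediction['real'] is not None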
Example #2
def predict():
	API_KEY = '<API_KEY>'
	api = veritable.connect(api_key=API_KEY)
	table = api.get_table('heart_data')
	analysis = table.get_analysis('heart_analysis')
	# request.args keys() is not directly indexable in Python 3, so materialise
	# it as a list; the whole JSON document is expected to arrive as a single
	# query-string key.
	foo = list(request.args.to_dict().keys())
	new_patient = sj.loads(foo[0])
	del new_patient['']
	for k in new_patient:
		new_patient[k] = float(new_patient[k])
	new_patient['num'] = None
	prediction = analysis.predict(new_patient)
	return jsonify(predicted=prediction['num'])
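The route above assumes Flask scaffolding and imports that are not shown in this snippet. A minimal sketch of the module-level setup it would need (the route URL and the simplejson alias are assumptions):

from flask import Flask, request, jsonify
import simplejson as sj   # assumed: the snippet parses the incoming JSON with sj.loads
import veritable

app = Flask(__name__)

# the predict() view above would then be registered with something like:
# @app.route('/predict')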
 def setup_class(self):
     self.API = veritable.connect(TEST_API_KEY, TEST_BASE_URL,
         **connect_kwargs)
     self.t = self.API.create_table()
     self.t.batch_upload_rows(
     [{'_id': 'row1', 'cat': 'a', 'ct': 0, 'real': 1.02394, 'bool': True},
      {'_id': 'row2', 'cat': 'b', 'ct': 0, 'real': 0.92131, 'bool': False},
      {'_id': 'row3', 'cat': 'c', 'ct': 1, 'real': 1.82812, 'bool': True},
      {'_id': 'row4', 'cat': 'c', 'ct': 1, 'real': 0.81271, 'bool': True},
      {'_id': 'row5', 'cat': 'd', 'ct': 2, 'real': 1.14561, 'bool': False},
      {'_id': 'row6', 'cat': 'a', 'ct': 5, 'real': 1.03412, 'bool': False}
     ])
     self.connection = self.t._conn
     self.collection = self.t._link("rows")
Example #4
def main(data_file, schema_file):
    rows = json.loads(open(data_file).read())
    schema = json.loads(open(schema_file).read())
    
    api = veritable.connect()
    
    if not api.table_exists(TABLE_NAME):
        print('Creating table')
        table = api.create_table(TABLE_NAME)
    else:
        print('Getting table')
        table = api.get_table(TABLE_NAME)

    print('Uploading rows')
    table.batch_upload_rows(rows)
    print('Creating analysis')
    analysis = table.create_analysis(schema)
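The analysis in this example is created asynchronously and the function returns without waiting for it. A possible follow-up, assuming the wait/predict pattern used by the other examples on this page (the choice of target column here is purely illustrative):

    # Block until the analysis has finished, then predict a value for one of
    # the schema's columns (picking the first column is a hypothetical choice).
    analysis.wait()
    target = sorted(schema.keys())[0]
    prediction = analysis.predict({target: None})
    print('Predicted %s: %s' % (target, prediction[target]))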
 def setup_class(self):
     self.API = veritable.connect(TEST_API_KEY, TEST_BASE_URL,
                                  **connect_kwargs)
     self.t = self.API.create_table()
     self.t.batch_upload_rows([{
         '_id': 'row1',
         'cat': 'a',
         'ct': 0,
         'real': 1.02394,
         'bool': True
     }, {
         '_id': 'row2',
         'cat': 'b',
         'ct': 0,
         'real': 0.92131,
         'bool': False
     }, {
         '_id': 'row3',
         'cat': 'c',
         'ct': 1,
         'real': 1.82812,
         'bool': True
     }, {
         '_id': 'row4',
         'cat': 'c',
         'ct': 1,
         'real': 0.81271,
         'bool': True
     }, {
         '_id': 'row5',
         'cat': 'd',
         'ct': 2,
         'real': 1.14561,
         'bool': False
     }, {
         '_id': 'row6',
         'cat': 'a',
         'ct': 5,
         'real': 1.03412,
         'bool': False
     }])
     self.connection = self.t._conn
     self.collection = self.t._link("rows")
 def setup_class(self):
     self.API = veritable.connect(TEST_API_KEY, TEST_BASE_URL,
         **connect_kwargs)
     self.t = self.API.create_table()
     self.rows = [{'_id': 'row1', 'cat': 'a', 'ct': 0, 'real': 1.02394, 'bool': True},
      {'_id': 'row2', 'cat': 'b', 'ct': 0, 'real': 0.92131, 'bool': False},
      {'_id': 'row3', 'cat': 'c', 'ct': 1, 'real': 1.82812, 'bool': True},
      {'_id': 'row4', 'cat': 'c', 'ct': 1, 'real': 0.81271, 'bool': True},
      {'_id': 'row5', 'cat': 'd', 'ct': 2, 'real': 1.14561, 'bool': False},
      {'_id': 'row6', 'cat': 'a', 'ct': 5, 'real': 1.03412, 'bool': False}]
     self.t.batch_upload_rows(self.rows)
     self.schema = {'cat': {'type': 'categorical'},
               'ct': {'type': 'count'},
               'real': {'type': 'real'},
               'bool': {'type': 'boolean'}
               }
     self.a = self.t.create_analysis(self.schema, analysis_id="a1",
         force=True)
     self.a.wait()
def main():

    ##########
    # UPLOAD #
    ##########

    # 1. Define the schema for the table - specify column names and data types
    table_schema = {
        'age': {
            'type': 'count'
        },
        'sex': {
            'type': 'categorical'
        },
        'region': {
            'type': 'categorical'
        },
        'income': {
            'type': 'real'
        },
        'married': {
            'type': 'boolean'
        },
        'children': {
            'type': 'count'
        },
        'car': {
            'type': 'boolean'
        },
        'save_act': {
            'type': 'boolean'
        },
        'current_act': {
            'type': 'boolean'
        },
        'mortgage': {
            'type': 'boolean'
        },
        'pep': {
            'type': 'boolean'
        },
    }

    # 2. Load the data from csv and divide it into training and test subsets
    # Load rows from CSV; all row data values come back as strings
    rows = read_csv(DATA_FILE)
    # Convert row data values to the correct types based on the schema
    clean_data(rows, table_schema)
    # Split into training and test sets
    training_rows, test_rows = split_rows(rows, TRAIN_FRAC)

    # 3. Connect to the Veritable API
    api = veritable.connect()
    if api.table_exists(TABLE_ID):
        print("Deleting old table '%s'" % TABLE_ID)
        api.delete_table(TABLE_ID)

    # 4. Create a Veritable Table and upload training rows
    print("Creating table '%s' and uploading rows" % TABLE_ID)
    table = api.create_table(table_id=TABLE_ID)
    table.batch_upload_rows(training_rows)

    ###########
    # ANALYZE #
    ###########

    # 5. Create a Veritable Analysis and wait for it to complete
    print("Creating analysis '%s' and waiting for it to complete" %
          ANALYSIS_ID)
    analysis = table.create_analysis(schema=table_schema,
                                     analysis_id=ANALYSIS_ID)
    analysis.wait()

    ###########
    # PREDICT #
    ###########

    # 6. For each row in the test set, predict the value and uncertainty for the target column
    print("Making predictions")

    prediction_results = []
    for test_row in test_rows:
        # Prepare the prediction request
        prediction_request = test_row.copy()  # Copy known values from test row
        del prediction_request['_id']          # '_id' should not be present in prediction requests
        prediction_request[TARGET_COL] = None  # None values are predicted by Veritable

        # Make predictions
        prediction = analysis.predict(prediction_request, PRED_COUNT)

        # Derive a single value estimate and uncertainty metric
        estimate = prediction[TARGET_COL]
        uncertainty = prediction.uncertainty[TARGET_COL]

        # Compare estimate to actual value from test row
        is_correct = (estimate == test_row[TARGET_COL])

        # Collect results
        prediction_results.append({
            'is_correct': is_correct,
            'uncertainty': uncertainty
        })

    # 7. Evaluate prediction accuracy using different maximum uncertainty thresholds
    for maximum_uncertainty in MAXIMUM_UNCERTAINTY_THRESHOLDS:
        # Treat prediction results as unknown if uncertainty is above the maximum_uncertainty threshold
        unknown_prediction_results = [
            r for r in prediction_results
            if r['uncertainty'] > maximum_uncertainty
        ]
        unknown_count = len(unknown_prediction_results)

        # Only look at prediction results if uncertainty is below the maximum_uncertainty threshold
        known_prediction_results = [
            r for r in prediction_results
            if r['uncertainty'] <= maximum_uncertainty
        ]
        known_count = len(known_prediction_results)

        # Identify prediction results we looked at that are correct
        known_correct_prediction_results = [
            r for r in known_prediction_results if r['is_correct']
        ]
        known_correct_count = len(known_correct_prediction_results)

        print(
            "Predictions for {0} are {1:.0%} ({2}/{3}) correct with {4:.0%} "
            "({5}/{6}) ignored using a maximum uncertainty of {7}".format(
                TARGET_COL,
                0.0 if known_count == 0 else float(known_correct_count) / known_count,
                known_correct_count,
                known_count,
                float(unknown_count) / (known_count + unknown_count),
                unknown_count,
                known_count + unknown_count,
                maximum_uncertainty))
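This script relies on helper functions (read_csv, clean_data, split_rows) defined elsewhere in the example project. As a rough guide, a minimal sketch of what split_rows might look like, assuming it simply shuffles the rows and splits them at the given fraction:

import random

def split_rows(rows, train_frac):
    # Assumed behaviour: shuffle a copy of the rows, then cut the list so that
    # roughly train_frac of the rows land in the training subset and the
    # remainder in the test subset.
    shuffled = list(rows)
    random.shuffle(shuffled)
    cutoff = int(len(shuffled) * train_frac)
    return shuffled[:cutoff], shuffled[cutoff:]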
Example #8
def main():

    ##########
    # UPLOAD #
    ##########

    # 1. Define the schema for the table - specify column names and data types
    table_schema = {
        'age': {'type': 'count'},
        'sex': {'type': 'categorical'},
        'region': {'type': 'categorical'},
        'income': {'type': 'real'},
        'married': {'type': 'boolean'},
        'children': {'type': 'count'},
        'car': {'type': 'boolean'},
        'save_act': {'type': 'boolean'},
        'current_act': {'type': 'boolean'},
        'mortgage': {'type': 'boolean'},
        'pep': {'type': 'boolean'},
    }

    # 2. Load the data from csv and divide it into training and test subsets
    rows = read_csv(DATA_FILE)                                  # Load rows from CSV, returns all row data values as strings
    clean_data(rows, table_schema)                               # Convert row data values to correct types based on schema
    training_rows, test_rows = split_rows(rows, TRAIN_FRAC)     # Split into training and test sets

    # 3. Connect to the Veritable API
    api = veritable.connect()
    if api.table_exists(TABLE_ID):
        print("Deleting old table '%s'" %TABLE_ID)
        api.delete_table(TABLE_ID)

    # 4. Create a Veritable Table and upload training rows
    print("Creating table '%s' and uploading rows" %TABLE_ID)
    table = api.create_table(table_id=TABLE_ID)
    table.batch_upload_rows(training_rows)



    ###########
    # ANALYZE #
    ###########

    # 5. Create a Veritable Analysis and wait for it to complete
    print("Creating analysis '%s' and waiting for it to complete" %ANALYSIS_ID)
    analysis = table.create_analysis(schema=table_schema, analysis_id=ANALYSIS_ID)
    analysis.wait()



    ###########
    # PREDICT #
    ###########


    # 6. For each row in the test set, predict the value and uncertainty for the target column
    print("Making predictions")

    prediction_results = []
    for test_row in test_rows:
        # Prepare the prediction request
        prediction_request = test_row.copy()        # Copy known values from test row
        del prediction_request['_id']               # '_id' should not be present in prediction requests
        prediction_request[TARGET_COL] = None       # None values are predicted by Veritable

        # Make predictions
        prediction = analysis.predict(prediction_request, PRED_COUNT)

        # Derive a single value estimate and uncertainty metric
        estimate = prediction[TARGET_COL]
        uncertainty = prediction.uncertainty[TARGET_COL]

        # Compare estimate to actual value from test row
        is_correct = (estimate == test_row[TARGET_COL])

        # Collect results
        prediction_results.append({'is_correct': is_correct, 'uncertainty': uncertainty})


    # 7. Evaluate prediction accuracy using different maximum uncertainty thresholds
    for maximum_uncertainty in MAXIMUM_UNCERTAINTY_THRESHOLDS:
        # Treat prediction results as unknown if uncertainty is above the maximum_uncertainty threshold
        unknown_prediction_results = [r for r in prediction_results if r['uncertainty'] > maximum_uncertainty]
        unknown_count = len(unknown_prediction_results)

        # Only look at prediction results if uncertainty is below the maximum_uncertainty threshold
        known_prediction_results = [r for r in prediction_results if r['uncertainty'] <= maximum_uncertainty]
        known_count = len(known_prediction_results)

        # Identify prediction results we looked at that are correct
        known_correct_prediction_results = [r for r in known_prediction_results if r['is_correct']]
        known_correct_count = len(known_correct_prediction_results)

        print( "Predictions for {0} are {1:.0%} ({2}/{3}) correct with {4:.0%} ({5}/{6}) ignored using a maximum uncertainty of {7}".format(
                    TARGET_COL,
                    0.0 if known_count == 0 else float(known_correct_count) / known_count,
                    known_correct_count,
                    known_count,
                    float(unknown_count) / (known_count+unknown_count),
                    unknown_count,
                    known_count+unknown_count,
                    maximum_uncertainty ) )
 def setup_class(self):
     self.API = veritable.connect(TEST_API_KEY, TEST_BASE_URL,
         **connect_kwargs)
Example #10

MIN_RATINGS = 100
TABLE_NAME = 'movielens'

# load the item metadata from a static file; in a production system this
# information would likely come from a database
ITEMS = [it 
    for it in json.loads(open('recs/static/movie_descriptions.json').read())
    if it['num_ratings'] > MIN_RATINGS]
ITEMS.sort(key=lambda x: x['name'])
ITEM_NAMES = dict([(m['id'], m['name']) for m in ITEMS])

# connect to the Veritable API and perform baseline predictions; this will
# allow us to compute rating "lift" later
api = veritable.connect()
analysis = get_last_successful_analysis(api, TABLE_NAME)
baselines = get_baselines(analysis, ITEMS)
app = Flask(__name__)


def item_filter(per_item_preds, baseline_val):
    '''
    Decides whether an item should be considered for inclusion in the 
    recommendations. This version requires that three conditions be met:
    
    1. The item must have a reasonably high predicted rating (per_item_mean > 3.)
    2. The predictions must indicate that the user will rate the item higher than
       its baseline rating (lift > .2)
    3. The predictions must not be too uncertain regarding the positive 
       lift (conf > .75)
    '''
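The implementation that follows this docstring is not shown in this listing. A hypothetical reconstruction that satisfies the three documented conditions, assuming per_item_preds is a list of sampled rating predictions for one item, lift is the mean prediction minus the baseline, and conf is the fraction of samples above the baseline (all assumptions, not the original code):

def item_filter(per_item_preds, baseline_val):
    # Mean of the sampled predicted ratings for this item (assumption about
    # the structure of per_item_preds).
    per_item_mean = sum(per_item_preds) / float(len(per_item_preds))
    # Lift over the item's baseline rating (assumption).
    lift = per_item_mean - baseline_val
    # Confidence in a positive lift: fraction of samples above the baseline
    # (assumption).
    conf = sum(1. for p in per_item_preds if p > baseline_val) / len(per_item_preds)
    return per_item_mean > 3. and lift > .2 and conf > .75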
 def test_create_api_with_enable_gzip_false(self):
     veritable.connect(TEST_API_KEY, TEST_BASE_URL, enable_gzip=False,
         **connect_kwargs)
 def test_create_api_with_ssl_verify_false(self):
     veritable.connect(TEST_API_KEY, TEST_BASE_URL, ssl_verify=False,
         **connect_kwargs)
 def test_create_api_with_debug(self):
     veritable.connect(TEST_API_KEY, TEST_BASE_URL, debug=True,
         **connect_kwargs)
 def test_print_connection(self):
     api = veritable.connect(TEST_API_KEY, TEST_BASE_URL,
         **connect_kwargs)
     print(api._conn)
 def test_create_api(self):
     veritable.connect(TEST_API_KEY, TEST_BASE_URL, **connect_kwargs)
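Each of the tests above exercises a single keyword option of veritable.connect. For reference, a sketch combining the same options in one call (the option names come from the tests above; combining them like this is an assumption):

 def test_create_api_with_all_options(self):
     api = veritable.connect(TEST_API_KEY, TEST_BASE_URL, enable_gzip=False,
         ssl_verify=False, debug=True, **connect_kwargs)
     print(api._conn)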
Example #16
 def setup_class(self):
     self.API = veritable.connect(TEST_API_KEY, TEST_BASE_URL,
                                  **connect_kwargs)
import heart_disease.run
import random
import veritable

API = veritable.connect()


def test_example():
    heart_disease.run.TABLE_ID = 'heart-disease-example_' + str(
        random.randint(0, 100000000))
    heart_disease.run.main()
    API.delete_table(heart_disease.run.TABLE_ID)
    API.delete_table(heart_disease.run.TABLE_ID + "-binary")
def main():
    API = veritable.connect(ssl_verify=False)

    print("Loading and preparing data...")
    # load the data and schema describing all column datatypes
    with open(DATA_FILE, 'rb') as fd:
        data = json.loads(fd.read())

    with open(SCHEMA_FILE, 'rb') as fd:
        master_schema = json.loads(fd.read())

    # divide the data into a training and test set, and ensure data is
    # of the correct type for each column
    train_data, test_data = split_rows(data, .8)
    clean_data(train_data, master_schema, remove_extra_fields=True,
        assign_ids=True)

    # we have to account for the possibility that the training data doesn't
    # contain all of the columns in the master schema
    schema = subset_schema(master_schema, train_data)

    # use the subset of the schema to clean the test data - make sure we don't
    # condition test predictions on columns or categorical values that aren't
    # present in the training data
    clean_data(test_data, schema, remove_extra_fields=True, assign_ids=True)
    validate_test_categoricals(test_data, train_data, schema)

    # we'll run the analysis twice: one with the original multinomial target
    # column, and once converting it to a binary column
    def binary_transform(x):
        transform = {'0': False, '1': True, '2': True, '3': True, '4': True}
        return transform[x]

    # make the binary dataset and schema
    binary_train_data = deepcopy(train_data)
    binary_test_data = deepcopy(test_data)
    binary_schema = deepcopy(schema)
    binary_schema['target']['type'] = 'boolean'
    for d in (binary_train_data, binary_test_data):
        for r in d:
            if 'target' in r:
                r['target'] = binary_transform(r['target'])

    # delete existing tables if present
    if API.table_exists(TABLE_ID):
        print("Deleting old table '%s'" %TABLE_ID)
        API.delete_table(TABLE_ID)
    if API.table_exists(TABLE_ID+"-binary"):
        print("Deleting old table '%s'" %(TABLE_ID+"-binary"))
        API.delete_table(TABLE_ID+"-binary")

    # upload the data and start the analyses
    print("Uploading data and running analyses...")
    table = API.create_table(TABLE_ID)
    table.batch_upload_rows(train_data)
    analysis = table.create_analysis(schema)

    binary_table = API.create_table(TABLE_ID+"-binary")
    binary_table.batch_upload_rows(binary_train_data)
    binary_analysis = binary_table.create_analysis(binary_schema)

    # now we'll make predictions for each test row, collecting the
    # predicted values for the target column
    analysis.wait()
    print("Making predictions....")
    results = predict_known_target_column(test_data, analysis, schema,
        'target')

    # and for the binary table
    binary_analysis.wait()
    binary_results = predict_known_target_column(binary_test_data,
        binary_analysis, binary_schema, 'target')

    # summarize the results
    print("multinomial dataset, raw predictions: " \
    "{0}% test error".format(test_error(results, 'target') * 100))
    print("multinomial dataset, binary transform: " \
    "{0}% test error".format(test_error(results, 'target',
        transform=binary_transform) * 100))
    print("binary dataset, raw predictions: " \
    "{0}% test error".format(test_error(binary_results, 'target') * 100))
import heart_disease.run
import random
import veritable

API = veritable.connect()


def test_example():
    heart_disease.run.TABLE_ID = 'heart-disease-example_'+str(random.randint(0, 100000000))
    heart_disease.run.main()
    API.delete_table(heart_disease.run.TABLE_ID)
    API.delete_table(heart_disease.run.TABLE_ID+"-binary")