def test_merge(self):
    """Merging the fixture dataset with a freshly uploaded one yields a Dataset."""
    # already have one dataset in self.dataset; upload a second copy to merge with
    dataset = Dataset(path=self.CSV_FILE, connection=self.connection)
    result = Dataset.merge([self.dataset, dataset], connection=self.connection)
    # assertIsInstance reports both the value and the expected type on failure,
    # unlike assertTrue(isinstance(...)) which only says "False is not true"
    self.assertIsInstance(result, Dataset)
    self._cleanup(dataset)
    self._cleanup(result)
def test_merge_default_connection(self):
    """Merge works without an explicit connection= argument (uses the default)."""
    dataset = Dataset(path=self.CSV_FILE, connection=self.default_connection)
    other_dataset = Dataset(path=self.CSV_FILE, connection=self.default_connection)
    # no connection passed to merge(): exercises the default-connection path
    result = Dataset.merge([dataset, other_dataset])
    # assertIsInstance gives a descriptive failure message,
    # unlike assertTrue(isinstance(...))
    self.assertIsInstance(result, Dataset)
    self._cleanup(dataset)
    self._cleanup(other_dataset)
    self._cleanup(result)
def test_merge_fail(self):
    """Merging with a dataset backed by a bogus id returns a falsy result."""
    invalid = Dataset('12345', connection=self.connection)
    merged = Dataset.merge([self.dataset, invalid], connection=self.connection)
    self.assertFalse(merged)
def test_merge_bad_datasets(self):
    """Passing non-Dataset objects to merge() raises PyBambooException."""
    not_datasets = [{}, []]
    with self.assertRaises(PyBambooException):
        Dataset.merge(not_datasets, connection=self.connection)
state = dataset.get_info()['state'] print state bamboo_ids[sector]['originals'][name] = dataset.id with open(bamboo_id_file, 'wb') as f: f.write(json.dumps(bamboo_ids)) # merge originals for sector in bamboo_ids.keys(): if not bamboo_ids[sector]['merged']: print 'no merged dataset for sector: %s' % sector datasets = [ Dataset(connection=connection, dataset_id=id) for name, id in bamboo_ids[sector]['originals'].iteritems() ] print 'merging datasets: %s' % [dataset.id for dataset in datasets] merged = Dataset.merge(datasets, connection=connection) print 'merged: %s' % merged state = merged.get_info()['state'] while state != 'ready': time.sleep(1) state = merged.get_info()['state'] bamboo_ids[sector]['merged'] = merged.id with open(bamboo_id_file, 'wb') as f: f.write(json.dumps(bamboo_ids)) # add calculations print "starting: add calculations" for sector in bamboo_ids.keys(): print "adding calculation for sector %s" % sector calculations = [] with open('calculations/%s.txt' % sector) as f:
while state != 'ready': time.sleep(1) state = dataset.get_info()['state'] print state bamboo_ids[sector]['originals'][name] = dataset.id with open(bamboo_id_file, 'wb') as f: f.write(json.dumps(bamboo_ids)) # merge originals for sector in bamboo_ids.keys(): if not bamboo_ids[sector]['merged']: print 'no merged dataset for sector: %s' % sector datasets = [Dataset(connection=connection, dataset_id=id) for name, id in bamboo_ids[sector]['originals'].iteritems()] print 'merging datasets: %s' % [dataset.id for dataset in datasets] merged = Dataset.merge(datasets, connection=connection) print 'merged: %s' % merged state = merged.get_info()['state'] while state != 'ready': time.sleep(1) state = merged.get_info()['state'] bamboo_ids[sector]['merged'] = merged.id with open(bamboo_id_file, 'wb') as f: f.write(json.dumps(bamboo_ids)) # add calculations print "starting: add calculations" for sector in bamboo_ids.keys(): print "adding calculation for sector %s" % sector calculations = [] with open('calculations/%s.txt' % sector) as f: