Exemplo n.º 1
0
    def test_similar_row_from_datum_and_rate(self):
        filter_warning()
        recommender = Recommender.run(Config())
        loader = StubLoader()
        schema = Schema({'v': Schema.ID})
        dataset = Dataset(loader, schema)
        for (idx, row_id,
             result) in recommender.similar_row_from_datum_and_rate(dataset):
            self.assertEqual(0, len(result))

        # rate must be in (0, 1].
        def func():
            for _ in recommender.similar_row_from_datum_and_rate(dataset,
                                                                 rate=0.0):
                pass

        self.assertRaises(ValueError, lambda: func())

        def func():
            for _ in recommender.similar_row_from_datum_and_rate(dataset,
                                                                 rate=1.01):
                pass

        self.assertRaises(ValueError, lambda: func())

        schema = Schema({'v': Schema.NUMBER})
        dataset = Dataset(loader, schema)
        for (idx, row_id,
             result) in recommender.similar_row_from_datum_and_rate(dataset):
            self.assertEqual(None, row_id)  # there is no id in column_table
            self.assertEqual(
                0, len(result))  # there is no similar row in column_table

        recommender.stop()
Exemplo n.º 2
0
    def test_similar_row_from_id_and_score(self):
        filter_warning()
        recommender = Recommender.run(Config())
        loader = StubLoader()

        # dataset must have id when execute `similar_row_from_id_and_score`
        schema = Schema({'v': Schema.NUMBER})
        dataset = Dataset(loader, schema)

        def func():
            for _ in recommender.similar_row_from_id_and_score(dataset):
                pass

        self.assertRaises(RuntimeError, lambda: func())

        schema = Schema({'v': Schema.ID})
        dataset = Dataset(loader, schema)
        for (idx, row_id,
             result) in recommender.similar_row_from_id_and_score(dataset):
            self.assertEqual(str(idx + 1),
                             row_id)  # there is no id in column_table
            self.assertEqual(
                0, len(result))  # there is no similar row in column_table

        recommender.stop()
Exemplo n.º 3
0
  def test_simple(self):
    schema = Schema({
      'id': Schema.ID,
      'k1': Schema.STRING,
      'k2': Schema.NUMBER,
    })
    (row_id, d) = schema.transform({'id': 'user001', 'k1': 'abc', 'k2': '123'})

    self.assertEqual(row_id, 'user001')
    self.assertEqual({'k1': 'abc'}, dict(d.string_values))
    self.assertEqual({'k2': 123}, dict(d.num_values))
Exemplo n.º 4
0
    def test_simple(self):
        schema = Schema({
            'id': Schema.ID,
            'k1': Schema.STRING,
            'k2': Schema.NUMBER,
        })
        (row_id, d) = schema.transform({
            'id': 'user001',
            'k1': 'abc',
            'k2': '123'
        })

        self.assertEqual(row_id, 'user001')
        self.assertEqual({'k1': 'abc'}, dict(d.string_values))
        self.assertEqual({'k2': 123}, dict(d.num_values))
Exemplo n.º 5
0
    def test_update_row(self):
        recommender = Recommender.run(Config())
        loader = StubLoader()

        # dataset must have id when execute `update_row`
        schema = Schema({'v': Schema.NUMBER})
        dataset = Dataset(loader, schema)

        def func():
            for _ in recommender.update_row(dataset):
                pass

        self.assertRaises(RuntimeError, lambda: func())

        schema = Schema({'v': Schema.ID})
        dataset = Dataset(loader, schema)
        for (idx, row_id, result) in recommender.update_row(dataset):
            self.assertEqual(result, True)
        recommender.stop()
Exemplo n.º 6
0
    def test_similar_row_from_datum(self):
        filter_warning()
        recommender = Recommender.run(Config())
        loader = StubLoader()
        schema = Schema({'v': Schema.ID})
        dataset = Dataset(loader, schema)
        for (idx, row_id,
             result) in recommender.similar_row_from_datum(dataset):
            self.assertEqual(0, len(result))

        schema = Schema({'v': Schema.NUMBER})
        dataset = Dataset(loader, schema)
        for (idx, row_id,
             result) in recommender.similar_row_from_datum(dataset):
            self.assertEqual(None, row_id)  # there is no id in column_table
            self.assertEqual(
                0, len(result))  # there is no similar row in column_table

        recommender.stop()
Exemplo n.º 7
0
    def test_complete_row_from_datum(self):
        filter_warning()
        recommender = Recommender.run(Config())
        loader = StubLoader()

        schema = Schema({'v': Schema.ID})
        dataset = Dataset(loader, schema)
        for (idx, row_id, d) in recommender.complete_row_from_datum(dataset):
            self.assertEqual(0, len(d.string_values))
            self.assertEqual(0, len(d.num_values))
            self.assertEqual(0, len(d.binary_values))

        schema = Schema({'v': Schema.NUMBER})
        dataset = Dataset(loader, schema)
        for (idx, row_id, d) in recommender.complete_row_from_datum(dataset):
            self.assertEqual(None, row_id)  # there is no id in column_table.
            self.assertEqual(0, len(d.string_values))
            self.assertEqual(0, len(d.num_values))
            self.assertEqual(0, len(d.binary_values))

        recommender.stop()
Exemplo n.º 8
0
    def test_clear_row(self):
        recommender = Recommender.run(Config())
        loader = StubLoader()

        # dataset must have id when execute `clear_row`.
        schema = Schema({'v': Schema.NUMBER})
        dataset = Dataset(loader, schema)

        def func():
            for _ in recommender.clear_row(dataset):
                pass

        self.assertRaises(RuntimeError, lambda: func())

        schema = Schema({'v': Schema.ID})
        dataset = Dataset(loader, schema)

        # expect to get False when table is empty.
        for (idx, row_id, result) in recommender.clear_row(dataset):
            self.assertEqual(result, True)

        recommender.stop()
Exemplo n.º 9
0
    def test_complete_row_from_id(self):
        filter_warning()
        recommender = Recommender.run(Config())
        loader = StubLoader()

        # dataset must have id when execute `complete_row_from_id`
        schema = Schema({'v': Schema.NUMBER})
        dataset = Dataset(loader, schema)

        def func():
            for _ in recommender.complete_row_from_id(dataset):
                pass

        self.assertRaises(RuntimeError, lambda: func())

        schema = Schema({'v': Schema.ID})
        dataset = Dataset(loader, schema)
        for (idx, row_id, d) in recommender.complete_row_from_id(dataset):
            self.assertEqual(0, len(d.string_values))
            self.assertEqual(0, len(d.num_values))
            self.assertEqual(0, len(d.binary_values))

        recommender.stop()
Exemplo n.º 10
0
Using Recommender
========================================

This is a simple example that illustrates Recommender service usage.

"""

from jubakit.recommender import Recommender, Schema, Dataset, Config
from jubakit.loader.csv import CSVLoader

# Load a CSV file.
loader = CSVLoader('npb.csv')

# Define a Schema that defines types for each columns of the CSV file.
schema = Schema({
    'name': Schema.ID,
    'team': Schema.STRING,
}, Schema.NUMBER)

# Create a Dataset.
dataset = Dataset(loader, schema)

# Create an Recommender Service.
cfg = Config(method='lsh')
recommender = Recommender.run(cfg)

# Update the Recommender model.
for (idx, row_id, success) in recommender.update_row(dataset):
    pass

# Calculate the similarity in recommender model from row-id and display top-2 similar items.
print('{0}\n recommend similar players from row-id \n{1}'.format(