Beispiel #1
0
import pkgutil

from backport import OrderedDict

import dedupe.variables
import dedupe.variables.base as base
from dedupe.variables.base import MissingDataType
from dedupe.variables.interaction import InteractionType

# Import every module that pkgutil finds under the dedupe.variables
# package path, using its fully qualified 'dedupe.variables.<name>' name.
# NOTE(review): presumably done so that all FieldType subclasses are
# defined before the lookup below runs -- confirm against
# base.allSubclasses.
for _, module, _ in pkgutil.iter_modules(dedupe.variables.__path__,
                                         'dedupe.variables.'):
    __import__(module)

# Dictionary built from the pairs produced by base.allSubclasses for
# base.FieldType.
# NOTE(review): key/value meaning (likely type name -> class) is not
# visible here -- verify in dedupe.variables.base.
FIELD_CLASSES = dict(base.allSubclasses(base.FieldType))


class DataModel(dict):
    """Dict-based description of the variables built from a field definition.

    Keys set on construction:
        'bias'   -- initialised to 0.
        'fields' -- the list returned by ``typifyFields``, extended in
                    place with the results of ``interactions`` and
                    ``missing``.

    Attributes set on construction:
        primary_fields -- first value returned by ``typifyFields``.
        derived_start  -- length of the variable list before anything
                          was appended to it.
        n_fields       -- final length of the 'fields' list.
    """

    def __init__(self, fields):
        """Populate the model from ``fields``.

        fields -- field definition passed to ``typifyFields`` and
                  ``interactions``.
        """
        self['bias'] = 0

        primary_fields, variables = typifyFields(fields)
        self.primary_fields = primary_fields

        # Everything appended below lives at or after this index.
        self.derived_start = len(variables)

        variables += interactions(fields, primary_fields)
        # missing() receives the list *after* the interaction results
        # have been added to it.
        variables += missing(variables)

        self['fields'] = variables
        self.n_fields = len(variables)
Beispiel #2
0
import pkgutil

import numpy
import copyreg

import dedupe.variables
import dedupe.variables.base as base
from dedupe.variables.base import MissingDataType
from dedupe.variables.interaction import InteractionType

# Import every module that pkgutil finds under the dedupe.variables
# package path, using its fully qualified 'dedupe.variables.<name>' name.
# NOTE(review): presumably done so that all FieldType subclasses are
# defined before the lookup below runs -- confirm against
# base.allSubclasses.
for _, module, _ in pkgutil.iter_modules(dedupe.variables.__path__,
                                         'dedupe.variables.'):
    __import__(module)

# Dictionary of the (k, v) pairs produced by base.allSubclasses for
# base.FieldType, keeping only pairs whose key is truthy.
# NOTE(review): key/value meaning (likely type name -> class) is not
# visible here -- verify in dedupe.variables.base.
FIELD_CLASSES = {k: v for k, v in base.allSubclasses(base.FieldType) if k}


class DataModel(object):
    """Holds the variables built from a field definition.

    Attributes set on construction:
        primary_fields         -- first value returned by ``typifyFields``.
        _derived_start         -- length of the variable list before
                                  anything was appended to it.
        _missing_field_indices -- result of ``missing_field_indices`` on
                                  the complete variable list.
        _interaction_indices   -- result of ``interaction_indices`` on
                                  the complete variable list.
        _variables             -- the complete variable list.
    """

    def __init__(self, fields):
        """Build the variable list for ``fields`` and index it.

        fields -- field definition passed to ``typifyFields`` and
                  ``interactions``.
        """
        primary_fields, model_variables = typifyFields(fields)

        # Remember where the appended variables begin before growing
        # the list.
        derived_start = len(model_variables)

        model_variables += interactions(fields, primary_fields)
        # missing() receives the list *after* the interaction results
        # have been added to it.
        model_variables += missing(model_variables)

        missing_indices = missing_field_indices(model_variables)
        interaction_idx = interaction_indices(model_variables)

        self.primary_fields = primary_fields
        self._derived_start = derived_start
        self._missing_field_indices = missing_indices
        self._interaction_indices = interaction_idx
        self._variables = model_variables
Beispiel #3
0
import pkgutil

from collections import OrderedDict

import dedupe.variables
import dedupe.variables.base as base
from dedupe.variables.base import MissingDataType
from dedupe.variables.interaction import InteractionType

# Import every module that pkgutil finds under the dedupe.variables
# package path, using its fully qualified 'dedupe.variables.<name>' name.
# NOTE(review): presumably done so that all FieldType subclasses are
# defined before the lookup below runs -- confirm against
# base.allSubclasses.
for _, module, _  in pkgutil.iter_modules(dedupe.variables.__path__, 
                                          'dedupe.variables.') :
    __import__(module)


# Dictionary built from the pairs produced by base.allSubclasses for
# base.FieldType.
# NOTE(review): key/value meaning (likely type name -> class) is not
# visible here -- verify in dedupe.variables.base.
FIELD_CLASSES = dict(base.allSubclasses(base.FieldType))

class DataModel(dict):
    """Mapping that records the variables derived from a field definition.

    After construction the mapping contains ``'bias'`` (set to 0) and
    ``'fields'`` (the list from ``typifyFields`` grown in place by the
    results of ``interactions`` and ``missing``).  The instance also
    carries ``primary_fields``, ``derived_start`` (list length before
    anything was appended) and ``n_fields`` (final list length).
    """

    def __init__(self, fields):
        """Fill the mapping and bookkeeping attributes from ``fields``.

        fields -- field definition passed to ``typifyFields`` and
                  ``interactions``.
        """
        self['bias'] = 0

        primary_fields, field_variables = typifyFields(fields)
        n_before_derived = len(field_variables)

        # Grow the same list object in place; missing() is called on the
        # list once the interaction results are already part of it.
        field_variables += interactions(fields, primary_fields)
        field_variables += missing(field_variables)

        self.derived_start = n_before_derived
        self['fields'] = field_variables
        self.n_fields = len(field_variables)
        self.primary_fields = primary_fields
Beispiel #4
0
import numpy
import copyreg
import types

import dedupe.variables
import dedupe.variables.base as base
from dedupe.variables.base import MissingDataType
from dedupe.variables.interaction import InteractionType

# Import every module that pkgutil finds under the dedupe.variables
# package path, using its fully qualified 'dedupe.variables.<name>' name.
# NOTE(review): presumably done so that all FieldType subclasses are
# defined before the lookup below runs -- confirm against
# base.allSubclasses.
# NOTE(review): the import list directly above this loop does not import
# pkgutil -- confirm it is imported elsewhere, otherwise this raises
# NameError.
for _, module, _ in pkgutil.iter_modules(dedupe.variables.__path__,
                                         'dedupe.variables.'):
    __import__(module)


# Dictionary of the (k, v) pairs produced by base.allSubclasses for
# base.FieldType, keeping only pairs whose key is truthy.
# NOTE(review): key/value meaning (likely type name -> class) is not
# visible here -- verify in dedupe.variables.base.
FIELD_CLASSES = {k: v for k, v in base.allSubclasses(base.FieldType) if k}


class DataModel(object):
    # Holds the variables built from a field definition.
    # NOTE(review): this definition may continue past the portion
    # reviewed here; only the visible statements are documented.

    def __init__(self, fields):
        """Build the variable list for ``fields`` and index it.

        fields -- field definition passed to ``typifyFields`` and
                  ``interactions``.
        """

        primary_fields, variables = typifyFields(fields)
        self.primary_fields = primary_fields
        # Length of the list before anything is appended below, i.e. the
        # index at which the appended variables start.
        self._derived_start = len(variables)

        # The list is grown in place; missing() is called on it after
        # the interaction results have already been added.
        variables += interactions(fields, primary_fields)
        variables += missing(variables)

        # Both index helpers are given the complete variable list.
        self._missing_field_indices = missing_field_indices(variables)
        self._interaction_indices = interaction_indices(variables)