コード例 #1
0
def test_create_model():
    model = Model('test')
    case = Node({"handle": "case"})
    #  set_trace()
    case.props['days_to_enrollment'] = Property(
        {"handle": 'days_to_enrollment'})
    model.add_node(case)
    assert isinstance(model.nodes['case'], Node)
    assert model.props[('case', 'days_to_enrollment')]
    model.add_node({"handle": "sample"})
    assert model.nodes["sample"]
    assert isinstance(model.nodes["sample"], Node)
    assert model.nodes["sample"].model == 'test'
    case_id = Property({"handle": "case_id", "value_domain": "string"})
    model.add_prop(case, case_id)
    assert model.props[("case", "case_id")]
    assert model.props[("case", "case_id")].value_domain == 'string'
    assert 'case_id' in model.nodes['case'].props
    sample = model.nodes["sample"]
    of_case = Edge({"handle": "of_case", "src": sample, "dst": case})
    of_case.props['operator'] = Property({
        "handle": "operator",
        "value_domain": "boolean"
    })
    model.add_edge(of_case)
    assert model.edges[('of_case', 'sample', 'case')]
    assert model.contains(of_case.props['operator'])
    assert of_case.props['operator'].model == 'test'
    assert model.props[('of_case', 'sample', 'case', 'operator')]
    assert model.props[('of_case', 'sample', 'case',
                        'operator')].value_domain == 'boolean'
    dx = Property({"handle": "diagnosis", "value_domain": "value_set"})
    tm = Term({"value": "CRS"})
    model.add_prop(case, dx)
    model.add_terms(dx, tm, 'rockin_pneumonia', 'fungusamongus')
    assert {x.value
            for x in dx.terms.values()
            } == {'CRS', 'rockin_pneumonia', 'fungusamongus'}
コード例 #2
0
class MDF(object):
    default_mult = "one_to_one"
    default_type = "TBD"

    def __init__(self, *yaml_files, handle=None):
        """Create a :class:`Model` from MDF YAML files.
        :param str|file|url *yaml_files: MDF filenames or file objects, in desired merge order
        :param str handle: Handle (name) for the resulting Model
        :attribute model: the :class:`bento_meta.model.Model` created"""
        if not handle or not isinstance(handle, str):
            raise ArgError("arg handle= must be a str - name for model")
        self.handle = handle
        self.files = yaml_files
        self.schema = om.MergedOptions()
        self._model = None
        if self.files:
            self.load_yaml()
            self.create_model()
        else:
            warn("No MDF files provided to constructor")
        pass

    @property
    def model(self):
        """The :class:`bento_meta.model.Model` object created from the MDF input"""
        return self._model

    def load_yaml(self):
        """Load YAML files or open file handles specified in constructor"""
        yloader = yaml.loader.Loader
        for f in self.files:
            if isinstance(f, str):
                if re.match("(?:file|https?)://", f):
                    response = requests.get(f)
                    if not response.ok:
                        raise ArgError(
                            "Fetching url {} returned code {}".format(
                                response.url, response.status_code))
                    response.encoding = "utf8"
                    f = response.text
                else:
                    f = open(f, "r")
            try:
                yml = yaml.load(f, Loader=yloader)
                self.schema.update(yml)
            except ConstructorError as ce:
                print("YAML constructor failed in '{fn}':\n{e}".format(
                    fn=f.name, e=ce))
                raise ce
            except ParserError as pe:
                print("YAML parser failed in '{fn}':\n{e}".format(fn=f.name,
                                                                  e=pe))
                raise pe
            except Exception:
                raise

    def create_model(self):
        """Create :class:`Model` instance from loaded YAML
        Note: This is brittle, since the syntax of MDF is hard-coded into this method."""
        if not self.schema.keys():
            raise ValueError("attribute 'schema' not set - are yamls loaded?")
        self._model = Model(handle=self.handle)
        ynodes = self.schema["Nodes"]
        yedges = self.schema["Relationships"]
        ypropdefs = self.schema["PropDefinitions"]
        yunps = self.schema.get("UniversalNodeProperties")
        yurps = self.schema.get("UniversalRelationshipProperties")
        # create nodes
        for n in ynodes:
            yn = ynodes[n]
            init = {"handle": n, "model": self.handle}
            for a in ["category", "desc"]:
                if yn.get(a):
                    init[a] = yn[a]
            node = self._model.add_node(init)
            if yn.get("Tags"):
                tags = CollValue({}, owner=node, owner_key="tags")
                for t in yn["Tags"]:
                    tags[t] = Tag({"value": t})
                node["tags"] = tags
        # create edges (relationships)
        for e in yedges:
            ye = yedges[e]
            for ends in ye["Ends"]:
                init = {
                    "handle": e,
                    "model": self.handle,
                    "src": self._model.nodes[ends["Src"]],
                    "dst": self._model.nodes[ends["Dst"]],
                    "multiplicity": ends.get("Mul") or ye.get("Mul")
                    or MDF.default_mult,
                    "desc": ends.get("Desc") or ye.get("Desc"),
                }
                edge = self._model.add_edge(init)
                Tags = ye.get("Tags") or ends.get("Tags")
                if Tags:
                    tags = CollValue({}, owner=edge, owner_key="tags")
                    for t in Tags:
                        tags[t] = Tag({"value": t})
                        edge["tags"] = tags
        # create properties
        for ent in ChainMap(self._model.nodes, self._model.edges).values():
            if isinstance(ent, Node):
                pnames = ynodes[ent.handle]["Props"]
                if yunps:
                    pnames.extend(
                        yunps["mayHave"] if yunps.get("mayHave") else [])
                    pnames.extend(
                        yunps["mustHave"] if yunps.get("mustHave") else [])
            elif isinstance(ent, Edge):
                # props elts appearing Ends hash take
                # precedence over Props elt in the
                # handle's hash
                (hdl, src, dst) = ent.triplet
                [end] = [
                    e for e in yedges[hdl]["Ends"]
                    if e["Src"] == src and e["Dst"] == dst
                ]
                pnames = end.get("Props") or yedges[hdl].get("Props")
                if yurps:
                    pnames.extend(
                        yurps["mayHave"] if yurps.get("mayHave") else [])
                    pnames.extend(
                        yurps["mustHave"] if yurps.get("mustHave") else [])
            else:
                raise AttributeError(
                    "unhandled entity type {type} for properties".format(
                        type=type(ent).__name__))
            if pnames:
                for pname in pnames:
                    ypdef = ypropdefs.get(pname)
                    if not ypdef:
                        warn(
                            "property '{pname}' does not have a corresponding propdef"
                            .format(pname=pname))
                        break
                    init = {"handle": pname, "model": self.handle}
                    if ypdef.get("Type"):
                        init.update(self.calc_value_domain(ypdef["Type"]))
                    else:
                        init["value_domain"] = MDF.default_type
                    prop = self._model.add_prop(ent, init)
                    ent.props[prop.handle] = prop
                    if ypdef.get("Tags"):
                        tags = CollValue({}, owner=node, owner_key="tags")
                        for t in ypdef["Tags"]:
                            tags[t] = Tag({"value": t})
                        prop["tags"] = tags
        return self._model

    def calc_value_domain(self, typedef):
        if isinstance(typedef, dict):
            if typedef.get("pattern"):
                return {
                    "value_domain": "regexp",
                    "pattern": typedef["pattern"]
                }
            elif typedef.get("units"):
                return {
                    "value_domain": typedef.get("value_type"),
                    "units": ";".join(typedef.get("units")),
                }
            else:
                # punt
                warn("MDF type descriptor unrecognized: json looks like {j}".
                     format(j=json.dumps(typedef)))
                return {"value_domain": json.dumps(typedef)}
        elif isinstance(typedef,
                        list):  # a valueset: create value set and term objs
            vs = ValueSet({"_id": str(uuid4())})
            vs.handle = self.handle + vs._id[0:8]
            if re.match("^(?:https?|bolt)://", typedef[0]):  # looks like url
                vs.url = typedef[0]
            else:  # an enum
                for t in typedef:
                    vs.terms[t] = Term({"value": t})
            return {"value_domain": "value_set", "value_set": vs}
        else:
            return {"value_domain": MDF.default_type}