class Core: """Core of the semantics management, dealing with the RDFS and other Semantic triples. The only reason to have it in a separate class is for an easier maintainability. This is a common superclass only. In the present module, it is subclassed by a L{RDFS Closure<RDFClosure.RDFSClosure.RDFS_Semantics>} class and a L{OWL RL Closure<RDFClosure.OWLRL.OWLRL_Semantics>} classes. There are some methods that are implemented in the subclasses only, ie, this class cannot be used by itself! @ivar IMaxNum: maximal index of C{rdf:_i} occurrence in the graph @ivar literal_proxies: L{Literal Proxies with BNodes<RDFClosure.Literals.LiteralProxies>} for the graph @type literal_proxies: L{LiteralProxies<RDFClosure.Literals.LiteralProxies>} @ivar graph: the real graph @type graph: rdflib.Graph @ivar axioms: whether axioms should be added or not @type axioms: boolean @ivar daxioms: whether datatype axioms should be added or not @type daxioms: boolean @ivar added_triples: triples added to the graph, conceptually, during one processing cycle @type added_triples: set of triples @ivar error_messages: error messages (typically inconsistency messages in OWL RL) found during processing. These are added to the final graph at the very end as separate BNodes with error messages @type error_messages: array of strings @ivar rdfs: whether RDFS inference is also done (used in subclassed only) @type rdfs: boolean """ # noinspection PyUnusedLocal def __init__(self, graph, axioms, daxioms, rdfs=False): """ @param graph: the RDF graph to be extended @type graph: rdflib.Graph @param axioms: whether axioms should be added or not @type axioms: boolean @param daxioms: whether datatype axioms should be added or not @type daxioms: boolean @param rdfs: whether RDFS inference is also done (used in subclassed only) @type rdfs: boolean """ self._debug = debugGlobal # Calculate the maximum 'n' value for the '_i' type predicates (see Horst's paper) n = 1 maxnum = 0 cont = True while cont: cont = False predicate = ns_rdf[("_%d" % n)] for (s, p, o) in graph.triples((None, predicate, None)): # there is at least one if we got here maxnum = n n += 1 cont = True self.IMaxNum = maxnum self.graph = graph self.axioms = axioms self.daxioms = daxioms self.rdfs = rdfs self.error_messages = [] self.empty_stored_triples() def add_error(self, message): """ Add an error message @param message: error message @type message: string """ if message not in self.error_messages: self.error_messages.append(message) def pre_process(self): """ Do some pre-processing step. This method before anything else in the closure. By default, this method is empty, subclasses can add content to it by overriding it. """ pass def post_process(self): """ Do some post-processing step. This method when all processing is done, but before handling possible errors (ie, the method can add its own error messages). By default, this method is empty, subclasses can add content to it by overriding it. """ pass def rules(self, t, cycle_num): """ The core processing cycles through every tuple in the graph and dispatches it to the various methods implementing a specific group of rules. By default, this method raises an exception; indeed, subclasses I{must} add content to by overriding it. @param t: one triple on which to apply the rules @type t: tuple @param cycle_num: which cycle are we in, starting with 1. This value is forwarded to all local rules; it is also used locally to collect the bnodes in the graph. """ raise Exception("This method should not be called directly; subclasses should override it") def add_axioms(self): """ Add axioms. This is only a placeholder and raises an exception by default; subclasses I{must} fill this with real content """ raise Exception("This method should not be called directly; subclasses should override it") def add_d_axioms(self): """ Add d axioms. This is only a placeholder and raises an exception by default; subclasses I{must} fill this with real content """ raise Exception("This method should not be called directly; subclasses should override it") def one_time_rules(self): """ This is only a placeholder; subclasses should fill this with real content. By default, it is just an empty call. This set of rules is invoked only once and not in a cycle. """ pass # noinspection PyBroadException def get_literal_value(self, node): """ Return the literal value corresponding to a Literal node. Used in error messages. @param node: literal node @return: the literal value itself """ try: return self.literal_proxies.bnode_to_lit[node].lex except: # TODO: implement return "????" # noinspection PyAttributeOutsideInit def empty_stored_triples(self): """ Empty the internal store for triples """ self.added_triples = set() def flush_stored_triples(self): """ Send the stored triples to the graph, and empty the container """ for t in self.added_triples: self.graph.add(t) self.empty_stored_triples() def store_triple(self, t): """ In contrast to its name, this does not yet add anything to the graph itself, it just stores the tuple in an L{internal set<Core.added_triples>}. (It is important for this to be a set: some of the rules in the various closures may generate the same tuples several times.) Before adding the tuple to the set, the method checks whether the tuple is in the final graph already (if yes, it is not added to the set). The set itself is emptied at the start of every processing cycle; the triples are then effectively added to the graph at the end of such a cycle. If the set is actually empty at that point, this means that the cycle has not added any new triple, and the full processing can stop. @param t: the triple to be added to the graph, unless it is already there @type t: a 3-element tuple of (s,p,o) """ (s, p, o) = t if not(isinstance(s, rdflibLiteral) or isinstance(p, rdflibLiteral)) and t not in self.graph: if self._debug or offlineGeneration: print(t) self.added_triples.add(t) # noinspection PyAttributeOutsideInit def closure(self): """ Generate the closure the graph. This is the real 'core'. The processing rules store new triples via the L{separate method<store_triple>} which stores them in the L{added_triples<added_triples>} array. If that array is emtpy at the end of a cycle, it means that the whole process can be stopped. If required, the relevant axiomatic triples are added to the graph before processing in cycles. Similarly the exchange of literals against bnodes is also done in this step (and restored after all cycles are over). """ self.pre_process() # Handling the axiomatic triples. In general, this means adding all tuples in the list that # forwarded, and those include RDF or RDFS. In both cases the relevant parts of the container axioms should also # be added. if self.axioms: self.add_axioms() # Create the bnode proxy structure for literals self.literal_proxies = LiteralProxies(self.graph, self) # Add the datatype axioms, if needed (note that this makes use of the literal proxies, the order of the call # is important! if self.daxioms: self.add_d_axioms() self.flush_stored_triples() # Get first the 'one-time rules', ie, those that do not need an extra round in cycles down the line self.one_time_rules() self.flush_stored_triples() # Go cyclically through all rules until no change happens new_cycle = True cycle_num = 0 while new_cycle: # yes, there was a change, let us go again cycle_num += 1 # DEBUG: print the cycle number out if self._debug: print("----- Cycle #:%d" % cycle_num) # go through all rules, and collect the replies (to see whether any change has been done) # the new triples to be added are collected separately not to interfere with # the current graph yet self.empty_stored_triples() # Execute all the rules; these might fill up the added triples array for t in self.graph: self.rules(t, cycle_num) # Add the tuples to the graph (if necessary, that is). If any new triple has been generated, a new cycle # will be necessary... new_cycle = len(self.added_triples) > 0 for t in self.added_triples: self.graph.add(t) # All done, but we should restore the literals from their proxies self.literal_proxies.restore() self.post_process() self.flush_stored_triples() # Add possible error messages if self.error_messages: # I am not sure this is the right vocabulary to use for this purpose, but I haven't found anything! # I could, of course, come up with my own, but I am not sure that would be kosher... ERRNS = Namespace("http://www.daml.org/2002/03/agents/agent-ont#") self.graph.bind("err","http://www.daml.org/2002/03/agents/agent-ont#") for m in self.error_messages: message = BNode() self.graph.add((message, type, ERRNS['ErrorMessage'])) self.graph.add((message, ERRNS['error'], rdflibLiteral(m)))
class Core : """Core of the semantics management, dealing with the RDFS and other Semantic triples. The only reason to have it in a separate class is for an easier maintainability. This is a common superclass only. In the present module, it is subclassed by a L{RDFS Closure<RDFClosure.RDFSClosure.RDFS_Semantics>} class and a L{OWL RL Closure<RDFClosure.OWLRL.OWLRL_Semantics>} classes. There are some methods that are implemented in the subclasses only, ie, this class cannot be used by itself! @ivar IMaxNum: maximal index of C{rdf:_i} occurrence in the graph @ivar literal_proxies: L{Literal Proxies with BNodes<RDFClosure.Literals.LiteralProxies>} for the graph @type literal_proxies: L{LiteralProxies<RDFClosure.Literals.LiteralProxies>} @ivar graph: the real graph @type graph: rdflib.Graph @ivar axioms: whether axioms should be added or not @type axioms: boolean @ivar daxioms: whether datatype axioms should be added or not @type daxioms: boolean @ivar added_triples: triples added to the graph, conceptually, during one processing cycle @type added_triples: set of triples @ivar error_messages: error messages (typically inconsistency messages in OWL RL) found during processing. These are added to the final graph at the very end as separate BNodes with error messages @type error_messages: array of strings @ivar rdfs: whether RDFS inference is also done (used in subclassed only) @type rdfs: boolean """ # noinspection PyUnusedLocal def __init__(self, graph, axioms, daxioms, rdfs=False): """ @param graph: the RDF graph to be extended @type graph: rdflib.Graph @param axioms: whether axioms should be added or not @type axioms: boolean @param daxioms: whether datatype axioms should be added or not @type daxioms: boolean @param rdfs: whether RDFS inference is also done (used in subclassed only) @type rdfs: boolean """ self._debug = debugGlobal # Calculate the maximum 'n' value for the '_i' type predicates (see Horst's paper) n = 1 maxnum = 0 cont = True while cont: cont = False predicate = ns_rdf[("_%d" % n)] for (s, p, o) in graph.triples((None, predicate, None)): # there is at least one if we got here maxnum = n n += 1 cont = True self.IMaxNum = maxnum self.graph = graph self.axioms = axioms self.daxioms = daxioms self.rdfs = rdfs self.error_messages = [] self.empty_stored_triples() def add_error(self, message): """ Add an error message @param message: error message @type message: string """ if message not in self.error_messages: self.error_messages.append(message) def pre_process(self): """ Do some pre-processing step. This method before anything else in the closure. By default, this method is empty, subclasses can add content to it by overriding it. """ pass def post_process(self): """ Do some post-processing step. This method when all processing is done, but before handling possible errors (ie, the method can add its own error messages). By default, this method is empty, subclasses can add content to it by overriding it. """ pass def rules(self,t,cycle_num): """ The core processing cycles through every tuple in the graph and dispatches it to the various methods implementing a specific group of rules. By default, this method raises an exception; indeed, subclasses I{must} add content to by overriding it. @param t: one triple on which to apply the rules @type t: tuple @param cycle_num: which cycle are we in, starting with 1. This value is forwarded to all local rules; it is also used locally to collect the bnodes in the graph. """ raise Exception("This method should not be called directly; subclasses should override it") def add_axioms(self): """ Add axioms. This is only a placeholder and raises an exception by default; subclasses I{must} fill this with real content """ raise Exception("This method should not be called directly; subclasses should override it") def add_d_axioms(self): """ Add d axioms. This is only a placeholder and raises an exception by default; subclasses I{must} fill this with real content """ raise Exception("This method should not be called directly; subclasses should override it") def one_time_rules(self): """ This is only a placeholder; subclasses should fill this with real content. By default, it is just an empty call. This set of rules is invoked only once and not in a cycle. """ pass # noinspection PyBroadException def get_literal_value(self, node): """ Return the literal value corresponding to a Literal node. Used in error messages. @param node: literal node @return: the literal value itself """ try: return self.literal_proxies.bnode_to_lit[node].lex except: return "????" # noinspection PyAttributeOutsideInit def empty_stored_triples(self): """ Empty the internal store for triples """ self.added_triples = set() def flush_stored_triples(self): """ Send the stored triples to the graph, and empty the container """ for t in self.added_triples: self.graph.add(t) self.empty_stored_triples() def store_triple(self, t): """ In contrast to its name, this does not yet add anything to the graph itself, it just stores the tuple in an L{internal set<Core.added_triples>}. (It is important for this to be a set: some of the rules in the various closures may generate the same tuples several times.) Before adding the tuple to the set, the method checks whether the tuple is in the final graph already (if yes, it is not added to the set). The set itself is emptied at the start of every processing cycle; the triples are then effectively added to the graph at the end of such a cycle. If the set is actually empty at that point, this means that the cycle has not added any new triple, and the full processing can stop. @param t: the triple to be added to the graph, unless it is already there @type t: a 3-element tuple of (s,p,o) """ (s, p, o) = t if not(isinstance(s, rdflibLiteral) or isinstance(p, rdflibLiteral)) and t not in self.graph: if self._debug or offlineGeneration: print t self.added_triples.add(t) # noinspection PyAttributeOutsideInit def closure(self): """ Generate the closure the graph. This is the real 'core'. The processing rules store new triples via the L{separate method<store_triple>} which stores them in the L{added_triples<added_triples>} array. If that array is emtpy at the end of a cycle, it means that the whole process can be stopped. If required, the relevant axiomatic triples are added to the graph before processing in cycles. Similarly the exchange of literals against bnodes is also done in this step (and restored after all cycles are over). """ self.pre_process() # Handling the axiomatic triples. In general, this means adding all tuples in the list that # forwarded, and those include RDF or RDFS. In both cases the relevant parts of the container axioms should also # be added. if self.axioms: self.add_axioms() # Create the bnode proxy structure for literals self.literal_proxies = LiteralProxies(self.graph, self) # Add the datatype axioms, if needed (note that this makes use of the literal proxies, the order of the call is important! if self.daxioms: self.add_d_axioms() self.flush_stored_triples() # Get first the 'one-time rules', ie, those that do not need an extra round in cycles down the line self.one_time_rules() self.flush_stored_triples() # Go cyclically through all rules until no change happens new_cycle = True cycle_num = 0 while new_cycle: # yes, there was a change, let us go again cycle_num += 1 # DEBUG: print the cycle number out if self._debug: print "----- Cycle #:%d" % cycle_num # go through all rules, and collect the replies (to see whether any change has been done) # the new triples to be added are collected separately not to interfere with # the current graph yet self.empty_stored_triples() # Execute all the rules; these might fill up the added triples array for t in self.graph: self.rules(t, cycle_num) # Add the tuples to the graph (if necessary, that is). If any new triple has been generated, a new cycle # will be necessary... new_cycle = len(self.added_triples) > 0 for t in self.added_triples: self.graph.add(t) # All done, but we should restore the literals from their proxies self.literal_proxies.restore() self.post_process() self.flush_stored_triples() # Add possible error messages if self.error_messages: # I am not sure this is the right vocabulary to use for this purpose, but I haven't found anything! # I could, of course, come up with my own, but I am not sure that would be kosher... ERRNS = Namespace("http://www.daml.org/2002/03/agents/agent-ont#") self.graph.bind("err","http://www.daml.org/2002/03/agents/agent-ont#") for m in self.error_messages: message = BNode() self.graph.add((message, type, ERRNS['ErrorMessage'])) self.graph.add((message, ERRNS['error'], rdflibLiteral(m)))
def closure(self): """ Generate the closure the graph. This is the real 'core'. The processing rules store new triples via the L{separate method<store_triple>} which stores them in the L{added_triples<added_triples>} array. If that array is emtpy at the end of a cycle, it means that the whole process can be stopped. If required, the relevant axiomatic triples are added to the graph before processing in cycles. Similarly the exchange of literals against bnodes is also done in this step (and restored after all cycles are over). """ self.pre_process() # Handling the axiomatic triples. In general, this means adding all tuples in the list that # forwarded, and those include RDF or RDFS. In both cases the relevant parts of the container axioms should also # be added. if self.axioms: self.add_axioms() # Create the bnode proxy structure for literals self.literal_proxies = LiteralProxies(self.graph, self) # Add the datatype axioms, if needed (note that this makes use of the literal proxies, the order of the call # is important! if self.daxioms: self.add_d_axioms() self.flush_stored_triples() # Get first the 'one-time rules', ie, those that do not need an extra round in cycles down the line self.one_time_rules() self.flush_stored_triples() # Go cyclically through all rules until no change happens new_cycle = True cycle_num = 0 while new_cycle: # yes, there was a change, let us go again cycle_num += 1 # DEBUG: print the cycle number out if self._debug: print("----- Cycle #:%d" % cycle_num) # go through all rules, and collect the replies (to see whether any change has been done) # the new triples to be added are collected separately not to interfere with # the current graph yet self.empty_stored_triples() # Execute all the rules; these might fill up the added triples array for t in self.graph: self.rules(t, cycle_num) # Add the tuples to the graph (if necessary, that is). If any new triple has been generated, a new cycle # will be necessary... new_cycle = len(self.added_triples) > 0 for t in self.added_triples: self.graph.add(t) # All done, but we should restore the literals from their proxies self.literal_proxies.restore() self.post_process() self.flush_stored_triples() # Add possible error messages if self.error_messages: # I am not sure this is the right vocabulary to use for this purpose, but I haven't found anything! # I could, of course, come up with my own, but I am not sure that would be kosher... ERRNS = Namespace("http://www.daml.org/2002/03/agents/agent-ont#") self.graph.bind("err","http://www.daml.org/2002/03/agents/agent-ont#") for m in self.error_messages: message = BNode() self.graph.add((message, type, ERRNS['ErrorMessage'])) self.graph.add((message, ERRNS['error'], rdflibLiteral(m)))
def closure(self): """ Generate the closure the graph. This is the real 'core'. The processing rules store new triples via the L{separate method<store_triple>} which stores them in the L{added_triples<added_triples>} array. If that array is emtpy at the end of a cycle, it means that the whole process can be stopped. If required, the relevant axiomatic triples are added to the graph before processing in cycles. Similarly the exchange of literals against bnodes is also done in this step (and restored after all cycles are over). """ self.pre_process() # Handling the axiomatic triples. In general, this means adding all tuples in the list that # forwarded, and those include RDF or RDFS. In both cases the relevant parts of the container axioms should also # be added. if self.axioms: self.add_axioms() # Create the bnode proxy structure for literals self.literal_proxies = LiteralProxies(self.graph, self) # Add the datatype axioms, if needed (note that this makes use of the literal proxies, the order of the call is important! if self.daxioms: self.add_d_axioms() self.flush_stored_triples() # Get first the 'one-time rules', ie, those that do not need an extra round in cycles down the line self.one_time_rules() self.flush_stored_triples() # Go cyclically through all rules until no change happens new_cycle = True cycle_num = 0 while new_cycle: # yes, there was a change, let us go again cycle_num += 1 # DEBUG: print the cycle number out if self._debug: print "----- Cycle #:%d" % cycle_num # go through all rules, and collect the replies (to see whether any change has been done) # the new triples to be added are collected separately not to interfere with # the current graph yet self.empty_stored_triples() # Execute all the rules; these might fill up the added triples array for t in self.graph: self.rules(t, cycle_num) # Add the tuples to the graph (if necessary, that is). If any new triple has been generated, a new cycle # will be necessary... new_cycle = len(self.added_triples) > 0 for t in self.added_triples: self.graph.add(t) # All done, but we should restore the literals from their proxies self.literal_proxies.restore() self.post_process() self.flush_stored_triples() # Add possible error messages if self.error_messages: # I am not sure this is the right vocabulary to use for this purpose, but I haven't found anything! # I could, of course, come up with my own, but I am not sure that would be kosher... ERRNS = Namespace("http://www.daml.org/2002/03/agents/agent-ont#") self.graph.bind("err","http://www.daml.org/2002/03/agents/agent-ont#") for m in self.error_messages: message = BNode() self.graph.add((message, type, ERRNS['ErrorMessage'])) self.graph.add((message, ERRNS['error'], rdflibLiteral(m)))