Python ensure_unicode示例，Cerebrum.modules.xmlutils.xml2object.ensure_unicode Python示例

示例#1

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

    def _make_contact(self, elem, priority):
        """Return a DataContact instance built from elem, or None.

        elem is searched for a <Type> child naming the kind of contact and
        a <Verdi> child holding the value. None is returned when:

        - <Type> is missing or has no text,
        - the (stripped) text of <Type> is not a known contact kind,
        - <Verdi> is missing or has no text.

        The stripped value is passed through deuglify_phone() and stored,
        together with priority, in the resulting DataContact.
        """

        kommtype2const = {
            u"Faks arbeid": DataContact.CONTACT_FAX,
            u"Telefaks midlertidig arbeidssted": DataContact.CONTACT_FAX,
            u"Arbeidstelefon 1": DataContact.CONTACT_PHONE,
            u"Arbeidstelefon 2": DataContact.CONTACT_PHONE,
            u"Arbeidstelefon 3": DataContact.CONTACT_PHONE,
            u"Mobilnummer, jobb": DataContact.CONTACT_MOBILE_WORK,
            u"Mobilnummer, privat": DataContact.CONTACT_MOBILE_PRIVATE,
            u"Privat mobil synlig på web":
                DataContact.CONTACT_MOBILE_PRIVATE_PUBLIC,
        }

        ctype = elem.find("Type")
        # An empty <Type/> has text None; treat it like a missing element
        # rather than failing on None.strip().
        if ctype is None or ctype.text is None:
            return None

        kind = kommtype2const.get(
            ensure_unicode(ctype.text.strip(), self.encoding))
        if kind is None:
            return None

        verdi = elem.find("Verdi")
        # Without a value element (or with an empty one) there is nothing
        # to register.
        if verdi is None or verdi.text is None:
            return None

        cvalue = deuglify_phone(
            ensure_unicode(verdi.text.strip(), self.encoding))

        return DataContact(kind, cvalue, priority)

示例#2

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

    def _make_contact(self, element):
        comm_type = element.find("Type")
        value = element.find("Verdi")
        if comm_type is None or value is None or value.text is None:
            return None

        priority = element.find("Prioritet")
        if (priority is not None and priority.text is not None
                and priority.text.isdigit()):
            priority = int(priority.text)
        else:
            return None

        comm2const = {
            "E-post adresse": DataContact.CONTACT_EMAIL,
            "Telefax": DataContact.CONTACT_FAX,
            "Telefon1": DataContact.CONTACT_PHONE,
            "Telefon2": DataContact.CONTACT_PHONE,
            "URL": DataContact.CONTACT_URL,
        }
        comm_type = ensure_unicode(comm_type.text, self.encoding)
        if comm_type not in comm2const:
            return None

        value = ensure_unicode(value.text, self.encoding)
        if comm_type in ("Telefax", "Telefon1", "Telefon2"):
            value = deuglify_phone(value)

        return DataContact(comm2const[comm_type], value, priority)

示例#3

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

    def _make_contact(self, element):
        comm_type = element.find("Type")
        value = element.find("Verdi")
        if comm_type is None or value is None or value.text is None:
            return None

        priority = element.find("Prioritet")
        if (
                priority is not None and
                priority.text is not None and
                priority.text.isdigit()
        ):
            priority = int(priority.text)
        else:
            return None

        comm2const = {
            "E-post adresse": DataContact.CONTACT_EMAIL,
            "Telefax": DataContact.CONTACT_FAX,
            "Telefon1": DataContact.CONTACT_PHONE,
            "Telefon2": DataContact.CONTACT_PHONE,
            "URL": DataContact.CONTACT_URL,
        }
        comm_type = ensure_unicode(comm_type.text, self.encoding)
        if comm_type not in comm2const:
            return None

        value = ensure_unicode(value.text, self.encoding)
        if comm_type in ("Telefax", "Telefon1", "Telefon2"):
            value = deuglify_phone(value)

        return DataContact(comm2const[comm_type], value, priority)

示例#4

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

    def _make_names(self, sub):
        """Extract name information from XML element sub.

        Returns a list of DataName instances, one for every <Akronym>,
        <Navn20> and <Navn120> element with text found in sub (sub itself
        included). All names share the language given by the first <Sprak>
        descendant, where "no" is mapped to "nb".

        An empty list is returned when there is no language, or when the
        language is not one of the accepted ones.
        """

        tag2kind = {
            "Akronym": DataOU.NAME_ACRONYM,
            "Navn20": DataOU.NAME_SHORT,
            "Navn120": DataOU.NAME_LONG,
        }

        language = sub.findtext(".//Sprak")
        # Without a language the names cannot be registered. Bail out here
        # instead of failing on None.lower() further down.
        if not language:
            return []

        # Common mistake. The keys are, like, right next to each other.
        if language.lower() == "no":
            language = "nb"

        # It has been decided that we need to consider nn/nb/en only
        if language.lower() not in ("nn", "nb", "ny", "en"):
            return []

        # Accumulate the results. One <stednavn> gives rise to several
        # DataName instances.
        result = []
        # Element.iter() replaces getiterator(), which is gone from
        # xml.etree as of Python 3.9.
        for tmp in sub.iter():
            if tmp.tag not in tag2kind or not tmp.text:
                continue
            result.append(
                DataName(tag2kind[tmp.tag],
                         ensure_unicode(tmp.text.strip(), self.encoding),
                         language))

        return result

示例#5

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

    def _make_names(self, sub):
        """Extract name information from XML element sub.

        Every <Akronym>, <Navn20> and <Navn120> element with text found in
        sub (sub itself included) becomes one DataName in the returned
        list. The language of all names is taken from the first <Sprak>
        descendant, with "no" mapped to "nb".

        An empty list is returned when the language is missing or is not
        one of the accepted ones.
        """

        tag2kind = {"Akronym": DataOU.NAME_ACRONYM,
                    "Navn20": DataOU.NAME_SHORT,
                    "Navn120": DataOU.NAME_LONG, }

        language = sub.findtext(".//Sprak")
        # No <Sprak> means findtext() gave us None; there is nothing we can
        # register then, and calling .lower() on it would fail.
        if not language:
            return []

        # Common mistake. The keys are, like, right next to each other.
        if language.lower() == "no":
            language = "nb"

        # It has been decided that we need to consider nn/nb/en only
        if language.lower() not in ("nn", "nb", "ny", "en"):
            return []

        # Accumulate the results. One <stednavn> gives rise to several
        # DataName instances.
        result = []
        # getiterator() no longer exists in xml.etree on Python 3.9+;
        # iter() walks the same elements.
        for tmp in sub.iter():
            if tmp.tag not in tag2kind or not tmp.text:
                continue
            result.append(DataName(tag2kind[tmp.tag],
                                   ensure_unicode(tmp.text.strip(),
                                                  self.encoding),
                                   language))

        return result

示例#6

0

显示文件

文件： fsxml2object.py 项目： unioslo/cerebrum

    def _make_contact(self, element):
        """Translate a contact XML element into a (kind, value) pair.

        The kind is derived from the "kommtypekode" attribute and the value
        is read from "kommnrverdi". (None, None) is returned when the value
        is empty or the type code is not TLF, EKSTRA TLF or FAX.
        """
        code = ensure_unicode(element.get("kommtypekode"), self.encoding)
        number = ensure_unicode(element.get("kommnrverdi"), self.encoding)

        if number:
            # Both phone codes map onto the same contact kind.
            if code in ("TLF", "EKSTRA TLF"):
                return DataContact.CONTACT_PHONE, number
            if code == "FAX":
                return DataContact.CONTACT_FAX, number

        return None, None

示例#7

0

显示文件

文件： ltxml2object.py 项目： Narvik-kommune/cerebrum

    def _make_contact(self, elem, contact_prefs):
        """Derive contact information from LT data.

        We do not have the exact meanings, so this is guesswork. One element
        can result in multiple contact entries.
        """

        result = list()
        if elem.tag == "arbtlf":
            if int(elem.get("telefonnr")):
                result.append(
                    (DataContact.CONTACT_PHONE, elem.get("telefonnr")))
            if int(elem.get("linjenr")):
                result.append(
                    (DataContact.CONTACT_PHONE, "%i%05i" %
                     (int(elem.get("innvalgnr")), int(elem.get("linjenr")))))
            # fi
        elif elem.tag == "komm":
            comm_type = elem.get("kommtypekode")
            value = elem.get("kommnrverdi", elem.get("telefonnr", None))
            if (comm_type in (
                    "ARBTLF",
                    "EKSTRA TLF",
                    "JOBBTLFUTL",
            ) and value):
                result.append((DataContact.CONTACT_PHONE,
                               ensure_unicode(value, self.encoding)))
            if comm_type in ("FAX", "FAXUTLAND") and value:
                result.append((DataContact.CONTACT_FAX,
                               ensure_unicode(value, self.encoding)))
            # fi
        # fi

        # Since we do not have priority data, we'll simple assign priorities
        # on per category basis.
        tmp = list()
        for c_kind, c_value in result:
            priority = contact_prefs.get(c_kind, 0)
            contact_prefs[c_kind] = priority + 1
            tmp.append(DataContact(c_kind, c_value, priority))
        # od

        return tmp

示例#8

0

显示文件

文件： ltxml2object.py 项目： unioslo/cerebrum

    def _register_names(self, result, element):
        attr2type = {
            "fornavn": result.NAME_FIRST,
            "etternavn": result.NAME_LAST,
            "tittel_personlig": result.NAME_TITLE,
        }

        for kind, value in element.items():
            if kind in attr2type:
                result.add_name(DataName(attr2type[kind],
                                         ensure_unicode(value, self.encoding)))

示例#9

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

    def _make_address(self, addr_element):
        """Make a DataAddress instance out of an <Adresse>.

        addr_element must be an <Adresse> element. Its sub-elements with
        text are mapped onto the address fields: <Gateadresse> is put first
        in the street lines and <Adressetillegg> is appended after it,
        <Postnummer>, <Poststed> and <Landkode> give zip, city and country,
        and <Type> selects the address kind. <CO> is ignored.

        Returns None when the address kind is missing or unknown, or when
        the postal code is longer than 8 characters.
        """

        assert addr_element.tag == "Adresse"

        sap2intern = {
            "Besøksadresse": DataAddress.ADDRESS_BESOK,
            "Postadresse": DataAddress.ADDRESS_POST,
            "Bostedsadresse": DataAddress.ADDRESS_PRIVATE,
            "Avvikende postadresse": DataAddress.ADDRESS_OTHER_POST,
            "Avvikende besøksadresse": DataAddress.ADDRESS_OTHER_BESOK,
        }

        # Named postal_code rather than zip, so the builtin is not shadowed.
        postal_code = city = country = addr_kind = ""
        street = []

        # Element.iter() replaces getiterator(), which has been removed
        # from xml.etree in Python 3.9.
        for sub in addr_element.iter():
            if not sub.text:
                continue
            value = ensure_unicode(sub.text.strip(), self.encoding)

            if sub.tag == "Gateadresse":
                street.insert(0, value)
            elif sub.tag == "Adressetillegg":
                street.append(value)
            elif sub.tag == "Postnummer":
                # IVR 2007-01-04 FIXME: 8 is the length of the field in the
                # database. It's a bit ugly to do things this way, though.
                if len(value) > 8:
                    return None
                postal_code = value
            elif sub.tag == "Poststed":
                city = value
            elif sub.tag == "Landkode":
                country = value
            elif sub.tag == "Type":
                addr_kind = sap2intern.get(value, "")
            # <CO> is deliberately not imported: CO-fields don't seem to be
            # registered intentionally or with any kind of plan and
            # regularity. To be re-evaluated at a later time.
            # Jazz, 2011-10-28

        # If we do not know the address kind, we *cannot* register it.
        if not addr_kind:
            return None

        return DataAddress(kind=addr_kind,
                           street=street,
                           zip=postal_code,
                           city=city,
                           country=country)

示例#10

0

显示文件

文件： ltxml2object.py 项目： Narvik-kommune/cerebrum

    def _register_names(self, result, element):
        attr2type = {
            "fornavn": result.NAME_FIRST,
            "etternavn": result.NAME_LAST,
            "tittel_personlig": result.NAME_TITLE,
        }

        for kind, value in element.items():
            if kind in attr2type:
                result.add_name(
                    DataName(attr2type[kind],
                             ensure_unicode(value, self.encoding)))

示例#11

0

显示文件

文件： ltxml2object.py 项目： Narvik-kommune/cerebrum

    def _pull_name(self, element, *possible_keys):
        """Return a first of possible_keys that is present in element."""
        for key in possible_keys:
            if element.get(key):
                value = ensure_unicode(element.get(key), self.encoding)
                return value
            # fi
        # od

        # NB! A name that is not there *must* be represented as None. "" (empty
        # string) is NOT the same as no name.
        return None

示例#12

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

    def _make_sgm(self, element):
        """Build a DataExternalWork (sgm) object from element.

        Name, type and extent are the texts of the first <OrgNavn>,
        <OrgType> and <Omfang> descendants, taken as they are. <Startdato>
        and <Sluttdato> are parsed as %Y-%m-%d dates, or become None when
        missing or empty. The description is the text of <Tekst>.
        """

        def date_at(path):
            # Missing and empty date elements both count as "no date".
            text = element.findtext(path)
            if not text:
                return None
            return self._make_mxdate(ensure_unicode(text, self.encoding),
                                     format="%Y-%m-%d")

        org_name = element.findtext(".//OrgNavn")
        org_type = element.findtext(".//OrgType")
        extent = element.findtext(".//Omfang")
        start = date_at(".//Startdato")
        end = date_at(".//Sluttdato")
        description = ensure_unicode(element.findtext(".//Tekst"),
                                     self.encoding)
        return DataExternalWork(org_name, org_type, extent,
                                start, end, description)

示例#13

0

显示文件

文件： ltxml2object.py 项目： unioslo/cerebrum

    def _pull_name(self, element, *possible_keys):
        """Return a first of possible_keys that is present in element."""
        for key in possible_keys:
            if element.get(key):
                value = ensure_unicode(element.get(key), self.encoding)
                return value
            # fi
        # od

        # NB! A name that is not there *must* be represented as None. "" (empty
        # string) is NOT the same as no name.
        return None

示例#14

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

    def _make_sgm(self, element):
        """Return a sgm object (DataExternalWork) built from element.

        The organisation name, type and extent are read verbatim from
        <OrgNavn>, <OrgType> and <Omfang>. The start and end dates come
        from <Startdato> and <Sluttdato> in %Y-%m-%d format; a missing or
        empty date gives None. <Tekst> supplies the description.
        """
        org_name = element.findtext(".//OrgNavn")
        org_type = element.findtext(".//OrgType")
        extent = element.findtext(".//Omfang")

        start_text = element.findtext(".//Startdato")
        start = None
        if start_text:
            start = self._make_mxdate(
                ensure_unicode(start_text, self.encoding),
                format="%Y-%m-%d")

        end_text = element.findtext(".//Sluttdato")
        end = None
        if end_text:
            end = self._make_mxdate(
                ensure_unicode(end_text, self.encoding),
                format="%Y-%m-%d")

        description = ensure_unicode(element.findtext(".//Tekst"),
                                     self.encoding)
        return DataExternalWork(org_name, org_type, extent,
                                start, end, description)

示例#15

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

    def _make_title(self, title_kind, title_element):
        """Build a DataName of kind title_kind from a title element.

        The language is the text of <Sprak> and the title itself the text
        of <Navn>. None is returned unless both are non-empty.
        """
        lang = title_element.findtext(".//Sprak")
        text = ensure_unicode(title_element.findtext(".//Navn"),
                              self.encoding)

        if lang and text:
            return DataName(title_kind, text, lang)
        return None

示例#16

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

    def _make_title(self, title_kind, title_element):
        """Return a DataName holding a title and its language, or None.

        <Navn> gives the title text and <Sprak> its language. If either of
        them is missing or empty, there is no title and None is returned.
        """
        title_text = ensure_unicode(title_element.findtext(".//Navn"),
                                    self.encoding)
        # findtext() has no side effects, so the two lookups are independent.
        title_lang = title_element.findtext(".//Sprak")

        if not title_lang or not title_text:
            return None

        return DataName(title_kind, title_text, title_lang)

示例#17

0

显示文件

文件： ltxml2object.py 项目： unioslo/cerebrum

    def _make_contact(self, elem, contact_prefs):
        """Derive contact information from LT data.

        We do not have the exact meanings, so this is guesswork. One element
        can result in multiple contact entries.
        """

        result = list()
        if elem.tag == "arbtlf":
            if int(elem.get("telefonnr")):
                result.append((DataContact.CONTACT_PHONE,
                               elem.get("telefonnr")))
            if int(elem.get("linjenr")):
                result.append((DataContact.CONTACT_PHONE,
                               "%i%05i" % (int(elem.get("innvalgnr")),
                                           int(elem.get("linjenr")))))
            # fi
        elif elem.tag == "komm":
            comm_type = elem.get("kommtypekode")
            value = elem.get("kommnrverdi", elem.get("telefonnr", None))
            if (comm_type in ("ARBTLF", "EKSTRA TLF", "JOBBTLFUTL",) and
                    value):
                result.append((DataContact.CONTACT_PHONE,
                               ensure_unicode(value, self.encoding)))
            if comm_type in ("FAX", "FAXUTLAND") and value:
                result.append((DataContact.CONTACT_FAX,
                               ensure_unicode(value, self.encoding)))
            # fi
        # fi

        # Since we do not have priority data, we'll simple assign priorities
        # on per category basis.
        tmp = list()
        for c_kind, c_value in result:
            priority = contact_prefs.get(c_kind, 0)
            contact_prefs[c_kind] = priority + 1
            tmp.append(DataContact(c_kind, c_value, priority))
        # od

        return tmp

示例#18

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

    def _make_address(self, addr_element):
        """Make a DataAddress instance out of an <Adresse>.

        addr_element must be an <Adresse> element. Sub-elements with text
        fill in the address: <Gateadresse> goes first in the street lines,
        <Adressetillegg> is appended after it, <Postnummer>, <Poststed> and
        <Landkode> become zip, city and country, and <Type> decides the
        address kind. <CO> is ignored.

        Returns None if the address kind is missing or unknown, or if the
        postal code is longer than 8 characters.
        """

        # NB: this method is indented with spaces only. Mixing in tabs, as
        # was done earlier, is a TabError on Python 3.
        assert addr_element.tag == "Adresse"

        sap2intern = {
            "Besøksadresse": DataAddress.ADDRESS_BESOK,
            "Postadresse": DataAddress.ADDRESS_POST,
            "Bostedsadresse": DataAddress.ADDRESS_PRIVATE,
            "Avvikende postadresse": DataAddress.ADDRESS_OTHER_POST,
            "Avvikende besøksadresse": DataAddress.ADDRESS_OTHER_BESOK,
        }

        # postal_code, not zip: avoid shadowing the builtin.
        postal_code = city = country = addr_kind = ""
        street = []

        # iter() instead of getiterator(); the latter no longer exists in
        # xml.etree on Python 3.9 and later.
        for sub in addr_element.iter():
            if not sub.text:
                continue
            value = ensure_unicode(sub.text.strip(), self.encoding)

            if sub.tag == "Gateadresse":
                street.insert(0, value)
            elif sub.tag == "Adressetillegg":
                street.append(value)
            elif sub.tag == "Postnummer":
                # IVR 2007-01-04 FIXME: 8 is the length of the field in the
                # database. It's a bit ugly to do things this way, though.
                if len(value) > 8:
                    return None
                postal_code = value
            elif sub.tag == "Poststed":
                city = value
            elif sub.tag == "Landkode":
                country = value
            elif sub.tag == "Type":
                addr_kind = sap2intern.get(value, "")
            # <CO> is skipped on purpose: CO-fields don't seem to be
            # registered intentionally or with any kind of plan and
            # regularity. We will stop importing them for now, and do an
            # evaluation at a later time. Jazz, 2011-10-28

        # If we do not know the address kind, we *cannot* register it.
        if not addr_kind:
            return None

        return DataAddress(kind=addr_kind,
                           street=street, zip=postal_code,
                           city=city, country=country)

示例#19

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

    def _make_contact(self, elem, priority):
        """Return a DataContact instance out of elem, or None.

        The kind of contact is given by the text of the <Type> child, the
        value by the text of the <Verdi> child. None is returned when:

        - <Type> is missing or has no text,
        - the (stripped) text of <Type> is not a known contact kind,
        - <Verdi> is missing or has no text.

        The stripped value is passed through deuglify_phone() and stored,
        together with priority, in the resulting DataContact.
        """

        kommtype2const = {
            u"Faks arbeid":
            DataContact.CONTACT_FAX,
            u"Telefaks midlertidig arbeidssted":
            DataContact.CONTACT_FAX,
            u"Arbeidstelefon 1":
            DataContact.CONTACT_PHONE,
            u"Arbeidstelefon 2":
            DataContact.CONTACT_PHONE,
            u"Arbeidstelefon 3":
            DataContact.CONTACT_PHONE,
            u"Mobilnummer, jobb":
            DataContact.CONTACT_MOBILE_WORK,
            u"Mobilnummer, privat":
            DataContact.CONTACT_MOBILE_PRIVATE,
            u"Privat mobil synlig på web":
            DataContact.CONTACT_MOBILE_PRIVATE_PUBLIC
        }

        ctype = elem.find("Type")
        # <Type/> without text gives text None; handle it like a missing
        # element instead of failing on None.strip().
        if ctype is None or ctype.text is None:
            return None

        kind = kommtype2const.get(
            ensure_unicode(ctype.text.strip(), self.encoding))
        if kind is None:
            return None

        verdi = elem.find("Verdi")
        # A contact without a value element (or with an empty one) cannot
        # be registered.
        if verdi is None or verdi.text is None:
            return None

        cvalue = deuglify_phone(
            ensure_unicode(verdi.text.strip(), self.encoding))

        return DataContact(kind, cvalue, priority)

示例#20

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

    def _make_role(self, elem):
        """Make an employment out of a <Roller>...</Roller>.

              SAP uses <Roller>-elements to designate bilagslønnede and gjester.

        """
        ou_id = None
        start_date = end_date = None
        kind = None
        code = None

        for sub in elem.getiterator():
            if not sub.text:
                continue

            value = ensure_unicode(sub.text.strip(), self.encoding)

            if sub.tag == "Navn":
                code = value

                if value == "BILAGSLØNN":
                    kind = DataEmployment.BILAG
                else:
                    # For guests, we distinguish between different guest kinds
                    # For bilagslønnede, we don't care (they are all alike)
                    kind = DataEmployment.GJEST
            elif sub.tag == "Stedkode":
                sko = make_sko(value)
                if sko is not None:
                    ou_id = (DataOU.NO_SKO, sko)
            elif sub.tag == "Startdato":
                start_date = self._make_mxdate(value, format="%Y-%m-%d")
            elif sub.tag == "Sluttdato":
                end_date = self._make_mxdate(value, format="%Y-%m-%d")

        if ou_id is None:
            return None

        return DataEmployment(kind=kind,
                              percentage=None,
                              code=code,
                              start=start_date,
                              end=end_date,
                              place=ou_id,
                              category=None)

示例#21

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

    def _make_role(self, elem):
        """Make an employment out of a <Roller>...</Roller>.

              SAP uses <Roller>-elements to designate bilagslønnede and gjester.

        """
        ou_id = None
        start_date = end_date = None
        kind = None
        code = None

        for sub in elem.getiterator():
            if not sub.text:
                continue

            value = ensure_unicode(sub.text.strip(), self.encoding)

            if sub.tag == "Navn":
                code = value

                if value == "BILAGSLØNN":
                    kind = DataEmployment.BILAG
                else:
                    # For guests, we distinguish between different guest kinds
                    # For bilagslønnede, we don't care (they are all alike)
                    kind = DataEmployment.GJEST
            elif sub.tag == "Stedkode":
                sko = make_sko(value)
                if sko is not None:
                    ou_id = (DataOU.NO_SKO, sko)
            elif sub.tag == "Startdato":
                start_date = self._make_mxdate(value, format="%Y-%m-%d")
            elif sub.tag == "Sluttdato":
                end_date = self._make_mxdate(value, format="%Y-%m-%d")

        if ou_id is None:
            return None

        return DataEmployment(kind=kind, percentage=None,
                              code=code,
                              start=start_date, end=end_date,
                              place=ou_id, category=None)

示例#22

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

    def _make_employment(self, emp_element):
        """Make a DataEmployment instance of an <Hovedstilling>, </Bistilling>.

        emp_element is the XML-subtree representing the employment. Returns a
        DataEmployment object, representing the XML-employment object.

        """
        percentage = code = None
        start_date = end_date = None
        ou_id = None
        category = None
        kind = self.tag2type[emp_element.tag]
        mg = mug = None

        for sub in emp_element.getiterator():
            if not sub.text:
                continue

            value = ensure_unicode(sub.text.strip(), self.encoding)

            if sub.tag == "Stillingsprosent":
                percentage = float(value)
            elif sub.tag == "SKO":
                code = int(value[0:4])

                if getattr(self, 'filter_out_sko_0000', True):
                    # 0000 are to be discarded. This is by design.
                    if code == 0:
                        return None
                # Some elements have the proper category set in AdmForsk
                if category is None:
                    category = self._code2category(code)
            elif sub.tag == "Stilling":
                tmp = value.split(" ")
                if len(tmp) != 1 and category is None:
                    category = self._code2category(tmp[0])
            elif sub.tag == "Startdato":
                start_date = self._make_mxdate(value, format="%Y-%m-%d")
            elif sub.tag == "Sluttdato":
                end_date = self._make_mxdate(value, format="%Y-%m-%d")
            elif sub.tag == "Orgenhet":
                sko = make_sko(value)
                if sko is not None:
                    ou_id = (DataOU.NO_SKO, sko)
            elif sub.tag == "AdmForsk":
                # if neither is specified, use, the logic in
                # stillingsgruppebetegnelse to decide on the category
                if value == "Vit":
                    category = DataEmployment.KATEGORI_VITENSKAPLIG
                elif value == "T/A":
                    category = DataEmployment.KATEGORI_OEVRIG
            elif sub.tag == "Status":
                # <Status> indicates whether the employment entry is actually
                # valid.
                if value != "Aktiv":
                    return None
            elif sub.tag == "Stillingsnummer":
                # this code means that the employment has been terminated (why
                # would there be two elements for that?)
                if value == "99999999":
                    return None
                # these are temp employments (bilagslønnede) that we can
                # safely disregard (according to baardj).
                if value == "30010895":
                    return None
            elif sub.tag == "MEGType":
                mg = int(value)
            elif sub.tag == "MUGType":
                mug = int(value)
            # IVR 2007-07-11 FIXME: We should take a look at <Arsak>, since it
            # contains deceased status for a person.

        # We *must* have an OU to which this employment is attached.
        if getattr(self, 'require_ou_for_assignments', True) and not ou_id:
            return None

        kind = self.tag2type[emp_element.tag]
        tmp = DataEmployment(kind=kind, percentage=percentage,
                             code=code, start=start_date, end=end_date,
                             place=ou_id, category=category,
                             mg=mg, mug=mug)

        for element in emp_element.findall(".//Tittel"):
            work_title = self._make_title(DataEmployment.WORK_TITLE, element)
            if work_title:
                tmp.add_name(work_title)

        return tmp

示例#23

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

    def next_object(self, element):
        """Return the next DataOU object.

        element is the XML subtree describing one OU. Ids, parent, names,
        addresses, start/end dates, usage codes and contact information are
        collected from it into a new DataOU.

        Returns the DataOU, or None when the OU has no long name while
        being neither expired nor not yet active.
        """

        result = DataOU()

        # IVR 2007-12-24 FIXME: One of the attributes is special, and tags the
        # OU's intended usage code (bruksområde). Find out which attribute
        # this is.
        # Iterate over *all* subelements. Element.iter() replaces
        # getiterator(), which has been removed from xml.etree in
        # Python 3.9.
        for sub in element.iter():
            value = None
            if sub.text:
                value = ensure_unicode(sub.text.strip(), self.encoding)
            if sub.tag == "Stedkode":
                sko = make_sko(value)
                if sko is not None:
                    result.add_id(self.tag2type[sub.tag], sko)
                else:
                    # invalid value for the <Stedkode> tag
                    if self.logger:
                        # warning() rather than warn(); the latter is a
                        # deprecated alias in the logging module.
                        self.logger.warning(
                            'Detected XML <Stedkode> '
                            'tag with invalid value: %s',
                            value
                        )
            elif sub.tag == "Overordnetstedkode":
                sko = make_sko(value)
                if sko is not None:
                    result.parent = (result.NO_SKO, sko)
            elif sub.tag == "Navn":
                for name in self._make_names(sub):
                    result.add_name(name)
            elif sub.tag in ("Adresse",):
                result.add_address(self._make_address(sub))
            elif sub.tag in ("Startdato", "Sluttdato"):
                date = self._make_mxdate(sub.text, format="%Y-%m-%d")
                if sub.tag == "Startdato":
                    result.start_date = date
                else:
                    result.end_date = date

        # Whether the OU can be published in various online directories
        result.publishable = False
        for tmp in element.findall(".//Bruksomrade/Type"):
            if tmp.text == "Tillatt Organisasjon":
                result.publishable = True
            # <StedType> tell us how an OU can be used. This information is
            # represented in Cerebrum with the help of spreads and can be
            # accessed via the EntitySpread interface.
            result.add_usage_code(tmp.text)

        celems = element.findall("Kommunikasjon")
        for sub in celems:
            ct = self._make_contact(sub)
            if ct:
                result.add_contact(ct)

        # We require an OU to have a name.
        # Ideally, the information about expired OUs should be complete as
        # well, but we won't be this lucky in our lifetimes. So, for expired
        # OUs we won't care about the names.
        # Neither do we care about the missing names of not yet active
        # OUs; we choose to hope that the names will be in place when
        # the OU becomes active.
        if result.get_name(DataOU.NAME_LONG) is None:
            ou_no_sko_str = result.get_id(DataOU.NO_SKO)
            if not ou_no_sko_str:
                ou_no_sko_str = 'Missing a valid NO_SKO value'
            if result.end_date and result.end_date < now():
                if self.logger:
                    self.logger.debug("No name for expired OU %s",
                                      ou_no_sko_str)
            elif result.start_date and result.start_date > now():
                if self.logger:
                    self.logger.debug("No name for future OU %s",
                                      ou_no_sko_str)
            else:
                if self.logger:
                    self.logger.warning("No name available for OU %s",
                                        ou_no_sko_str)
                return None

        return result

示例#24

0

显示文件

文件： ltxml2object.py 项目： Narvik-kommune/cerebrum

    def _make_employment(self, elem):
        """Convert an LT employment element into a DataEmployment record.

        Three element kinds exist, each with its own attribute layout:

        - ``bilag``: the settlement date becomes the end date and the OU is
          read from the ``*_kontering`` attributes.
        - ``gjest``: OU, start/end dates and the guest type code are read.
        - ``tils``: percentage, position code, title, start/end dates, the
          OU from the ``*_utgift`` attributes and, if present, the main
          category are read.

        Every ``permisjon`` child of the element becomes one leave entry.

        :param elem: XML element tagged ``bilag``, ``gjest`` or ``tils``.
        :return: a DataEmployment built from the element's attributes.
        :raises KeyError: if the tag is none of the three known kinds, or if
            ``hovedkat`` holds a value that is not in the category map.
        """
        # There are 3 kinds -- tils, bilag && gjest. All in different
        # formats, of course:
        percentage = code = title = None
        start_date = end_date = None
        category = None
        ou_id = None
        leave = []
        tag2kind = {
            "bilag": DataEmployment.BILAG,
            "tils": DataEmployment.HOVEDSTILLING,
            "gjest": DataEmployment.GJEST,
        }
        # Explicit unicode keys: the lookup below uses the result of
        # ensure_unicode() (presumably a unicode string), and a non-ASCII
        # byte-string key would never match a unicode lookup value.
        xml2cat = {
            u"ØVR": DataEmployment.KATEGORI_OEVRIG,
            u"VIT": DataEmployment.KATEGORI_VITENSKAPLIG,
        }

        def make_sko(f, i, g):
            """Return the three named attributes of elem as a tuple of ints."""
            return tuple([int(elem.get(x)) for x in (f, i, g)])

        if elem.tag == "bilag":
            end_date = self._make_mxdate(elem.get("dato_oppgjor"))
            ou_id = (DataOU.NO_SKO,
                     make_sko("fakultetnr_kontering", "instituttnr_kontering",
                              "gruppenr_kontering"))
        elif elem.tag == "gjest":
            ou_id = (DataOU.NO_SKO,
                     make_sko("fakultetnr", "instituttnr", "gruppenr"))
            start_date = self._make_mxdate(elem.get("dato_fra"))
            end_date = self._make_mxdate(elem.get("dato_til"))
            code = ensure_unicode(elem.get("gjestetypekode"), self.encoding)
        elif elem.tag == "tils":
            percentage = float(elem.get("prosent_tilsetting"))
            code = ensure_unicode(elem.get("stillingkodenr_beregnet_sist"),
                                  self.encoding)
            title = ensure_unicode(elem.get("tittel"), self.encoding)
            # A "professor II" entry is registered with a fifth of the
            # percentage given in the XML.
            if title == "professor II":
                percentage = percentage / 5.0
            start_date = self._make_mxdate(elem.get("dato_fra"))
            end_date = self._make_mxdate(elem.get("dato_til"))
            ou_id = (DataOU.NO_SKO,
                     make_sko("fakultetnr_utgift", "instituttnr_utgift",
                              "gruppenr_utgift"))
            if elem.get("hovedkat"):
                category = xml2cat[ensure_unicode(elem.get("hovedkat"),
                                                  self.encoding)]

        # Handle leave (permisjon). The period is read from the permisjon
        # element itself, not from the enclosing employment element;
        # otherwise every leave would span the whole employment.
        for child in elem:
            if child.tag == "permisjon":
                leave.append({
                    'percentage': float(child.get("prosent_permisjon")),
                    'start_date': self._make_mxdate(child.get("dato_fra")),
                    'end_date': self._make_mxdate(child.get("dato_til")),
                })

        return DataEmployment(kind=tag2kind[elem.tag],
                              percentage=percentage,
                              code=code,
                              title=title,
                              start=start_date,
                              end=end_date,
                              place=ou_id,
                              category=category,
                              leave=leave)

示例#25

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

 def ext(subelm):
     """Return the text of the `subelm` child of the enclosing `element`.

     The text is passed through ensure_unicode(); an empty string is
     returned when the child is missing or has no text.
     """
     node = element.find(subelm)
     if node is None or not node.text:
         return ""
     return ensure_unicode(node.text, self.encoding)

示例#26

0

显示文件

文件： ltxml2object.py 项目： unioslo/cerebrum

    def _make_employment(self, elem):
        """Convert an LT employment element into a DataEmployment record.

        Three element kinds exist, each with its own attribute layout:

        - ``bilag``: the settlement date becomes the end date and the OU is
          read from the ``*_kontering`` attributes.
        - ``gjest``: OU, start/end dates and the guest type code are read.
        - ``tils``: percentage, position code, title, start/end dates, the
          OU from the ``*_utgift`` attributes and, if present, the main
          category are read.

        Every ``permisjon`` child of the element becomes one leave entry.

        :param elem: XML element tagged ``bilag``, ``gjest`` or ``tils``.
        :return: a DataEmployment built from the element's attributes.
        :raises KeyError: if the tag is none of the three known kinds, or if
            ``hovedkat`` holds a value that is not in the category map.
        """
        # There are 3 kinds -- tils, bilag && gjest. All in different
        # formats, of course:
        percentage = code = title = None
        start_date = end_date = None
        category = None
        ou_id = None
        leave = []
        tag2kind = {
            "bilag": DataEmployment.BILAG,
            "tils": DataEmployment.HOVEDSTILLING,
            "gjest": DataEmployment.GJEST,
        }
        # Explicit unicode keys: the lookup below uses the result of
        # ensure_unicode() (presumably a unicode string), and a non-ASCII
        # byte-string key would never match a unicode lookup value.
        xml2cat = {
            u"ØVR": DataEmployment.KATEGORI_OEVRIG,
            u"VIT": DataEmployment.KATEGORI_VITENSKAPLIG,
        }

        def make_sko(f, i, g):
            """Return the three named attributes of elem as a tuple of ints."""
            return tuple([int(elem.get(x)) for x in (f, i, g)])

        if elem.tag == "bilag":
            end_date = self._make_mxdate(elem.get("dato_oppgjor"))
            ou_id = (DataOU.NO_SKO,
                     make_sko("fakultetnr_kontering", "instituttnr_kontering",
                              "gruppenr_kontering"))
        elif elem.tag == "gjest":
            ou_id = (DataOU.NO_SKO,
                     make_sko("fakultetnr", "instituttnr", "gruppenr"))
            start_date = self._make_mxdate(elem.get("dato_fra"))
            end_date = self._make_mxdate(elem.get("dato_til"))
            code = ensure_unicode(elem.get("gjestetypekode"), self.encoding)
        elif elem.tag == "tils":
            percentage = float(elem.get("prosent_tilsetting"))
            code = ensure_unicode(elem.get("stillingkodenr_beregnet_sist"),
                                  self.encoding)
            title = ensure_unicode(elem.get("tittel"), self.encoding)
            # A "professor II" entry is registered with a fifth of the
            # percentage given in the XML.
            if title == "professor II":
                percentage = percentage / 5.0
            start_date = self._make_mxdate(elem.get("dato_fra"))
            end_date = self._make_mxdate(elem.get("dato_til"))
            ou_id = (DataOU.NO_SKO,
                     make_sko("fakultetnr_utgift", "instituttnr_utgift",
                              "gruppenr_utgift"))
            if elem.get("hovedkat"):
                category = xml2cat[ensure_unicode(elem.get("hovedkat"),
                                                  self.encoding)]

        # Handle leave (permisjon). The period is read from the permisjon
        # element itself, not from the enclosing employment element;
        # otherwise every leave would span the whole employment.
        for child in elem:
            if child.tag == "permisjon":
                leave.append({
                    'percentage': float(child.get("prosent_permisjon")),
                    'start_date': self._make_mxdate(child.get("dato_fra")),
                    'end_date': self._make_mxdate(child.get("dato_til")),
                })

        return DataEmployment(kind=tag2kind[elem.tag],
                              percentage=percentage,
                              code=code, title=title,
                              start=start_date, end=end_date, place=ou_id,
                              category=category,
                              leave=leave)

示例#27

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

 def ext(subelm):
     """Return the text of the `subelm` child of the enclosing `element`.

     The text is passed through ensure_unicode(); an empty string is
     returned when the child is missing or has no text.
     """
     node = element.find(subelm)
     if node is None or not node.text:
         return ""
     return ensure_unicode(node.text, self.encoding)

示例#28

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

    def next_object(self, element):
        """Build a DataOU from one OU XML element.

        All descendants of `element` are scanned for ids, parent id, names,
        addresses and start/end dates; usage codes and contact entries are
        collected afterwards.

        :param element: XML element describing one OU.
        :return: the populated DataOU. None is returned when the OU has no
            long name and is neither expired nor not yet active.
        """
        ou = DataOU()

        # IVR 2007-12-24 FIXME: One of the attributes is special, and tags the
        # OU's intended usage code (bruksområde). Find out which attribute
        # this is.
        for node in element.getiterator():
            tag = node.tag
            text = None
            if node.text:
                text = ensure_unicode(node.text.strip(), self.encoding)

            if tag == "Stedkode":
                sko = make_sko(text)
                if sko is None:
                    # The <Stedkode> tag did not hold a usable value.
                    if self.logger:
                        self.logger.warn(
                            'Detected XML <Stedkode> '
                            'tag with invalid value: %s', text)
                else:
                    ou.add_id(self.tag2type[tag], sko)
            elif tag == "Overordnetstedkode":
                parent_sko = make_sko(text)
                if parent_sko is not None:
                    ou.parent = (ou.NO_SKO, parent_sko)
            elif tag == "Navn":
                for name in self._make_names(node):
                    ou.add_name(name)
            elif tag == "Adresse":
                ou.add_address(self._make_address(node))
            elif tag == "Startdato":
                # Dates are parsed from the raw element text.
                ou.start_date = self._make_mxdate(node.text,
                                                  format="%Y-%m-%d")
            elif tag == "Sluttdato":
                ou.end_date = self._make_mxdate(node.text,
                                                format="%Y-%m-%d")

        # Whether the OU can be published in various online directories.
        # Every usage type is also recorded as a usage code; in Cerebrum
        # these are represented with the help of spreads and can be
        # accessed via the EntitySpread interface.
        ou.publishable = False
        for usage in element.findall(".//Bruksomrade/Type"):
            if usage.text == "Tillatt Organisasjon":
                ou.publishable = True
            ou.add_usage_code(usage.text)

        for comm in element.findall("Kommunikasjon"):
            contact = self._make_contact(comm)
            if contact:
                ou.add_contact(contact)

        # We require an OU to have a name, except for expired OUs (their
        # data is rarely complete) and OUs that are not active yet (the name
        # is hoped to be in place by the time they become active).
        if ou.get_name(DataOU.NAME_LONG) is not None:
            return ou

        sko_label = ou.get_id(DataOU.NO_SKO) or 'Missing a valid NO_SKO value'
        if ou.end_date and ou.end_date < now():
            if self.logger:
                self.logger.debug("No name for expired OU %s", sko_label)
            return ou
        if ou.start_date and ou.start_date > now():
            if self.logger:
                self.logger.debug("No name for future OU %s", sko_label)
            return ou

        if self.logger:
            self.logger.warn("No name available for OU %s", sko_label)
        return None

示例#29

0

显示文件

文件： sapxml2object.py 项目： unioslo/cerebrum

    def next_object(self, element):
        """Return the next SAPPerson object.

        Consume the next XML element describing a person, and return a
        suitable representation (SAPPerson). Exceptions raised by the helper
        methods called here are not caught.

        :param element: XML element describing one person.
        :return: the populated SAPPerson, or None when a name is marked as
            invalid ('*' or '@') or when the first or last name is missing.
        """
        result = SAPPerson()

        # Per baardj's request, we consider middle names as first names.
        # The element is kept in its own variable so that `middle` is always
        # a string and never an XML element.
        middle = ""
        middle_elem = element.find("Person/Mellomnavn")
        if middle_elem is not None and middle_elem.text:
            middle = ensure_unicode(middle_elem.text.strip(), self.encoding)

        # Iterate over *all* subelements, 'fill up' the result object
        for sub in element.getiterator():
            value = None
            if sub.text:
                value = ensure_unicode(sub.text.strip(), self.encoding)

            if sub.tag in ("Fornavn", "Etternavn"):
                if value is None:
                    # An empty name element carries nothing to register.
                    # The first/last name check at the end decides whether
                    # the person is still usable.
                    continue
                if sub.tag == "Fornavn" and middle:
                    value += " " + middle

                # IVR 2007-05-30 FIXME: This is not pretty.
                #
                # Invalid entries are marked in the name elements. '*' was
                # the first marker, but it is also a common wildcard in SAP,
                # so '@' was suggested instead (JAZZ 2007-08-01). The data
                # may still contain either, so both are tested.
                if '*' in value or '@' in value:
                    if self.logger:
                        self.logger.debug("Name contains '@' or '*', ignored")
                    # Since the element is marked as void, there is no need to
                    # process further (we have no guarantee that any data
                    # would make sense and we won't have even more spurious
                    # warnings).
                    return None
                result.add_name(DataName(self.tag2type[sub.tag], value))
            elif sub.tag == "Fodselsnummer" and value is not None:
                result.add_id(self.tag2type[sub.tag], personnr_ok(value))
            elif sub.tag == "Ansattnummer":
                result.add_id(self.tag2type[sub.tag], value)
                if self.logger:
                    self.logger.debug(value)
            elif sub.tag == "Fodselsdato":
                result.birth_date = self._make_mxdate(value, format="%Y-%m-%d")
            elif sub.tag == "Kjonn":
                result.gender = self.tag2type[value]
            elif sub.tag == "Adresse":
                result.add_address(self._make_address(sub))
            elif sub.tag in ("Hovedstilling", "Bistilling"):
                emp = self._make_employment(sub)
                if emp is not None:
                    result.add_employment(emp)
            elif sub.tag == "Roller" and sub.findtext("IKKE-ANGIT") is None:
                emp = self._make_role(sub)
                if emp is not None:
                    result.add_employment(emp)
            elif sub.tag == "Person":
                # Lots of the other entries above also are part of the
                # "person"-firstlevel element, but we need to
                # specifically look here for Tittel => personal title,
                # to avoid confusion with worktitles
                for subsub in sub.findall("Tittel"):
                    personal_title = self._make_title(HRDataPerson.NAME_TITLE,
                                                      subsub)
                    if personal_title:
                        result.add_name(personal_title)
            elif sub.tag == "PersonligID":
                # Store additional person ids, like passport numbers.
                id_type = sub.find('Type').text
                if id_type in self.sap2idtype:
                    # A unicode template keeps the formatting from encoding
                    # the (presumably unicode) parts back to ASCII.
                    pers_id = u'{0}-{1}'.format(
                        ensure_unicode(sub.find('Land').text, self.encoding),
                        ensure_unicode(sub.find('Verdi').text, self.encoding)
                    )
                    result.add_id(self.sap2idtype[id_type], pers_id)
                elif self.logger:
                    self.logger.debug(
                        "Unknown %s type '%s': skipping id type",
                        sub.tag, id_type)
            elif sub.tag == "SGM":
                # New feature and unique (for now?) for UiO is SGM,
                # external attachments for person.
                if self.logger:
                    self.logger.debug("SGM for %s", result)
                result.add_external_work(self._make_sgm(sub))

        # We need to order 'Telefon 1' and 'Telefon 2' properly. Entries
        # without a <Type> sort first instead of breaking the sort.
        celems = list(element.findall("Kommunikasjon"))
        celems.sort(key=lambda comm: comm.findtext("Type") or "")
        # TBD: Priorities!
        priority = 0
        for ct in celems:
            contact = self._make_contact(ct, priority)
            if contact:
                result.add_contact(contact)
                priority += 1

        # Reservations for catalogue publishing
        # default: One active employment => can be published
        to_reserve = not result.has_active_employments()

        # Everyone with 'RESE' is reserved (regardless of everything else)
        # If no 'RESE' exists, but there is a 'SAMT' => no reservation
        for i in element.findall("Adresse/Reservert"):
            if i.text:
                tmp = i.text.strip()
                if tmp == "RESE":
                    to_reserve = True
                    break
                elif tmp == "SAMT":
                    to_reserve = False
        result.reserved = to_reserve

        # Address magic
        # If there is a sensible payslip location entry, it will result in
        # proper "post/besøksaddresse" later. This code matches LT's behaviour
        # more closely (an employee 'inherits' the address of his/her
        # "primary" workplace.
        # NOTE(review): the literal compared below is spelled 'lønnslipp'
        # (single 's' after 'lønn'); confirm that it matches the SAP data.
        for sub in element.getiterator("Kommunikasjon"):
            txt = ensure_unicode(sub.findtext("Type"), self.encoding)
            val = ensure_unicode(sub.findtext("Verdi"), self.encoding)
            if not (txt and txt == "Sted for lønnslipp" and val):
                continue
            # *some* of the entries have a space here and there,
            # and some contain non-digit data
            digits = val.replace(" ", "")
            # At least five digits are needed so that none of the three
            # slices below is empty (int('') would raise ValueError).
            if not digits.isdigit() or len(digits) < 5:
                continue
            fak, inst, gruppe = [int(x) for x in
                                 (digits[:2], digits[2:4], digits[4:])]
            result.primary_ou = (cereconf.DEFAULT_INSTITUSJONSNR,
                                 fak, inst, gruppe)

        # We require people to have first/last name.
        if not (result.get_name(result.NAME_FIRST) and
                result.get_name(result.NAME_LAST)):
            if self.logger:
                self.logger.warn(
                    "People must have first and last names. %s skipped",
                    list(result.iterids())
                )
            return None

        return result

示例#30

0

显示文件

文件： fsxml2object.py 项目： unioslo/cerebrum

    def next_object(self, element):
        """Build an FSOU from the attributes of one FS OU element.

        Reads the OU's own sko and its parent's sko, an optional
        ``stedkode_konv`` id, names, visit/internal addresses and contact
        entries.

        :param element: XML element describing one OU.
        :return: the populated FSOU, or None when it ends up without a sko
            or without a long name.
        """
        def read_sko(*attribute_names):
            """Return the named attributes of element as a tuple of ints."""
            return tuple(int(element.get(name)) for name in attribute_names)

        def attr_text(attribute_name):
            """Return the attribute (default "") through ensure_unicode."""
            return ensure_unicode(element.get(attribute_name, ""),
                                  self.encoding)

        ou = FSOU()

        own_sko = read_sko("fakultetnr", "instituttnr", "gruppenr")
        ou.add_id(ou.NO_SKO, own_sko)

        # Parent ID - sko
        parent_sko = read_sko("fakultetnr_for_org_sted",
                              "instituttnr_for_org_sted",
                              "gruppenr_for_org_sted")
        ou.parent = (ou.NO_SKO, parent_sko)

        # stedkode_konv occasionally contains SAP-OU-id for some
        # SAP-implementations. NB! This does not apply to UiO (as UiO's
        # implementation uses sko).
        if element.get("stedkode_konv"):
            ou.add_id(ou.NO_SAP_ID, element.get("stedkode_konv"))

        # IVR 2007-01-02: Everything coming from FS is publishable. However,
        # we may want to revise that at some point.
        ou.publishable = True

        # names
        name_sources = (
            (ou.NAME_LONG, "stednavn", "nb"),
            (ou.NAME_SHORT, "forkstednavn", "nb"),
            (ou.NAME_ACRONYM, "akronym", "nb"),
        )
        for name_kind, attribute, language in name_sources:
            text = self._pull_name(element, attribute)
            if text:
                ou.add_name(DataName(name_kind, text, language))

        # addresses
        address_sources = (
            ("besok", DataAddress.ADDRESS_BESOK),
            ("intern", DataAddress.ADDRESS_POST),
        )
        for prefix, address_kind in address_sources:
            zipcode = attr_text("poststednr_%s_adr" % prefix)
            lines = (attr_text("adresselinje1_%s_adr" % prefix),
                     attr_text("adresselinje2_%s_adr" % prefix))
            ou.add_address(DataAddress(kind=address_kind,
                                       street=lines,
                                       zip=zipcode,
                                       city="",
                                       country=""))

        # contact information; the priority only advances for entries that
        # are actually registered
        next_priority = 0
        for komm in element.findall("komm"):
            kind, value = self._make_contact(komm)
            if not (kind and value):
                continue
            ou.add_contact(DataContact(kind, value, next_priority))
            next_priority += 1

        # We require a sko from FS ...
        if not ou.get_id(ou.NO_SKO):
            self.logger.warn("OU %s is missing stedkode. Skipped",
                             ou)
            return None
        # ... and a name
        if not ou.get_name(ou.NAME_LONG):
            self.logger.warn("OU %s is missing name. Skipped",
                             ou)
            return None
        return ou

示例#31

0

显示文件

文件： ltxml2object.py 项目： unioslo/cerebrum

 def get_value(element_value):
     """Return `element_value` passed through ensure_unicode()."""
     converted = ensure_unicode(element_value, self.encoding)
     return converted

示例#32

0

显示文件

文件： ltxml2object.py 项目： Narvik-kommune/cerebrum

 def get_value(element_value):
     """Return `element_value` passed through ensure_unicode()."""
     converted = ensure_unicode(element_value, self.encoding)
     return converted

示例#33

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

    def _make_employment(self, emp_element):
        """Build a DataEmployment from an employment XML subtree.

        The docstring of the original names <Hovedstilling> and <Bistilling>
        as the elements handled here.

        :param emp_element: XML subtree representing one employment.
        :return: the DataEmployment for the subtree, or None when the entry
            is to be disregarded (SKO code 0 unless filtering is switched
            off, a status other than "Aktiv", one of two special position
            numbers, or a missing OU while an OU is required).
        """
        kind = self.tag2type[emp_element.tag]
        percentage = None
        code = None
        category = None
        start_date = None
        end_date = None
        ou_id = None
        mg = None
        mug = None

        for node in emp_element.getiterator():
            if not node.text:
                continue

            tag = node.tag
            text = ensure_unicode(node.text.strip(), self.encoding)

            if tag == "Stillingsprosent":
                percentage = float(text)
            elif tag == "SKO":
                code = int(text[0:4])
                # 0000 are to be discarded. This is by design.
                if getattr(self, 'filter_out_sko_0000', True) and code == 0:
                    return None
                # Some elements have the proper category set in AdmForsk
                if category is None:
                    category = self._code2category(code)
            elif tag == "Stilling":
                parts = text.split(" ")
                if category is None and len(parts) != 1:
                    category = self._code2category(parts[0])
            elif tag == "Startdato":
                start_date = self._make_mxdate(text, format="%Y-%m-%d")
            elif tag == "Sluttdato":
                end_date = self._make_mxdate(text, format="%Y-%m-%d")
            elif tag == "Orgenhet":
                sko = make_sko(text)
                if sko is not None:
                    ou_id = (DataOU.NO_SKO, sko)
            elif tag == "AdmForsk":
                # if neither is specified, use, the logic in
                # stillingsgruppebetegnelse to decide on the category
                if text == "Vit":
                    category = DataEmployment.KATEGORI_VITENSKAPLIG
                elif text == "T/A":
                    category = DataEmployment.KATEGORI_OEVRIG
            elif tag == "Status":
                # <Status> indicates whether the employment entry is actually
                # valid.
                if text != "Aktiv":
                    return None
            elif tag == "Stillingsnummer":
                # "99999999" means that the employment has been terminated
                # (why would there be two elements for that?); "30010895"
                # marks temp employments (bilagslønnede) that we can safely
                # disregard (according to baardj).
                if text in ("99999999", "30010895"):
                    return None
            elif tag == "MEGType":
                mg = int(text)
            elif tag == "MUGType":
                mug = int(text)
            # IVR 2007-07-11 FIXME: We should take a look at <Arsak>, since it
            # contains deceased status for a person.

        # We *must* have an OU to which this employment is attached.
        if not ou_id and getattr(self, 'require_ou_for_assignments', True):
            return None

        employment = DataEmployment(kind=kind,
                                    percentage=percentage,
                                    code=code,
                                    start=start_date,
                                    end=end_date,
                                    place=ou_id,
                                    category=category,
                                    mg=mg,
                                    mug=mug)

        for title_elem in emp_element.findall(".//Tittel"):
            work_title = self._make_title(DataEmployment.WORK_TITLE,
                                          title_elem)
            if work_title:
                employment.add_name(work_title)

        return employment

示例#34

0

显示文件

文件： sapxml2object.py 项目： Narvik-kommune/cerebrum

    def next_object(self, element):
        """Return the next SAPPerson object.

        Consume the next XML element describing a person, and return a
        suitable representation (SAPPerson). Exceptions raised by the helper
        methods called here are not caught.

        :param element: XML element describing one person.
        :return: the populated SAPPerson, or None when a name is marked as
            invalid ('*' or '@') or when the first or last name is missing.
        """
        result = SAPPerson()

        # Per baardj's request, we consider middle names as first names.
        # The element is kept in its own variable so that `middle` is always
        # a string and never an XML element.
        middle = ""
        middle_elem = element.find("Person/Mellomnavn")
        if middle_elem is not None and middle_elem.text:
            middle = ensure_unicode(middle_elem.text.strip(), self.encoding)

        # Iterate over *all* subelements, 'fill up' the result object
        for sub in element.getiterator():
            value = None
            if sub.text:
                value = ensure_unicode(sub.text.strip(), self.encoding)

            if sub.tag in ("Fornavn", "Etternavn"):
                if value is None:
                    # An empty name element carries nothing to register.
                    # The first/last name check at the end decides whether
                    # the person is still usable.
                    continue
                if sub.tag == "Fornavn" and middle:
                    value += " " + middle

                # IVR 2007-05-30 FIXME: This is not pretty.
                #
                # Invalid entries are marked in the name elements. '*' was
                # the first marker, but it is also a common wildcard in SAP,
                # so '@' was suggested instead (JAZZ 2007-08-01). The data
                # may still contain either, so both are tested.
                if '*' in value or '@' in value:
                    if self.logger:
                        self.logger.debug("Name contains '@' or '*', ignored")
                    # Since the element is marked as void, there is no need to
                    # process further (we have no guarantee that any data
                    # would make sense and we won't have even more spurious
                    # warnings).
                    return None
                result.add_name(DataName(self.tag2type[sub.tag], value))
            elif sub.tag == "Fodselsnummer" and value is not None:
                result.add_id(self.tag2type[sub.tag], personnr_ok(value))
            elif sub.tag == "Ansattnummer":
                result.add_id(self.tag2type[sub.tag], value)
                if self.logger:
                    self.logger.debug(value)
            elif sub.tag == "Fodselsdato":
                result.birth_date = self._make_mxdate(value, format="%Y-%m-%d")
            elif sub.tag == "Kjonn":
                result.gender = self.tag2type[value]
            elif sub.tag == "Adresse":
                result.add_address(self._make_address(sub))
            elif sub.tag in ("Hovedstilling", "Bistilling"):
                emp = self._make_employment(sub)
                if emp is not None:
                    result.add_employment(emp)
            elif sub.tag == "Roller" and sub.findtext("IKKE-ANGIT") is None:
                emp = self._make_role(sub)
                if emp is not None:
                    result.add_employment(emp)
            elif sub.tag == "Person":
                # Lots of the other entries above also are part of the
                # "person"-firstlevel element, but we need to
                # specifically look here for Tittel => personal title,
                # to avoid confusion with worktitles
                for subsub in sub.findall("Tittel"):
                    personal_title = self._make_title(HRDataPerson.NAME_TITLE,
                                                      subsub)
                    if personal_title:
                        result.add_name(personal_title)
            elif sub.tag == "PersonligID":
                # Store additional person ids, like passport numbers.
                id_type = sub.find('Type').text
                if id_type in self.sap2idtype:
                    # A unicode template keeps the formatting from encoding
                    # the (presumably unicode) parts back to ASCII.
                    pers_id = u'{0}-{1}'.format(
                        ensure_unicode(sub.find('Land').text, self.encoding),
                        ensure_unicode(sub.find('Verdi').text, self.encoding))
                    result.add_id(self.sap2idtype[id_type], pers_id)
                elif self.logger:
                    self.logger.debug("Unknown %s type '%s': skipping id type",
                                      sub.tag,
                                      id_type)
            elif sub.tag == "SGM":
                # New feature and unique (for now?) for UiO is SGM,
                # external attachments for person.
                if self.logger:
                    self.logger.debug("SGM for %s", result)
                result.add_external_work(self._make_sgm(sub))

        # We need to order 'Telefon 1' and 'Telefon 2' properly. Entries
        # without a <Type> sort first instead of breaking the sort.
        celems = list(element.findall("Kommunikasjon"))
        celems.sort(key=lambda comm: comm.findtext("Type") or "")
        # TBD: Priorities!
        priority = 0
        for ct in celems:
            contact = self._make_contact(ct, priority)
            if contact:
                result.add_contact(contact)
                priority += 1

        # Reservations for catalogue publishing
        # default: One active employment => can be published
        to_reserve = not result.has_active_employments()

        # Everyone with 'RESE' is reserved (regardless of everything else)
        # If no 'RESE' exists, but there is a 'SAMT' => no reservation
        for i in element.findall("Adresse/Reservert"):
            if i.text:
                tmp = i.text.strip()
                if tmp == "RESE":
                    to_reserve = True
                    break
                elif tmp == "SAMT":
                    to_reserve = False
        result.reserved = to_reserve

        # Address magic
        # If there is a sensible payslip location entry, it will result in
        # proper "post/besøksaddresse" later. This code matches LT's behaviour
        # more closely (an employee 'inherits' the address of his/her
        # "primary" workplace.
        # NOTE(review): the literal compared below is spelled 'lønnslipp'
        # (single 's' after 'lønn'); confirm that it matches the SAP data.
        for sub in element.getiterator("Kommunikasjon"):
            txt = ensure_unicode(sub.findtext("Type"), self.encoding)
            val = ensure_unicode(sub.findtext("Verdi"), self.encoding)
            if not (txt and txt == "Sted for lønnslipp" and val):
                continue
            # *some* of the entries have a space here and there,
            # and some contain non-digit data
            digits = val.replace(" ", "")
            # At least five digits are needed so that none of the three
            # slices below is empty (int('') would raise ValueError).
            if not digits.isdigit() or len(digits) < 5:
                continue
            fak, inst, gruppe = [
                int(x) for x in (digits[:2], digits[2:4], digits[4:])
            ]
            result.primary_ou = (cereconf.DEFAULT_INSTITUSJONSNR, fak,
                                 inst, gruppe)

        # We require people to have first/last name.
        if not (result.get_name(result.NAME_FIRST)
                and result.get_name(result.NAME_LAST)):
            if self.logger:
                self.logger.warn(
                    "People must have first and last names. %s skipped",
                    list(result.iterids()))
            return None

        return result

示例#35

0

显示文件

文件： fsxml2object.py 项目： unioslo/cerebrum

 def _pull_name(self, element, attribute_name):
     if element.get(attribute_name):
         value = ensure_unicode(element.get(attribute_name), self.encoding)
         return value
     return None