Exemplo n.º 1
0
def process_neo4j(args):

    # List refnames of all names in the Neo4j database
    # If there is no refname in db, then the name is handled as a refname.
    try:

        t = time.perf_counter()

        result = Name.get_all_first_names()
        for record1 in result:
            first = record1["first"]

            ref_name = ''
            names = first.split(" ")
            for name in names:
                record2 = None  # If there is no refname
                result = Refname.get_refname(name)

                for record2 in result:
                    #                    aname = record2["aname"]
                    bname = record2["bname"]
                    ref_name = ref_name + " " + bname
                    # print("\nName: " + aname + " ---> Refname: " + bname)

                if not record2:
                    ref_name = ref_name + " " + name

            print("\nPerson name: " + first + " ---> refname: " + ref_name)

        elapsed_time = time.perf_counter() - t
        print("\nTime needed: " + str(elapsed_time) + " seconds")

    except Exception as err:
        print("Virhe: {0}".format(err), file=stderr)
def process_neo4j(args):

    # List some data of the people with given refname
    try:
    
        result = Name.get_people_with_refname(args.refname)
        for record in result:
            get_name_data(record["handle"])

    except Exception as err:
        print("Virhe: {0}".format(err), file=stderr)
def process_neo4j(args):
    ''' 
        Compare a person from owner's set and another person in Taapeli db
        by the reference names of their first first name 
    '''
    try:
    
        t = time.perf_counter()
        print_cnt = 0

        u = User()
        u.userid = args.userid
        result = u.get_ids_and_refnames_of_people_of_user()
        for record in result:
            p = Person()
            # This id is the unique key of the node
            uniq_id = record["id"]
            p.id = uniq_id
            refname = record["refname"]
            p.get_person_and_name_data_by_id()

            # Use the first of first names of the refname as a search key,
            # E.g. refname = "Matti Johannes" ---> search with "Matti"
            names = refname.split(" ")
                
            tresult = Name.get_ids_of_people_with_refname_and_user_given('Taapeli', names[0])
            for trecord in tresult:
                tp = Person()
                tp.id = trecord["id"]
            
                if print_cnt == 0:
                    print("\nUnique id pairs of people with the same first name in")
                    print("the compared db : the Taapeli db")
                
                print("\n" + str(uniq_id) + " : " + str(tp.id))
                print_cnt += 1
          
        print("\n\nNumber of id pairs printted out: " + str(print_cnt))
        elapsed_time = time.perf_counter() - t
        print("\nTime needed: " + str(elapsed_time) + " seconds")

    except Exception as err:
        print("Virhe: {0}".format(err), file=stderr)
Exemplo n.º 4
0
def process_neo4j(args):

    # List people with the given name
    try:
    
        t = time.perf_counter()

        u = User()
        u.userid = args.userid
        result = u.get_refnames_of_people_of_user()
        for record in result:
            p = Person()
            p.handle = record["handle"]
            refname = record["refname"]
            p.get_person_and_name_data()

            # Use the first name of the refname as a search key,
            # E.g. refname = "Matti Johannes" ---> search with "Matti"
            names = refname.split(" ")
                
            tresult = Name.get_people_with_refname_and_user_given('Taapeli', names[0])
            for trecord in tresult:
                tp = Person()
                tp.handle = trecord["handle"]
                
                print("\nPerson in the compare db:")
                call_string = "python3 get_family_with_handle_given.py " + p.handle
                subprocess.call(call_string, shell=True)
                
                print("\nPerson in the Taapeli db:")
                call_string = "python3 get_family_with_handle_given.py " + tp.handle
                subprocess.call(call_string, shell=True)
                
                print("\n#-------------------------------------------------------------------#\n")
                                   
        elapsed_time = time.perf_counter() - t
        print("\nTime needed: " + str(elapsed_time) + " seconds")

    except Exception as err:
        print("Virhe: {0}".format(err), file=stderr)
Exemplo n.º 5
0
def process_neo4j(args):

    # Get family data of the person
    global points
    
    try:    
        t = time.perf_counter()
        print_cnt = 0
        
        total_points = []
        compared_ids = []
        taapeli_ids = []

        u = User()
        u.userid = args.userid
        result = u.get_ids_and_refnames_of_people_of_user()
        for record in result:
            p = Person()
            # This id is the unique key of the node
            p.uniq_id = record["id"]
            refname = record["refname"]
            p.get_person_and_name_data_by_id()

            # Use the first name of the refname as a search key,
            # E.g. refname = "Matti Johannes" ---> search with "Matti"
            names = refname.split(" ")
                
            tresult = Name.get_ids_of_people_with_refname_and_user_given('Taapeli', names[0])
            for trecord in tresult:
                tp = Person()
                tp.uniq_id = trecord["id"]
                
                # The fetching of the family and parents data of the main person is
                # split to two operations:
                #
                # If there are no parents in the db the result of 
                # get_parentin_id() operation is empty,
                # but the get_family_data operation prints out
                # the family of the main person.
                result = p.get_parentin_id()            
                for record in result:
                    main_parents_hlink = record["parentin_hlink"]
                    
                    result = tp.get_parentin_id()            
                    for record in result:
                        taapeli_parents_hlink = record["parentin_hlink"]
                        compare_parents_data(main_parents_hlink, taapeli_parents_hlink)
        
                compare_family_data(p, tp)
                
                total_points.append(points)
                compared_ids.append(p.uniq_id)
                taapeli_ids.append(tp.uniq_id)
                print_cnt += 1
                
        print("\nTotal points # Compared ids # Taapeli ids")
        print("-----------------------------------------")
        for i in range(len(total_points)):
            print("\n  " + str(total_points[i]) + "   #   " + str(compared_ids[i]) + "   #   " + str(taapeli_ids[i]))

        print("\nLines printted: " + str(print_cnt))
                
        elapsed_time = time.perf_counter() - t
        print("\nTime needed: " + str(elapsed_time) + " seconds")

    except Exception as err:
        print("Virhe: {0}".format(err), file=stderr)
Exemplo n.º 6
0
def list_surnames():
    result = Name.get_surnames()

    for record in result:
        print(record["surname"])
Exemplo n.º 7
0
def handle_people(collection, userid):
    # Get all the people in the collection
    people = collection.getElementsByTagName("person")

    print("*****People*****")
    counter = 0

    # Print detail of each person
    for person in people:

        p = Person()

        if person.hasAttribute("handle"):
            p.handle = person.getAttribute("handle")
        if person.hasAttribute("change"):
            p.change = person.getAttribute("change")
        if person.hasAttribute("id"):
            p.id = person.getAttribute("id")

        if len(person.getElementsByTagName('gender')) == 1:
            person_gender = person.getElementsByTagName('gender')[0]
            p.gender = person_gender.childNodes[0].data
        elif len(person.getElementsByTagName('gender')) > 1:
            print("Error: More than one gender tag in a person")

        if len(person.getElementsByTagName('name')) >= 1:
            for i in range(len(person.getElementsByTagName('name'))):
                person_name = person.getElementsByTagName('name')[i]
                pname = Name()
                if person_name.hasAttribute("alt"):
                    pname.alt = person_name.getAttribute("alt")
                if person_name.hasAttribute("type"):
                    pname.type = person_name.getAttribute("type")

                if len(person_name.getElementsByTagName('first')) == 1:
                    person_first = person_name.getElementsByTagName('first')[0]
                    if len(person_first.childNodes) == 1:
                        pname.first = person_first.childNodes[0].data
                    elif len(person_first.childNodes) > 1:
                        print(
                            "Error: More than one child node in a first name of a person"
                        )
                elif len(person_name.getElementsByTagName('first')) > 1:
                    print("Error: More than one first name in a person")

                if len(person_name.getElementsByTagName('surname')) == 1:
                    person_surname = person_name.getElementsByTagName(
                        'surname')[0]
                    if len(person_surname.childNodes) == 1:
                        pname.surname = person_surname.childNodes[0].data
                    elif len(person_surname.childNodes) > 1:
                        print(
                            "Error: More than one child node in a surname of a person"
                        )
                elif len(person_name.getElementsByTagName('surname')) > 1:
                    print("Error: More than one surname in a person")

                if len(person_name.getElementsByTagName('suffix')) == 1:
                    person_suffix = person_name.getElementsByTagName(
                        'suffix')[0]
                    pname.suffix = person_suffix.childNodes[0].data
                elif len(person_name.getElementsByTagName('suffix')) > 1:
                    print("Error: More than one suffix in a person")

                p.name.append(pname)

        if len(person.getElementsByTagName('eventref')) >= 1:
            for i in range(len(person.getElementsByTagName('eventref'))):
                person_eventref = person.getElementsByTagName('eventref')[i]
                if person_eventref.hasAttribute("hlink"):
                    p.eventref_hlink.append(
                        person_eventref.getAttribute("hlink"))
                if person_eventref.hasAttribute("role"):
                    p.eventref_role.append(
                        person_eventref.getAttribute("role"))

        if len(person.getElementsByTagName('parentin')) >= 1:
            for i in range(len(person.getElementsByTagName('parentin'))):
                person_parentin = person.getElementsByTagName('parentin')[i]
                if person_parentin.hasAttribute("hlink"):
                    p.parentin_hlink.append(
                        person_parentin.getAttribute("hlink"))

        if len(person.getElementsByTagName('citationref')) >= 1:
            for i in range(len(person.getElementsByTagName('citationref'))):
                person_citationref = person.getElementsByTagName(
                    'citationref')[i]
                if person_citationref.hasAttribute("hlink"):
                    p.citationref_hlink.append(
                        person_citationref.getAttribute("hlink"))

        p.save(userid)
        counter += 1

        # There can be so many individs to store that Cypher needs a pause
        time.sleep(0.1)

    print("Number of people stored: " + str(counter))