def process_neo4j(args): # List refnames of all names in the Neo4j database # If there is no refname in db, then the name is handled as a refname. try: t = time.perf_counter() result = Name.get_all_first_names() for record1 in result: first = record1["first"] ref_name = '' names = first.split(" ") for name in names: record2 = None # If there is no refname result = Refname.get_refname(name) for record2 in result: # aname = record2["aname"] bname = record2["bname"] ref_name = ref_name + " " + bname # print("\nName: " + aname + " ---> Refname: " + bname) if not record2: ref_name = ref_name + " " + name print("\nPerson name: " + first + " ---> refname: " + ref_name) elapsed_time = time.perf_counter() - t print("\nTime needed: " + str(elapsed_time) + " seconds") except Exception as err: print("Virhe: {0}".format(err), file=stderr)
def process_neo4j(args): # List some data of the people with given refname try: result = Name.get_people_with_refname(args.refname) for record in result: get_name_data(record["handle"]) except Exception as err: print("Virhe: {0}".format(err), file=stderr)
def process_neo4j(args): ''' Compare a person from owner's set and another person in Taapeli db by the reference names of their first first name ''' try: t = time.perf_counter() print_cnt = 0 u = User() u.userid = args.userid result = u.get_ids_and_refnames_of_people_of_user() for record in result: p = Person() # This id is the unique key of the node uniq_id = record["id"] p.id = uniq_id refname = record["refname"] p.get_person_and_name_data_by_id() # Use the first of first names of the refname as a search key, # E.g. refname = "Matti Johannes" ---> search with "Matti" names = refname.split(" ") tresult = Name.get_ids_of_people_with_refname_and_user_given('Taapeli', names[0]) for trecord in tresult: tp = Person() tp.id = trecord["id"] if print_cnt == 0: print("\nUnique id pairs of people with the same first name in") print("the compared db : the Taapeli db") print("\n" + str(uniq_id) + " : " + str(tp.id)) print_cnt += 1 print("\n\nNumber of id pairs printted out: " + str(print_cnt)) elapsed_time = time.perf_counter() - t print("\nTime needed: " + str(elapsed_time) + " seconds") except Exception as err: print("Virhe: {0}".format(err), file=stderr)
def process_neo4j(args): # List people with the given name try: t = time.perf_counter() u = User() u.userid = args.userid result = u.get_refnames_of_people_of_user() for record in result: p = Person() p.handle = record["handle"] refname = record["refname"] p.get_person_and_name_data() # Use the first name of the refname as a search key, # E.g. refname = "Matti Johannes" ---> search with "Matti" names = refname.split(" ") tresult = Name.get_people_with_refname_and_user_given('Taapeli', names[0]) for trecord in tresult: tp = Person() tp.handle = trecord["handle"] print("\nPerson in the compare db:") call_string = "python3 get_family_with_handle_given.py " + p.handle subprocess.call(call_string, shell=True) print("\nPerson in the Taapeli db:") call_string = "python3 get_family_with_handle_given.py " + tp.handle subprocess.call(call_string, shell=True) print("\n#-------------------------------------------------------------------#\n") elapsed_time = time.perf_counter() - t print("\nTime needed: " + str(elapsed_time) + " seconds") except Exception as err: print("Virhe: {0}".format(err), file=stderr)
def process_neo4j(args): # Get family data of the person global points try: t = time.perf_counter() print_cnt = 0 total_points = [] compared_ids = [] taapeli_ids = [] u = User() u.userid = args.userid result = u.get_ids_and_refnames_of_people_of_user() for record in result: p = Person() # This id is the unique key of the node p.uniq_id = record["id"] refname = record["refname"] p.get_person_and_name_data_by_id() # Use the first name of the refname as a search key, # E.g. refname = "Matti Johannes" ---> search with "Matti" names = refname.split(" ") tresult = Name.get_ids_of_people_with_refname_and_user_given('Taapeli', names[0]) for trecord in tresult: tp = Person() tp.uniq_id = trecord["id"] # The fetching of the family and parents data of the main person is # split to two operations: # # If there are no parents in the db the result of # get_parentin_id() operation is empty, # but the get_family_data operation prints out # the family of the main person. result = p.get_parentin_id() for record in result: main_parents_hlink = record["parentin_hlink"] result = tp.get_parentin_id() for record in result: taapeli_parents_hlink = record["parentin_hlink"] compare_parents_data(main_parents_hlink, taapeli_parents_hlink) compare_family_data(p, tp) total_points.append(points) compared_ids.append(p.uniq_id) taapeli_ids.append(tp.uniq_id) print_cnt += 1 print("\nTotal points # Compared ids # Taapeli ids") print("-----------------------------------------") for i in range(len(total_points)): print("\n " + str(total_points[i]) + " # " + str(compared_ids[i]) + " # " + str(taapeli_ids[i])) print("\nLines printted: " + str(print_cnt)) elapsed_time = time.perf_counter() - t print("\nTime needed: " + str(elapsed_time) + " seconds") except Exception as err: print("Virhe: {0}".format(err), file=stderr)
def list_surnames(): result = Name.get_surnames() for record in result: print(record["surname"])
def handle_people(collection, userid): # Get all the people in the collection people = collection.getElementsByTagName("person") print("*****People*****") counter = 0 # Print detail of each person for person in people: p = Person() if person.hasAttribute("handle"): p.handle = person.getAttribute("handle") if person.hasAttribute("change"): p.change = person.getAttribute("change") if person.hasAttribute("id"): p.id = person.getAttribute("id") if len(person.getElementsByTagName('gender')) == 1: person_gender = person.getElementsByTagName('gender')[0] p.gender = person_gender.childNodes[0].data elif len(person.getElementsByTagName('gender')) > 1: print("Error: More than one gender tag in a person") if len(person.getElementsByTagName('name')) >= 1: for i in range(len(person.getElementsByTagName('name'))): person_name = person.getElementsByTagName('name')[i] pname = Name() if person_name.hasAttribute("alt"): pname.alt = person_name.getAttribute("alt") if person_name.hasAttribute("type"): pname.type = person_name.getAttribute("type") if len(person_name.getElementsByTagName('first')) == 1: person_first = person_name.getElementsByTagName('first')[0] if len(person_first.childNodes) == 1: pname.first = person_first.childNodes[0].data elif len(person_first.childNodes) > 1: print( "Error: More than one child node in a first name of a person" ) elif len(person_name.getElementsByTagName('first')) > 1: print("Error: More than one first name in a person") if len(person_name.getElementsByTagName('surname')) == 1: person_surname = person_name.getElementsByTagName( 'surname')[0] if len(person_surname.childNodes) == 1: pname.surname = person_surname.childNodes[0].data elif len(person_surname.childNodes) > 1: print( "Error: More than one child node in a surname of a person" ) elif len(person_name.getElementsByTagName('surname')) > 1: print("Error: More than one surname in a person") if len(person_name.getElementsByTagName('suffix')) == 1: person_suffix = person_name.getElementsByTagName( 'suffix')[0] pname.suffix = person_suffix.childNodes[0].data elif len(person_name.getElementsByTagName('suffix')) > 1: print("Error: More than one suffix in a person") p.name.append(pname) if len(person.getElementsByTagName('eventref')) >= 1: for i in range(len(person.getElementsByTagName('eventref'))): person_eventref = person.getElementsByTagName('eventref')[i] if person_eventref.hasAttribute("hlink"): p.eventref_hlink.append( person_eventref.getAttribute("hlink")) if person_eventref.hasAttribute("role"): p.eventref_role.append( person_eventref.getAttribute("role")) if len(person.getElementsByTagName('parentin')) >= 1: for i in range(len(person.getElementsByTagName('parentin'))): person_parentin = person.getElementsByTagName('parentin')[i] if person_parentin.hasAttribute("hlink"): p.parentin_hlink.append( person_parentin.getAttribute("hlink")) if len(person.getElementsByTagName('citationref')) >= 1: for i in range(len(person.getElementsByTagName('citationref'))): person_citationref = person.getElementsByTagName( 'citationref')[i] if person_citationref.hasAttribute("hlink"): p.citationref_hlink.append( person_citationref.getAttribute("hlink")) p.save(userid) counter += 1 # There can be so many individs to store that Cypher needs a pause time.sleep(0.1) print("Number of people stored: " + str(counter))