Python DataPoint Examples

Programming Language: Python

Namespace/Package Name: snorkel.types

Class/Type: DataPoint

Examples at hotexamples.com: 22

Python DataPoint - 22 examples found. These are the top rated real world Python examples of snorkel.types.DataPoint extracted from open source projects. You can rate examples to help us improve the quality of examples.

Frequently Used Methods

Show Hide

num_squared(3)

asDict(2)

num(2)

person1_left_tokens(2)

person2_left_tokens(2)

person_lastnames(2)

person_names(2)

d_new(1)

double_num_squared(1)

double_num_squared_plus_1(1)

source_target(1)

Example #1

Show file

    def get_source_target(cand: DataPoint) -> DataPoint:
        """Returnsthe source and target mentioned in the sentence."""
        person_names = []

        source = [token.text for token in cand.doc if token.text in sources]
        target = [token.text for token in cand.doc if token.text in targets]

        try:
            cand.source_target = (source[0], target[0])
        except:
            cand.source_target = (np.nan, np.nan)
        return cand

Example #2

Show file

def get_left_tokens(cand: DataPoint) -> DataPoint:
    """
    Returns tokens in the length 3 window to the left of the person mentions
    """
    # TODO: need to pass window as input params
    window = 3

    end = cand.person1_word_idx[0]
    cand.person1_left_tokens = cand.tokens[0:end][-1 - window:-1]

    end = cand.person2_word_idx[0]
    cand.person2_left_tokens = cand.tokens[0:end][-1 - window:-1]
    return cand

Example #3

Show file

def get_left_tokens(cand: DataPoint) -> DataPoint:
    """
    Returns tokens in the three length window to the left of entity mentions.
    :param cand: A candidate DF.
    :return: Candidate DF with two new columns, each a list of tokens to the left of entities.
    """
    # TODO: make window a parameter
    window = 3
    end = cand.person1_word_idx[0]
    cand.person1_left_tokens = cand.tokens[0:end][1 - window: -1]
    end = cand.person2_word_idx[0]
    cand.person2_left_tokens = cand.tokens[0:end][1 - window: -1]
    return cand

Example #4

Show file

def get_text_between(cand: DataPoint) -> DataPoint:
    """
    Returns the text between the two person mentions in the sentence
    """
    start = cand.person1_word_idx[1] + 1
    end = cand.person2_word_idx[0]
    cand.text_between = " ".join(cand.tokens[start:end])
    return cand

Example #5

Show file

def get_text_between(cand: DataPoint) -> DataPoint:
    """
    Returns the text between two entity mentions.
    :param cand: A candidate DF.
    :return: Candidate DF with new column, text between entity mentions.
    """
    start = cand.person1_word_idx[1] + 1
    end = cand.person2_word_idx[0]
    cand.text_between = " ".join(cand.tokens[start:end])
    return cand

Example #6

Show file

def get_person_last_names(cand: DataPoint) -> DataPoint:
    """
    Returns the last names for the two person mentions in candidate
    """
    cand = get_person_text(cand)
    person1_name, person2_name = cand.person_names
    person1_lastname = (person1_name.split(" ")[-1]
                        if len(person1_name.split(" ")) > 1 else None)
    person2_lastname = (person2_name.split(" ")[-1]
                        if len(person2_name.split(" ")) > 1 else None)
    cand.person_lastnames = [person1_lastname, person2_lastname]
    return cand

Example #7

Show file

def get_person_text(cand: DataPoint) -> DataPoint:
    """
    Returns the text for the two person mentions in candidate
    """
    person_names = []
    for index in [1, 2]:
        field_name = "person{}_word_idx".format(index)
        start = cand[field_name][0]
        end = cand[field_name][1] + 1
        person_names.append(" ".join(cand["tokens"][start:end]))
    cand.person_names = person_names
    return cand

Example #8

Show file

def get_persons_last_name(cand: DataPoint) -> DataPoint:
    """
    Returns entity last names.
    :param cand: A candidate DF.
    :return: Candidate DF with a new column, a list of last names.
    """
    cand = get_person_text(cand)
    person1_name, person2_name = cand.person_names
    person1_last_name = (person1_name.split(" ")[-1] if len(person1_name.split(" ")) > 1 else None)
    person2_last_name = (person2_name.split(" ")[-1] if len(person2_name.split(" ")) > 1 else None)
    cand.person_lastnames = [person1_last_name, person2_last_name]
    return cand

Example #9

Show file

def get_person_text(cand: DataPoint) -> DataPoint:
    """
    Returns the text for the two person mentions in candidate sentence.
    :param cand: A candidate DF.
    :return: Candidate DF with new column, a list of entity names.
    """
    person_names = []
    for index in [1, 2]:
        field_name = "person{j}_word_idx".format(j=index)
        start = cand[field_name][0]
        end = cand[field_name][1] + 1
        person_names.append(" ".join(cand["tokens"][start:end]))
    cand.person_names = person_names
    return cand

Example #10

Show file

 def square(x: DataPoint) -> DataPoint:
     x.num_squared = square_hit_tracker(x.num)
     if x.num == 21:
         return None
     return x

Example #11

Show file

 def mapper_pre_2(x: DataPoint) -> DataPoint:
     x.double_num_squared_plus_1 = x.double_num_squared + 1
     return x

Example #12

Show file

def modify_in_place(x: DataPoint) -> DataPoint:
    x.d["my_key"] = 0
    return Row(num=x.num, d=x.d, d_new=x.d)

Example #13

Show file

def square(x: DataPoint) -> DataPoint:
    fields = x.asDict()
    fields["num_squared"] = x.num**2
    return Row(**fields)

Example #14

Show file

 def square(x: DataPoint) -> DataPoint:
     fields = x.asDict()
     fields["num_squared"] = square_hit_tracker(x.num)
     return Row(**fields)

Example #15

Show file

def copy_features(x: DataPoint) -> DataPoint:
    """Compute x2 + 0.25 for direct comparison to x1."""
    x.x3 = x.x2 + 0.25
    return x

Example #16

Show file

    def get_text_between(cand: DataPoint) -> DataPoint:
        """
        Returns the text between a source-target pair and the text to the left of the source
        """

        source_idx = [token.i for token in cand.doc if token.text in sources]
        target_idx = [token.i for token in cand.doc if token.text in targets]

        try:

            if (len(target_idx) == 1) & (len(source_idx) == 1) & (
                    source_idx[0] < target_idx[0]):
                cand.text_between = cand.doc[source_idx[0]:target_idx[0]]
                cand.text_to_source_left = cand.doc[:source_idx[0]]

            elif (len(target_idx) > 1) & (len(source_idx) == 1):
                for target_index in target_idx:
                    if source_idx[0] < target_index:
                        cand.text_between = cand.doc[
                            source_idx[0]:target_index]
                        cand.text_to_source_left = cand.doc[:source_idx[0]]

            elif (len(source_idx) > 1) & (len(target_idx) == 1):
                for source_index in source_idx:
                    if source_index < target_idx[0]:
                        cand.text_between = cand.doc[
                            source_index:target_idx[0]]
                        cand.text_to_source_left = cand.doc[:source_index]

            elif (len(source_idx) > 1) & (len(target_idx) > 1):
                for source_index in source_idx:
                    for target_index in target_idx:
                        if source_index < target_index:
                            cand.text_between = cand.doc[
                                source_index:target_index]
                            cand.text_to_source_left = cand.doc[:source_index]

            else:
                cand.text_between = 'NaN'
                cand.text_to_source_left = 'NaN'
        except:

            cand.text_between = 'NaN'
            cand.text_to_source_left = 'NaN'

        return cand

Example #17

Show file

def square(x: DataPoint) -> DataPoint:
    x.num_squared = x.num ** 2
    return x

Example #18

Show file

 def square(x: DataPoint) -> DataPoint:
     x.num_squared = square_hit_tracker(x.num)
     return x

Example #19

Show file

 def mapper_pre(x: DataPoint) -> DataPoint:
     x.double_num_squared = 2 * x.num_squared
     return x

Example #20

Show file

File: test_tf_applier.py Project: zuiwufenghua/slice_based_learning

def square_returns_none(x: DataPoint) -> DataPoint:
    if x.num == 2:
        return None
    x.num = x.num**2
    return x

Example #21

Show file

def modify_in_place(x: DataPoint) -> DataPoint:
    x.d["my_key"] = 0
    x.d_new = x.d
    return x

Example #22

Show file

def combine_text(x: DataPoint) -> DataPoint:
    x.text = f"{x.title} {x.article}"
    return x