Beispiel #1
0
def Is_id_or_kw(scanner_params):
    """Recognise an identifier or a keyword at the scanner's base position.

    Args:
        scanner_params: 5-item sequence; only the first item (the source
            file object) and the fourth (``base_position``) are used here.

    Returns:
        ``(True, info)`` when the first character is a letter. ``info`` has
        the keys ``'lexeme'`` (``'Id'``, or the value returned by the first
        keyword automaton that accepts the text), ``'offset'`` (count of
        characters belonging to the lexeme) and ``'value'``.
        ``(False, None)`` otherwise, after seeking the file back to
        ``base_position``.
    """
    source, _, _, start, _ = scanner_params

    head = source.read(1).lower()
    if not is_letter(head):
        source.seek(start)
        return False, None

    # The first letter is already accepted; extend over letters and digits.
    length = 1
    while True:
        symbol = source.read(1).lower()
        if not (is_digit(symbol) or is_letter(symbol)):
            break
        length += 1

    lexeme = 'Id'
    text = get_detected_value(source, start, length)

    # Every callable attribute of ``key_words`` is tried as a keyword
    # automaton; the first one reporting success decides the lexeme.
    for recogniser in lexems_automats.key_words.__dict__.values():
        if not callable(recogniser):
            continue
        matched, keyword = recogniser(text)
        if matched:
            lexeme = keyword
            text = keyword.lower()
            break

    return True, {
        'lexeme': lexeme,
        'offset': length,
        'value': text
    }
Beispiel #2
0
def Is_hex_int(scanner_params):
    """Recognise a hexadecimal integer: hex digits terminated by ``h``.

    Args:
        scanner_params: 5-item sequence; only the first item (the source
            file object) and the fourth (``base_position``) are used here.

    Returns:
        ``(True, info)`` with ``'lexeme': 'Int'``, ``'offset'`` and
        ``'value'`` when the literal is well formed and the character after
        the ``h`` is not a letter, digit or colon.
        ``(False, error_info)`` when such a character follows the ``h``.
        ``(False, None)`` when the text does not start with a hex digit or
        the run of hex digits is not closed by ``h``.
    """
    source, _, _, start, _ = scanner_params

    symbol = source.read(1).lower()
    if not is_hex_digit(symbol):
        return False, None

    length = 1
    while True:
        symbol = source.read(1).lower()
        if is_hex_digit(symbol):
            length += 1
            continue
        if symbol != 'h':
            # Digits not terminated by the 'h' suffix: not a hex literal.
            return False, None
        length += 1
        break

    # Look at the character following the suffix before fetching the text.
    follower = source.read(1).lower()
    text = get_detected_value(source, start, length)

    if is_letter(follower) or is_digit(follower) or is_colon(follower):
        return False, {
            'lexeme': 'Error',
            'error': "HexInt integer's form is wrong",
            'value': text + follower
        }

    return True, {
        'lexeme': 'Int',
        'offset': length,
        'value': text
    }
Beispiel #3
0
def is_exponenta(file, offset):
    """Scan the exponent part of a real literal (the text following ``e``).

    Accepts at most one leading ``+``/``-`` and then a run of digits. The
    sign is only allowed before any digit has been seen.

    Args:
        file: object whose ``read(1)`` yields the next character and an
            empty string at end of input.
        offset: running character count; it is incremented once for every
            character read here, including the look-ahead character that
            terminates the scan.

    Returns:
        ``(digit_found, offset)`` where ``digit_found`` tells whether at
        least one digit was read and ``offset`` is the updated count.
    """
    # A tuple is used instead of the string '+-' because ``'' in '+-'`` is
    # True: the empty string returned at end of input would otherwise be
    # taken for a sign and inflate ``offset`` by one extra character.
    signs = ('+', '-')

    char = file.read(1).lower()
    offset += 1

    sign_seen = False
    digit_seen = False
    while is_digit(char) or (char in signs and not sign_seen
                             and not digit_seen):
        if char in signs:
            sign_seen = True
        if is_digit(char):
            digit_seen = True
        char = file.read(1).lower()
        offset += 1

    return digit_seen, offset
Beispiel #4
0
def Is_real(scanner_params):
    """Recognise a real-number literal at the scanner's base position.

    Shapes handled by the code below:
      * digits ``e`` exponent
      * digits ``.`` [digits] [``e`` exponent]
      * ``.`` digits [``e`` exponent]

    Args:
        scanner_params: 5-item sequence; only the first item (the source
            file object) and the fourth (``base_position``) are used here.

    Returns:
        ``(True, info)`` with ``'lexeme': 'Real'``, ``'offset'`` and
        ``'value'`` for a well-formed literal.
        ``(False, error_info)`` with ``'lexeme': 'Error'`` when the text
        starts like a real number but is malformed.
        ``(False, None)`` when the text is not a real number at all.
    """
    source, _, _, start, _ = scanner_params

    symbol = source.read(1).lower()
    consumed = 1

    if is_digit(symbol):
        # Integer part; on exit ``symbol`` is the first non-digit and has
        # already been counted in ``consumed``.
        while is_digit(symbol):
            symbol = source.read(1).lower()
            consumed += 1

        if symbol == 'e':
            return _real_exponent_tail(source, start, consumed, True)

        if symbol != '.':
            # Plain digits are left for the integer automata.
            return False, None

        # Optional fractional digits after the dot.
        symbol = source.read(1).lower()
        consumed += 1
        while is_digit(symbol):
            symbol = source.read(1).lower()
            consumed += 1

        if symbol == 'e':
            return _real_exponent_tail(source, start, consumed, False)

        # Drop the look-ahead character and re-read the literal text.
        consumed -= 1
        source.seek(start)
        text = source.read(consumed).lower()
        follower = source.read(1).lower()
        if is_letter(follower) or follower == '.':
            return _real_form_error(text + follower)
        return True, {
            'lexeme': 'Real',
            'offset': consumed,
            'value': text
        }

    if symbol != '.':
        return False, None

    # Literal starting with a dot: at least one digit must follow.
    symbol = source.read(1).lower()
    consumed += 1
    if not is_digit(symbol):
        return _real_form_error('.' + symbol)

    while is_digit(symbol):
        symbol = source.read(1).lower()
        consumed += 1

    if symbol == 'e':
        return _real_exponent_tail(source, start, consumed, False)

    if is_letter(symbol):
        # The offending letter is kept inside the reported value.
        return _real_form_error(
            get_detected_value(source, start, consumed))

    consumed -= 1
    text = get_detected_value(source, start, consumed)
    return True, {
        'lexeme': 'Real',
        'offset': consumed,
        'value': text
    }


def _real_form_error(value):
    """Build the ``(False, error_info)`` result for a malformed real."""
    return False, {
        'lexeme': 'Error',
        'error': 'Real number form',
        'value': value
    }


def _real_exponent_tail(source, start, consumed, hex_fallback):
    """Finish recognising a real number once the ``e`` has been read.

    ``hex_fallback`` enables the extra check used for the ``digits e``
    shape: when no exponent is formed and the next character is a hex
    digit or ``h``, ``(False, None)`` is returned instead of an error.
    """
    formed, consumed = is_exponenta(source, consumed)

    # ``is_exponenta`` also counted its terminating look-ahead character.
    consumed -= 1
    text = get_detected_value(source, start, consumed)

    if formed:
        follower = source.read(1).lower()
        if is_letter(follower) or follower == '.':
            return _real_form_error(text + follower)
        return True, {
            'lexeme': 'Real',
            'offset': consumed,
            'value': text
        }

    if hex_fallback:
        follower = source.read(1).lower()
        if is_hex_digit(follower) or follower == 'h':
            return False, None

    return _real_form_error(text)
Beispiel #5
0
def Is__old_dec_int_or_label(scanner_params):
    """Older recogniser for a decimal integer or a numeric label.

    A run of digits, optionally followed by ``d``, is an ``Int``. A run of
    digits followed (possibly after split characters) by a colon is a
    ``Label``.

    Args:
        scanner_params: 5-item sequence; only the first item (the source
            file object) and the fourth (``base_position``) are used here.

    Returns:
        ``(True, info)`` with ``'lexeme'``, ``'offset'``, ``'value'`` and
        ``'additional_rows'`` for an accepted integer or label.
        ``(False, error_info)`` when digits were read but the form is wrong.
        ``(False, None)`` when the first character is not a digit.
    """
    file, _, _, base_position, _ = scanner_params
    additional_rows = 0

    char = file.read(1).lower()
    if not is_digit(char):
        return False, None

    local_offset = 1
    split_offset = 0
    local_lexeme = 'Int'
    while True:
        char = file.read(1).lower()
        if char == '':
            # End of input: read(1) keeps returning '' from here on, so
            # stop explicitly instead of relying on the predicates below
            # to reject the empty string (mirrors Is_dec_int_or_label).
            file.seek(base_position + local_offset)
            break
        if is_digit(char) and split_offset == 0:
            local_offset += 1
        elif is_split(char):
            split_offset += 1
            if is_new_line(char):
                additional_rows += 1
        else:
            if char == 'd':
                local_offset += 1
                file.seek(base_position + local_offset)
            elif is_colon(char):
                local_offset += 1
                local_lexeme = 'Label'
                file.seek(base_position + local_offset + split_offset)
            else:
                file.seek(base_position + local_offset)
            break

    # Look-ahead character used to validate what follows the lexeme.
    afterchar = file.read(1).lower() if not is_new_line(char) else ''
    if local_lexeme == 'Int':
        value = get_detected_value(file, base_position, local_offset)
    else:
        value = get_detected_value(file, base_position,
                                   local_offset + split_offset, True)

    if local_lexeme == 'Int' and not (is_letter(afterchar)
                                      or is_digit(afterchar)):
        return True, {
            'lexeme': local_lexeme,
            'offset': local_offset,
            'value': value,
            'additional_rows': additional_rows
        }
    elif local_lexeme == 'Label' and (is_split(afterchar)
                                      or afterchar == ';'):
        # NOTE(review): the reason for the "+ 2" is not visible in this
        # file; kept as-is.
        return True, {
            'lexeme': local_lexeme,
            'offset': local_offset + 2,
            'value': value,
            'additional_rows': additional_rows
        }
    else:
        return False, {
            'lexeme': 'Error',
            'error': "Dec integer's or label's forms are wrong",
            'value': value + char,
            'additional_rows': 0
        }
Beispiel #6
0
def Is_dec_int_or_label(scanner_params):
    """Recognise a decimal integer or a numeric label.

    A run of digits (optionally closed by ``d``) is an ``Int``; a run of
    digits followed, possibly after split characters, by a colon is a
    ``Label``. Split characters after the digits are counted in the offset.

    Args:
        scanner_params: 5-item sequence; only the first item (the source
            file object) and the fourth (``base_position``) are used here.

    Returns:
        ``(True, info)`` with ``'lexeme'``, ``'offset'``, ``'value'`` (tabs,
        spaces and newlines removed) and ``'additional_rows'`` on success.
        ``(False, error_info)`` when digits were read but the form is wrong.
        ``(False, None)`` when the first character is not a digit.
    """
    source, _, _, start, _ = scanner_params

    current = source.read(1).lower()
    if not is_digit(current):
        return False, None

    kind = 'Int'
    length = 1
    newlines = 0
    split_seen = False
    label_after_split = False

    while True:
        current = source.read(1).lower()
        if current == '':
            # End of input.
            break

        # Digits extend the number only until the first split character;
        # split characters themselves are always absorbed.
        if (is_digit(current) and not split_seen) or is_split(current):
            if is_split(current):
                split_seen = True
            if current == '\n':
                newlines += 1
            length += 1
            continue

        if current == 'd':  # explicit decimal suffix
            length += 1
        elif is_colon(current):
            length += 1
            kind = 'Label'
            label_after_split = split_seen
        source.seek(start + length + newlines)
        break

    if is_new_line(current):
        follower = ''
    else:
        follower = source.read(1).lower()

    text = get_detected_value(source,
                              start,
                              length,
                              detect_with_split=label_after_split)

    if kind == 'Int':
        # Only an integer with the 'd' suffix is rejected when a letter or
        # digit follows it.
        accepted = not (text.endswith('d')
                        and (is_letter(follower) or is_digit(follower)))
    else:
        accepted = kind == 'Label' and (is_split(follower)
                                        or follower == ';'
                                        or is_letter(follower))

    if not accepted:
        return False, {
            'lexeme': 'Error',
            'error': "Dec integer's or label's forms are wrong",
            'value': text + current,
            'additional_rows': 0
        }

    for blank in ('\t', ' ', '\n'):
        text = text.replace(blank, '')
    return True, {
        'lexeme': kind,
        'offset': length + newlines,
        'value': text,
        'additional_rows': newlines
    }