Ejemplo n.º 1
0
def check_chunked_overflow(name, col):
    """Raise ``ValueError`` unless ``col`` consists of exactly one chunk.

    Parameters
    ----------
    name : str
        Column name; used only when formatting the error message.
    col
        Column object exposing ``num_chunks`` and ``type``.

    Raises
    ------
    ValueError
        When ``col.num_chunks`` is not 1. Binary and string columns get a
        message about the 2GB Feather binary column limit; any other type
        gets a generic "was chunked on conversion" message.
    """
    # Single-chunk columns are the only accepted case.
    if col.num_chunks == 1:
        return

    if col.type not in (ext.binary(), ext.string()):
        # TODO(wesm): Not sure when else this might be reached
        message = ("Column '{0}' of type {1} was chunked on conversion "
                   "to Arrow and cannot be currently written to "
                   "Feather format".format(name, str(col.type)))
    else:
        message = ("Column '{0}' exceeds 2GB maximum capacity of "
                   "a Feather binary column. This restriction may be "
                   "lifted in the future".format(name))

    raise ValueError(message)
Ejemplo n.º 2
0
Archivo: feather.py Proyecto: rok/arrow
def check_chunked_overflow(col):
    """Raise ``ValueError`` unless ``col.data`` consists of exactly one chunk.

    Parameters
    ----------
    col
        Column object exposing ``data.num_chunks``, ``type`` and ``name``.

    Raises
    ------
    ValueError
        When ``col.data.num_chunks`` is not 1. Binary and string columns get
        a message about the 2GB Feather binary column limit; any other type
        gets a generic "was chunked on conversion" message.
    """
    # Single-chunk columns are the only accepted case.
    if col.data.num_chunks == 1:
        return

    if col.type not in (ext.binary(), ext.string()):
        # TODO(wesm): Not sure when else this might be reached
        message = ("Column '{0}' of type {1} was chunked on conversion "
                   "to Arrow and cannot be currently written to "
                   "Feather format".format(col.name, str(col.type)))
    else:
        message = ("Column '{0}' exceeds 2GB maximum capacity of "
                   "a Feather binary column. This restriction may be "
                   "lifted in the future".format(col.name))

    raise ValueError(message)
Ejemplo n.º 3
0
    'is_num',
    'is_possible_cat',
    'is_possible_feature',
    'is_complex',
)

# Canonical Arrow data-type instances used by this module. The asserts run at
# import time and check that an Arrow type's string form agrees with the
# corresponding type-name constant.
_ARROW_NULL_TYPE: DataType = null()

_ARROW_BOOL_TYPE: DataType = bool_()
# Bind the string form in its own statement instead of with a walrus inside
# the assert: assert statements are removed under ``python -O``, which would
# leave this module-level name unbound.
__arrow_bool_type_str = str(_ARROW_BOOL_TYPE)
assert __arrow_bool_type_str == bool.__name__
assert _BOOL_TYPE.startswith(__arrow_bool_type_str)

_ARROW_STR_TYPE: DataType = string()
assert str(_ARROW_STR_TYPE) == _STR_TYPE

# NOTE(review): -1 presumably selects variable-length binary - confirm
# against the documentation of binary().
_ARROW_BINARY_TYPE: DataType = binary(-1)
assert str(_ARROW_BINARY_TYPE) == _BINARY_TYPE

_ARROW_INT_TYPE: DataType = int64()
_ARROW_DOUBLE_TYPE: DataType = float64()

_ARROW_DATE_TYPE: DataType = date32()
# Nanosecond unit, no time zone.
_ARROW_TIMESTAMP_TYPE: DataType = timestamp(unit='ns', tz=None)


def is_float(arrow_type: DataType, /) -> bool:
    """Tell whether ``arrow_type`` passes ``is_floating`` or ``is_decimal``."""
    floating = is_floating(arrow_type)
    # Only consult the decimal predicate when the floating check is falsy.
    return floating if floating else is_decimal(arrow_type)


def is_num(arrow_type: DataType, /) -> bool:
Ejemplo n.º 4
0
    _VECTOR_TYPE, \
    _DECIMAL_TYPE_PREFIX, \
    _ARRAY_TYPE_PREFIX, _MAP_TYPE_PREFIX, _STRUCT_TYPE_PREFIX

# Canonical Arrow data-type instances used by this module. The asserts run at
# import time and check that an Arrow type's string form agrees with the
# corresponding type-name constant.
_ARROW_NULL_TYPE = null()
assert str(_ARROW_NULL_TYPE) == _NULL_TYPE

_ARROW_BOOL_TYPE = bool_()
# The Arrow bool type's string form must equal Python's ``bool`` name and be
# a prefix of _BOOL_TYPE.
__arrow_bool_type_str = str(_ARROW_BOOL_TYPE)
assert __arrow_bool_type_str == bool.__name__
assert _BOOL_TYPE.startswith(__arrow_bool_type_str)

_ARROW_STR_TYPE = string()
assert str(_ARROW_STR_TYPE) == _STR_TYPE

# NOTE(review): -1 presumably selects variable-length binary - confirm
# against the documentation of binary().
_ARROW_BINARY_TYPE = binary(-1)
assert str(_ARROW_BINARY_TYPE) == _BINARY_TYPE

_ARROW_INT_TYPE = int64()
_ARROW_DOUBLE_TYPE = float64()

_ARROW_DATE_TYPE = date32()
# Nanosecond unit, no time zone.
_ARROW_TIMESTAMP_TYPE = timestamp(unit='ns', tz=None)


def is_float(arrow_type):
    """Tell whether ``arrow_type`` passes ``is_floating`` or ``is_decimal``."""
    floating = is_floating(arrow_type)
    # Only consult the decimal predicate when the floating check is falsy.
    return floating if floating else is_decimal(arrow_type)


def is_num(arrow_type):
    """Tell whether ``arrow_type`` passes ``is_integer`` or ``is_float``."""
    integral = is_integer(arrow_type)
    # Only fall through to the float check when the integer check is falsy.
    return integral if integral else is_float(arrow_type)