(xlntpyarrow) check builder append return status and use double cell values instead of long double

pull/243/head
Thomas Fussell 2017-09-28 09:05:23 -04:00
parent 75de03745b
commit 0dcd56ebc9
2 changed files with 38 additions and 31 deletions

View File

@ -170,7 +170,7 @@ void open_file(xlnt::streaming_workbook_reader &reader, pybind11::object file)
template<typename T> template<typename T>
T cell_value(xlnt::cell cell) T cell_value(xlnt::cell cell)
{ {
return static_cast<T>(cell.value<long double>()); return static_cast<T>(cell.value<double>());
} }
// from https://stackoverflow.com/questions/1659440/32-bit-to-16-bit-floating-point-conversion // from https://stackoverflow.com/questions/1659440/32-bit-to-16-bit-floating-point-conversion
@ -186,144 +186,151 @@ std::uint16_t float_to_half(float f)
void append_cell_value(arrow::ArrayBuilder *builder, arrow::Type::type type, xlnt::cell cell) void append_cell_value(arrow::ArrayBuilder *builder, arrow::Type::type type, xlnt::cell cell)
{ {
const status = arrow::Status::OK();
switch (type) switch (type)
{ {
case arrow::Type::NA: case arrow::Type::NA:
break; break;
case arrow::Type::BOOL: case arrow::Type::BOOL:
static_cast<arrow::BooleanBuilder *>(builder) status = static_cast<arrow::BooleanBuilder *>(builder)
->Append(cell.value<bool>()); ->Append(cell.value<bool>());
break; break;
case arrow::Type::UINT8: case arrow::Type::UINT8:
static_cast<arrow::UInt8Builder *>(builder) status = static_cast<arrow::UInt8Builder *>(builder)
->Append(cell_value<std::uint8_t>(cell)); ->Append(cell_value<std::uint8_t>(cell));
break; break;
case arrow::Type::INT8: case arrow::Type::INT8:
static_cast<arrow::Int8Builder *>(builder) status = static_cast<arrow::Int8Builder *>(builder)
->Append(cell_value<std::uint8_t>(cell)); ->Append(cell_value<std::uint8_t>(cell));
break; break;
case arrow::Type::UINT16: case arrow::Type::UINT16:
static_cast<arrow::UInt16Builder *>(builder) status = static_cast<arrow::UInt16Builder *>(builder)
->Append(cell_value<std::uint16_t>(cell)); ->Append(cell_value<std::uint16_t>(cell));
break; break;
case arrow::Type::INT16: case arrow::Type::INT16:
static_cast<arrow::Int16Builder *>(builder) status = static_cast<arrow::Int16Builder *>(builder)
->Append(cell_value<std::int16_t>(cell)); ->Append(cell_value<std::int16_t>(cell));
break; break;
case arrow::Type::UINT32: case arrow::Type::UINT32:
static_cast<arrow::UInt32Builder *>(builder) status = static_cast<arrow::UInt32Builder *>(builder)
->Append(cell_value<std::uint32_t>(cell)); ->Append(cell_value<std::uint32_t>(cell));
break; break;
case arrow::Type::INT32: case arrow::Type::INT32:
static_cast<arrow::Int32Builder *>(builder) status = static_cast<arrow::Int32Builder *>(builder)
->Append(cell_value<std::int32_t>(cell)); ->Append(cell_value<std::int32_t>(cell));
break; break;
case arrow::Type::UINT64: case arrow::Type::UINT64:
static_cast<arrow::UInt64Builder *>(builder) status = static_cast<arrow::UInt64Builder *>(builder)
->Append(cell_value<std::uint64_t>(cell)); ->Append(cell_value<std::uint64_t>(cell));
break; break;
case arrow::Type::INT64: case arrow::Type::INT64:
static_cast<arrow::Int64Builder *>(builder) status = static_cast<arrow::Int64Builder *>(builder)
->Append(cell_value<std::int64_t>(cell)); ->Append(cell_value<std::int64_t>(cell));
break; break;
case arrow::Type::HALF_FLOAT: case arrow::Type::HALF_FLOAT:
static_cast<arrow::HalfFloatBuilder *>(builder) status = static_cast<arrow::HalfFloatBuilder *>(builder)
->Append(float_to_half(cell_value<float>(cell))); ->Append(float_to_half(cell_value<float>(cell)));
break; break;
case arrow::Type::FLOAT: case arrow::Type::FLOAT:
static_cast<arrow::FloatBuilder *>(builder) status = static_cast<arrow::FloatBuilder *>(builder)
->Append(cell_value<float>(cell)); ->Append(cell_value<float>(cell));
break; break;
case arrow::Type::DOUBLE: case arrow::Type::DOUBLE:
static_cast<arrow::DoubleBuilder *>(builder) status = static_cast<arrow::DoubleBuilder *>(builder)
->Append(cell_value<long double>(cell)); ->Append(cell_value<double>(cell));
break; break;
case arrow::Type::STRING: case arrow::Type::STRING:
static_cast<arrow::StringBuilder *>(builder) status = static_cast<arrow::StringBuilder *>(builder)
->Append(cell.value<std::string>()); ->Append(cell.value<std::string>());
break; break;
case arrow::Type::BINARY: case arrow::Type::BINARY:
static_cast<arrow::BinaryBuilder *>(builder) status = static_cast<arrow::BinaryBuilder *>(builder)
->Append(cell.value<std::string>()); ->Append(cell.value<std::string>());
break; break;
case arrow::Type::FIXED_SIZE_BINARY: case arrow::Type::FIXED_SIZE_BINARY:
static_cast<arrow::FixedSizeBinaryBuilder *>(builder) status = static_cast<arrow::FixedSizeBinaryBuilder *>(builder)
->Append(cell.value<std::string>()); ->Append(cell.value<std::string>());
break; break;
case arrow::Type::DATE32: case arrow::Type::DATE32:
static_cast<arrow::Date32Builder *>(builder) status = static_cast<arrow::Date32Builder *>(builder)
->Append(cell_value<arrow::Date32Type::c_type>(cell)); ->Append(cell_value<arrow::Date32Type::c_type>(cell));
break; break;
case arrow::Type::DATE64: case arrow::Type::DATE64:
static_cast<arrow::Date64Builder *>(builder) status = static_cast<arrow::Date64Builder *>(builder)
->Append(cell_value<arrow::Date64Type::c_type>(cell)); ->Append(cell_value<arrow::Date64Type::c_type>(cell));
break; break;
case arrow::Type::TIMESTAMP: case arrow::Type::TIMESTAMP:
static_cast<arrow::TimestampBuilder *>(builder) status = static_cast<arrow::TimestampBuilder *>(builder)
->Append(cell_value<arrow::TimestampType::c_type>(cell)); ->Append(cell_value<arrow::TimestampType::c_type>(cell));
break; break;
case arrow::Type::TIME32: case arrow::Type::TIME32:
static_cast<arrow::Time32Builder *>(builder) status = static_cast<arrow::Time32Builder *>(builder)
->Append(cell_value<arrow::Time32Type::c_type>(cell)); ->Append(cell_value<arrow::Time32Type::c_type>(cell));
break; break;
case arrow::Type::TIME64: case arrow::Type::TIME64:
static_cast<arrow::Time64Builder *>(builder) status = static_cast<arrow::Time64Builder *>(builder)
->Append(cell_value<arrow::Time64Type::c_type>(cell)); ->Append(cell_value<arrow::Time64Type::c_type>(cell));
break; break;
/* /*
case arrow::Type::INTERVAL: case arrow::Type::INTERVAL:
static_cast<arrow::IntervalBuilder *>(builder) status = static_cast<arrow::IntervalBuilder *>(builder)
->Append(cell_value<std::int64_t>(cell)); ->Append(cell_value<std::int64_t>(cell));
break; break;
case arrow::Type::DECIMAL: case arrow::Type::DECIMAL:
static_cast<arrow::DecimalBuilder *>(builder) status = static_cast<arrow::DecimalBuilder *>(builder)
->Append(cell.value<std::string>()); ->Append(cell.value<std::string>());
break; break;
case arrow::Type::LIST: case arrow::Type::LIST:
static_cast<arrow::ListBuilder *>(builder) status = static_cast<arrow::ListBuilder *>(builder)
->Append(cell.value<std::string>()); ->Append(cell.value<std::string>());
break; break;
case arrow::Type::STRUCT: case arrow::Type::STRUCT:
static_cast<arrow::StructBuilder *>(builder) status = static_cast<arrow::StructBuilder *>(builder)
->Append(cell.value<std::string>()); ->Append(cell.value<std::string>());
break; break;
case arrow::Type::UNION: case arrow::Type::UNION:
static_cast<arrow::UnionBuilder *>(builder) status = static_cast<arrow::UnionBuilder *>(builder)
->Append(cell.value<std::string>()); ->Append(cell.value<std::string>());
break; break;
case arrow::Type::DICTIONARY: case arrow::Type::DICTIONARY:
static_cast<arrow::DictionaryBuilder *>(builder) status = static_cast<arrow::DictionaryBuilder *>(builder)
->Append(cell.value<std::string>()); ->Append(cell.value<std::string>());
break; break;
*/ */
default: default:
throw xlnt::exception("not implemented"); throw xlnt::exception("not implemented");
} }
if (status != arrow::Status::OK())
{
throw xlnt::exception("Append failed");
}
} }
pybind11::handle read_batch(xlnt::streaming_workbook_reader &reader, pybind11::handle read_batch(xlnt::streaming_workbook_reader &reader,
@ -415,9 +422,9 @@ PYBIND11_MODULE(lib, m)
{ {
return cell.value<unsigned int>(); return cell.value<unsigned int>();
}) })
.def("value_long_double", [](xlnt::cell &cell) .def("value_double", [](xlnt::cell &cell)
{ {
return cell.value<long double>(); return cell.value<double>();
}) })
.def("data_type", [](xlnt::cell &cell) .def("data_type", [](xlnt::cell &cell)
{ {

View File

@ -14,7 +14,7 @@ COLUMN_TYPE_FIELD = {
def cell_to_pyarrow_array(cell, type): def cell_to_pyarrow_array(cell, type):
if cell.data_type() == xpa.Cell.Type.Number: if cell.data_type() == xpa.Cell.Type.Number:
return pa.array([cell.value_long_double()], type) return pa.array([cell.value_double()], type)
elif cell.data_type() == xpa.Cell.Type.SharedString: elif cell.data_type() == xpa.Cell.Type.SharedString:
return pa.array([cell.value_string()], type) return pa.array([cell.value_string()], type)
elif cell.data_type() == xpa.Cell.Type.InlineString: elif cell.data_type() == xpa.Cell.Type.InlineString: