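Converting pandas data that contains floating-point values to a boolean Arrow array with `pa.Array.from_pandas(..., type=pa.bool_())` gives incorrect results: as the session below shows, every element comes back as `False`, including the non-zero values 1.0 and 2.0 and the missing values (`None` and `NaN`).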
In [2]: import pyarrow as pa
...: import pandas as pd
...: a = [0.0, 1.0, 2.0, None, float('NaN')]
...:
In [3]: s = pd.Series(a)
In [4]: pa.Array.from_pandas(s, type=pa.bool_())
Out[4]:
<pyarrow.lib.BooleanArray object at 0x7f1bfd099e68>
[
False,
False,
False,
False,
False
]