diff --git a/.github/workflows/python.yml b/.github/workflows/python.yml index e5d367958dd..bc7fe3cd683 100644 --- a/.github/workflows/python.yml +++ b/.github/workflows/python.yml @@ -69,10 +69,10 @@ jobs: - conda-python-3.12-no-numpy include: - name: conda-python-docs - cache: conda-python-3.10 + cache: conda-python-3.11 image: conda-python-docs - title: AMD64 Conda Python 3.10 Sphinx & Numpydoc - python: "3.10" + title: AMD64 Conda Python 3.11 Sphinx & Numpydoc + python: "3.11" - name: conda-python-3.11-nopandas cache: conda-python-3.11 image: conda-python diff --git a/python/pyarrow/table.pxi b/python/pyarrow/table.pxi index 8e258e38afe..7859c736cf0 100644 --- a/python/pyarrow/table.pxi +++ b/python/pyarrow/table.pxi @@ -1882,7 +1882,7 @@ cdef class _Tabular(_PandasConvertible): pyarrow.Table year: double n_legs: int64 - animals: string + animals: large_string ---- year: [[2022,2021]] n_legs: [[4,100]] @@ -1916,7 +1916,7 @@ cdef class _Tabular(_PandasConvertible): >>> table.field(0) pyarrow.Field >>> table.field(1) - pyarrow.Field + pyarrow.Field """ return self.schema.field(i) @@ -2144,7 +2144,7 @@ cdef class _Tabular(_PandasConvertible): pyarrow.Table year: int64 n_legs: int64 - animal: string + animal: large_string ---- year: [[2019,2021,2021,2020,2022,2022]] n_legs: [[5,100,4,2,4,2]] @@ -2190,7 +2190,7 @@ cdef class _Tabular(_PandasConvertible): pyarrow.Table year: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [[2022,2021]] n_legs: [[4,100]] @@ -2484,7 +2484,7 @@ cdef class _Tabular(_PandasConvertible): >>> table.append_column('year', [year]) pyarrow.Table n_legs: int64 - animals: string + animals: large_string year: int64 ---- n_legs: [[2,4,5,100]] @@ -2545,7 +2545,7 @@ cdef class RecordBatch(_Tabular): month: int64 day: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [2020,2022,2021,2022] month: [3,5,7,9] @@ -2585,7 +2585,7 @@ cdef class RecordBatch(_Tabular): month: int64 day: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [2020,2022,2021,2022] month: [3,5,7,9] @@ -2870,7 +2870,7 @@ cdef class RecordBatch(_Tabular): pyarrow.RecordBatch year: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [2021,2022,2019,2021] n_legs: [2,4,5,100] @@ -2881,7 +2881,7 @@ cdef class RecordBatch(_Tabular): >>> batch pyarrow.RecordBatch n_legs: int64 - animals: string + animals: large_string ---- n_legs: [2,4,5,100] animals: ["Flamingo","Horse","Brittle stars","Centipede"] @@ -3047,7 +3047,7 @@ cdef class RecordBatch(_Tabular): >>> batch.rename_columns(new_names) pyarrow.RecordBatch n: int64 - name: string + name: large_string ---- n: [2,4,5,100] name: ["Flamingo","Horse","Brittle stars","Centipede"] @@ -3055,7 +3055,7 @@ cdef class RecordBatch(_Tabular): >>> batch.rename_columns(new_names) pyarrow.RecordBatch n: int64 - name: string + name: large_string ---- n: [2,4,5,100] name: ["Flamingo","Horse","Brittle stars","Centipede"] @@ -3324,7 +3324,7 @@ cdef class RecordBatch(_Tabular): >>> batch = pa.RecordBatch.from_pandas(df) >>> batch.schema n_legs: int64 - animals: string + animals: large_string -- schema metadata -- pandas: '{"index_columns": [{"kind": "range", "name": null, "start": 0, ... @@ -3416,7 +3416,7 @@ cdef class RecordBatch(_Tabular): month: int64 day: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [2020,2022,2021,2022] month: [3,5,7,9] @@ -3583,7 +3583,7 @@ cdef class RecordBatch(_Tabular): >>> pa.RecordBatch.from_struct_array(struct).to_pandas() n_legs animals year 0 2 Parrot NaN - 1 4 None 2022.0 + 1 4 NaN 2022.0 """ cdef: shared_ptr[CRecordBatch] c_record_batch @@ -4156,7 +4156,7 @@ cdef class Table(_Tabular): pyarrow.Table year: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [[2020,2022,2019,2021]] n_legs: [[2,4,5,100]] @@ -4291,7 +4291,7 @@ cdef class Table(_Tabular): pyarrow.Table year: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [[2020,2022,2019]] n_legs: [[2,4,5]] @@ -4300,7 +4300,7 @@ cdef class Table(_Tabular): pyarrow.Table year: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [[2019,2021]] n_legs: [[5,100]] @@ -4309,7 +4309,7 @@ cdef class Table(_Tabular): pyarrow.Table year: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [[2019]] n_legs: [[5]] @@ -4693,7 +4693,7 @@ cdef class Table(_Tabular): >>> table = pa.Table.from_pandas(df) >>> table.schema n_legs: int64 - animals: string + animals: large_string -- schema metadata -- pandas: '{"index_columns": [{"kind": "range", "name": null, "start": 0, ... @@ -4787,7 +4787,7 @@ cdef class Table(_Tabular): >>> pa.Table.from_pandas(df) pyarrow.Table n_legs: int64 - animals: string + animals: large_string ---- n_legs: [[2,4,5,100]] animals: [["Flamingo","Horse","Brittle stars","Centipede"]] @@ -4938,7 +4938,7 @@ cdef class Table(_Tabular): >>> pa.Table.from_struct_array(struct).to_pandas() n_legs animals year 0 2 Parrot NaN - 1 4 None 2022.0 + 1 4 NaN 2022.0 """ if isinstance(struct_array, Array): return Table.from_batches([RecordBatch.from_struct_array(struct_array)]) @@ -5145,13 +5145,13 @@ cdef class Table(_Tabular): >>> reader = table.to_reader() >>> reader.schema n_legs: int64 - animals: string + animals: large_string -- schema metadata -- pandas: '{"index_columns": [{"kind": "range", "name": null, "start": 0, ... >>> reader.read_all() pyarrow.Table n_legs: int64 - animals: string + animals: large_string ---- n_legs: [[2,4,5,100]] animals: [["Flamingo","Horse","Brittle stars","Centipede"]] @@ -5199,7 +5199,7 @@ cdef class Table(_Tabular): >>> table = pa.Table.from_pandas(df) >>> table.schema n_legs: int64 - animals: string + animals: large_string -- schema metadata -- pandas: '{"index_columns": [{"kind": "range", "name": null, "start": 0, "' ... """ @@ -5293,7 +5293,7 @@ cdef class Table(_Tabular): ... 'animals': ["Flamingo", "Horse", None, "Centipede"]}) >>> table = pa.Table.from_pandas(df) >>> table.nbytes - 72 + 88 """ self._assert_cpu() cdef: @@ -5323,7 +5323,7 @@ cdef class Table(_Tabular): ... 'animals': ["Flamingo", "Horse", None, "Centipede"]}) >>> table = pa.Table.from_pandas(df) >>> table.get_total_buffer_size() - 76 + 96 """ self._assert_cpu() cdef: @@ -5372,7 +5372,7 @@ cdef class Table(_Tabular): pyarrow.Table year: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [[2021,2022,2019,2021]] n_legs: [[2,4,5,100]] @@ -5383,7 +5383,7 @@ cdef class Table(_Tabular): >>> table pyarrow.Table n_legs: int64 - animals: string + animals: large_string ---- n_legs: [[2,4,5,100]] animals: [["Flamingo","Horse","Brittle stars","Centipede"]] @@ -5535,7 +5535,7 @@ cdef class Table(_Tabular): >>> table.rename_columns(new_names) pyarrow.Table n: int64 - name: string + name: large_string ---- n: [[2,4,5,100]] name: [["Flamingo","Horse","Brittle stars","Centipede"]] @@ -5543,7 +5543,7 @@ cdef class Table(_Tabular): >>> table.rename_columns(new_names) pyarrow.Table n: int64 - name: string + name: large_string ---- n: [[2,4,5,100]] name: [["Flamingo","Horse","Brittle stars","Centipede"]] @@ -5700,7 +5700,7 @@ cdef class Table(_Tabular): id: int64 year: int64 n_legs: int64 - animal: string + animal: large_string ---- id: [[3,1,2]] year: [[2019,2020,2022]] @@ -5714,7 +5714,7 @@ cdef class Table(_Tabular): id: int64 year: int64 n_legs: int64 - animal: string + animal: large_string ---- id: [[3,1,2,4]] year: [[2019,2020,2022,null]] @@ -5728,7 +5728,7 @@ cdef class Table(_Tabular): year: int64 id: int64 n_legs: int64 - animal: string + animal: large_string ---- year: [[2019,null]] id: [[3,4]] @@ -5741,7 +5741,7 @@ cdef class Table(_Tabular): pyarrow.Table id: int64 n_legs: int64 - animal: string + animal: large_string ---- id: [[4]] n_legs: [[100]] @@ -5754,7 +5754,7 @@ cdef class Table(_Tabular): id: int64 year: int64 n_legs: int64 - animal: string + animal: large_string ---- id: [] year: [] @@ -6003,7 +6003,7 @@ def record_batch(data, names=None, schema=None, metadata=None): month: int64 day: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [2020,2022,2021,2022] month: [3,5,7,9] @@ -6164,7 +6164,7 @@ def table(data, names=None, schema=None, metadata=None, nthreads=None): pyarrow.Table year: int64 n_legs: int64 - animals: string + animals: large_string ---- year: [[2020,2022,2019,2021]] n_legs: [[2,4,5,100]] diff --git a/python/pyarrow/types.pxi b/python/pyarrow/types.pxi index 792c0840f81..14bd64774e4 100644 --- a/python/pyarrow/types.pxi +++ b/python/pyarrow/types.pxi @@ -3140,7 +3140,7 @@ cdef class Schema(_Weakrefable): >>> pa.Schema.from_pandas(df) int: int64 - str: string + str: large_string -- schema metadata -- pandas: '{"index_columns": [{"kind": "range", "name": null, ... """