arrow git commit: ARROW-852: Also search for ARROW libs when pkg-config provided the path
Repository: arrow Updated Branches: refs/heads/master a94c03a02 -> 59cd801a7 ARROW-852: Also search for ARROW libs when pkg-config provided the path Change-Id: Ic7fb227342782dfed5885f8fc5e73418fd31d504 Author: Uwe L. Korn Closes #563 from xhochy/ARROW-852 and squashes the following commits: 9630352 [Uwe L. Korn] Remove ARROW_HOME 5fc43ce [Uwe L. Korn] Always search for libs Project: http://git-wip-us.apache.org/repos/asf/arrow/repo Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/59cd801a Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/59cd801a Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/59cd801a Branch: refs/heads/master Commit: 59cd801a7645783c0c33ed2435be08db4ffcd378 Parents: a94c03a Author: Uwe L. Korn Authored: Tue Apr 18 22:32:59 2017 -0400 Committer: Wes McKinney Committed: Tue Apr 18 22:32:59 2017 -0400 -- python/cmake_modules/FindArrow.cmake | 61 --- python/manylinux1/build_arrow.sh | 1 - 2 files changed, 31 insertions(+), 31 deletions(-) -- http://git-wip-us.apache.org/repos/asf/arrow/blob/59cd801a/python/cmake_modules/FindArrow.cmake -- diff --git a/python/cmake_modules/FindArrow.cmake b/python/cmake_modules/FindArrow.cmake index fbe4545..9fb1355 100644 --- a/python/cmake_modules/FindArrow.cmake +++ b/python/cmake_modules/FindArrow.cmake @@ -34,6 +34,7 @@ if ("$ENV{ARROW_HOME}" STREQUAL "") message(STATUS "Arrow SO version: ${ARROW_SO_VERSION}") set(ARROW_INCLUDE_DIR ${ARROW_INCLUDE_DIRS}) set(ARROW_LIBS ${ARROW_LIBRARY_DIRS}) +set(ARROW_SEARCH_LIB_PATH ${ARROW_LIBRARY_DIRS}) endif() else() set(ARROW_HOME "$ENV{ARROW_HOME}") @@ -51,42 +52,42 @@ else() # make sure we don't accidentally pick up a different version NO_DEFAULT_PATH ) +endif() - find_library(ARROW_LIB_PATH NAMES arrow -PATHS -${ARROW_SEARCH_LIB_PATH} -NO_DEFAULT_PATH) - get_filename_component(ARROW_LIBS ${ARROW_LIB_PATH} DIRECTORY) +find_library(ARROW_LIB_PATH NAMES arrow + PATHS + ${ARROW_SEARCH_LIB_PATH} + NO_DEFAULT_PATH) +get_filename_component(ARROW_LIBS 
${ARROW_LIB_PATH} DIRECTORY) - find_library(ARROW_JEMALLOC_LIB_PATH NAMES arrow_jemalloc -PATHS -${ARROW_SEARCH_LIB_PATH} -NO_DEFAULT_PATH) +find_library(ARROW_JEMALLOC_LIB_PATH NAMES arrow_jemalloc + PATHS + ${ARROW_SEARCH_LIB_PATH} + NO_DEFAULT_PATH) - find_library(ARROW_PYTHON_LIB_PATH NAMES arrow_python -PATHS -${ARROW_SEARCH_LIB_PATH} -NO_DEFAULT_PATH) +find_library(ARROW_PYTHON_LIB_PATH NAMES arrow_python + PATHS + ${ARROW_SEARCH_LIB_PATH} + NO_DEFAULT_PATH) - if (ARROW_INCLUDE_DIR AND ARROW_LIBS) -set(ARROW_FOUND TRUE) +if (ARROW_INCLUDE_DIR AND ARROW_LIBS) + set(ARROW_FOUND TRUE) -if (MSVC) - set(ARROW_STATIC_LIB ${ARROW_LIB_PATH}) - set(ARROW_PYTHON_STATIC_LIB ${ARROW_PYTHON_LIB_PATH}) - set(ARROW_JEMALLOC_STATIC_LIB ${ARROW_JEMALLOC_LIB_PATH}) - set(ARROW_SHARED_LIB ${ARROW_STATIC_LIB}) - set(ARROW_PYTHON_SHARED_LIB ${ARROW_PYTHON_STATIC_LIB}) - set(ARROW_JEMALLOC_SHARED_LIB ${ARROW_JEMALLOC_STATIC_LIB}) -else() - set(ARROW_STATIC_LIB ${ARROW_PYTHON_LIB_PATH}/libarrow.a) - set(ARROW_PYTHON_STATIC_LIB ${ARROW_PYTHON_LIB_PATH}/libarrow_python.a) - set(ARROW_JEMALLOC_STATIC_LIB ${ARROW_PYTHON_LIB_PATH}/libarrow_jemalloc.a) + if (MSVC) +set(ARROW_STATIC_LIB ${ARROW_LIB_PATH}) +set(ARROW_PYTHON_STATIC_LIB ${ARROW_PYTHON_LIB_PATH}) +set(ARROW_JEMALLOC_STATIC_LIB ${ARROW_JEMALLOC_LIB_PATH}) +set(ARROW_SHARED_LIB ${ARROW_STATIC_LIB}) +set(ARROW_PYTHON_SHARED_LIB ${ARROW_PYTHON_STATIC_LIB}) +set(ARROW_JEMALLOC_SHARED_LIB ${ARROW_JEMALLOC_STATIC_LIB}) + else() +set(ARROW_STATIC_LIB ${ARROW_PYTHON_LIB_PATH}/libarrow.a) +set(ARROW_PYTHON_STATIC_LIB ${ARROW_PYTHON_LIB_PATH}/libarrow_python.a) +set(ARROW_JEMALLOC_STATIC_LIB ${ARROW_PYTHON_LIB_PATH}/libarrow_jemalloc.a) - set(ARROW_SHARED_LIB ${ARROW_LIBS}/libarrow${CMAKE_SHARED_LIBRARY_SUFFIX}) - set(ARROW_JEMALLOC_SHARED_LIB ${ARROW_LIBS}/libarrow_jemalloc${CMAKE_SHARED_LIBRARY_SUFFIX}) - set(ARROW_PYTHON_SHARED_LIB ${ARROW_LIBS}/libarrow_python${CMAKE_SHARED_LIBRARY_SUFFIX}) -endif() +set(ARROW_SHARED_LIB 
${ARROW_LIBS}/libarrow${CMAKE_SHARED_LIBRARY_SUFFIX}) +set(ARROW_JEMALLOC_SHARED_LIB ${ARROW_LIBS}/libarrow_jemalloc${CMAKE_SHARED_LIBRARY_SUFFIX}) +set(ARROW_PYTHON_SHARED_LIB ${ARROW_LIBS}/libarrow_python${CMAKE_SHARED_LIBRARY_SUFFIX}) endif() endif() http://git-wip-us.apache.org/repos/asf/arrow/blob/59cd801a/python/manylinux1/build_arrow.sh -- diff --git
arrow git commit: ARROW-844: [Format] Update README documents in format/
Repository: arrow Updated Branches: refs/heads/master 7f20f6e73 -> 38efabea9 ARROW-844: [Format] Update README documents in format/ Added a section reflecting specification maturity and stability. Author: Wes McKinney Closes #556 from wesm/ARROW-844 and squashes the following commits: 03dbb71 [Wes McKinney] Update README documents in format/ Project: http://git-wip-us.apache.org/repos/asf/arrow/repo Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/38efabea Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/38efabea Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/38efabea Branch: refs/heads/master Commit: 38efabea9bbc8d6386f96a635a95c53ba70e6149 Parents: 7f20f6e Author: Wes McKinney Authored: Tue Apr 18 11:43:13 2017 -0400 Committer: Wes McKinney Committed: Tue Apr 18 11:43:13 2017 -0400 -- format/README.md | 20 +++- 1 file changed, 15 insertions(+), 5 deletions(-) -- http://git-wip-us.apache.org/repos/asf/arrow/blob/38efabea/format/README.md -- diff --git a/format/README.md b/format/README.md index 048badb..3aa8fdd 100644 --- a/format/README.md +++ b/format/README.md @@ -14,16 +14,14 @@ ## Arrow specification documents -> **Work-in-progress specification documents**. These are discussion documents -> created by the Arrow developers during late 2015 and in no way represents a -> finalized specification. - Currently, the Arrow specification consists of these pieces: - Metadata specification (see Metadata.md) - Physical memory layout specification (see Layout.md) -- Metadata serialized representation (see Message.fbs) +- Logical Types, Schemas, and Record Batch Metadata (see Schema.fbs) +- Encapsulated Messages (see Message.fbs) - Mechanics of messaging between Arrow systems (IPC, RPC, etc.) 
(see IPC.md) +- Tensor (Multi-dimensional array) Metadata (see Tensor.fbs) The metadata currently uses Google's [flatbuffers library][1] for serializing a couple related pieces of information: @@ -35,4 +33,16 @@ couple related pieces of information: schema, and enable a system to send and receive Arrow row batches in a form that can be precisely disassembled or reconstructed. +## Arrow Format Maturity and Stability + +We have made significant progress hardening the Arrow in-memory format and +Flatbuffer metadata since the project started in February 2016. We have +integration tests which verify binary compatibility between the Java and C++ +implementations, for example. + +Major versions may still include breaking changes to the memory format or +metadata, so it is recommended to use the same released version of all +libraries in your applications for maximum compatibility. Data stored in the +Arrow IPC formats should not be used for long term storage. + [1]: http://github.com/google/flatbuffers
arrow git commit: ARROW-818: [Python] Expand Sphinx API docs, pyarrow.* namespace. Add factory functions for time32, time64
Repository: arrow Updated Branches: refs/heads/master bb287e203 -> 7f20f6e73 ARROW-818: [Python] Expand Sphinx API docs, pyarrow.* namespace. Add factory functions for time32, time64 Author: Wes McKinney Closes #557 from wesm/ARROW-818 and squashes the following commits: 96ce436 [Wes McKinney] Expand Sphinx API docs, pyarrow.* namespace. Add factory functions for time32, time64 Project: http://git-wip-us.apache.org/repos/asf/arrow/repo Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/7f20f6e7 Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/7f20f6e7 Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/7f20f6e7 Branch: refs/heads/master Commit: 7f20f6e738a2e163b0b753416ee4c4ed00998f4b Parents: bb287e2 Author: Wes McKinney Authored: Tue Apr 18 16:37:03 2017 +0200 Committer: Uwe L. Korn Committed: Tue Apr 18 16:37:03 2017 +0200 -- python/doc/source/api.rst| 69 +++- python/pyarrow/__init__.py | 33 ++ python/pyarrow/_array.pxd| 10 + python/pyarrow/_array.pyx| 74 ++- python/pyarrow/_io.pyx | 6 +-- python/pyarrow/includes/libarrow.pxd | 3 ++ python/pyarrow/tests/test_io.py | 4 +- python/pyarrow/tests/test_schema.py | 21 + 8 files changed, 195 insertions(+), 25 deletions(-) -- http://git-wip-us.apache.org/repos/asf/arrow/blob/7f20f6e7/python/doc/source/api.rst -- diff --git a/python/doc/source/api.rst b/python/doc/source/api.rst index 92e248b..08a0694 100644 --- a/python/doc/source/api.rst +++ b/python/doc/source/api.rst @@ -24,8 +24,8 @@ API Reference .. _api.functions: -Type Metadata and Schemas -- +Type and Schema Factory Functions +- .. 
autosummary:: :toctree: generated/ @@ -43,6 +43,8 @@ Type Metadata and Schemas float16 float32 float64 + time32 + time64 timestamp date32 date64 @@ -53,10 +55,8 @@ Type Metadata and Schemas struct dictionary field - DataType - Field - Schema schema + from_numpy_dtype Scalar Value Types -- @@ -68,6 +68,7 @@ Scalar Value Types NAType Scalar ArrayValue + BooleanValue Int8Value Int16Value Int32Value @@ -82,6 +83,11 @@ Scalar Value Types BinaryValue StringValue FixedSizeBinaryValue + Date32Value + Date64Value + TimestampValue + DecimalValue + Array Types and Constructors @@ -91,21 +97,30 @@ Array Types and Constructors array Array - NullArray - NumericArray - IntegerArray - FloatingPointArray BooleanArray + DictionaryArray + FloatingPointArray + IntegerArray Int8Array Int16Array Int32Array Int64Array + NullArray + NumericArray UInt8Array UInt16Array UInt32Array UInt64Array - DictionaryArray + BinaryArray + FixedSizeBinaryArray StringArray + Time32Array + Time64Array + Date32Array + Date64Array + TimestampArray + DecimalArray + ListArray Tables and Record Batches - @@ -113,9 +128,11 @@ Tables and Record Batches .. autosummary:: :toctree: generated/ + ChunkedArray Column RecordBatch Table + get_record_batch_size Tensor type and Functions - @@ -141,7 +158,7 @@ Input / Output and Shared Memory MemoryMappedFile memory_map create_memory_map - PythonFileInterface + PythonFile Interprocess Communication and Messaging @@ -165,3 +182,33 @@ Memory Pools jemalloc_memory_pool total_allocated_bytes set_memory_pool + +Type Classes + + +.. autosummary:: + :toctree: generated/ + + DataType + DecimalType + DictionaryType + FixedSizeBinaryType + Time32Type + Time64Type + TimestampType + Field + Schema + +.. currentmodule:: pyarrow.parquet + +Apache Parquet +-- + +.. 
autosummary:: + :toctree: generated/ + + ParquetDataset + ParquetFile + read_table + write_metadata + write_table http://git-wip-us.apache.org/repos/asf/arrow/blob/7f20f6e7/python/pyarrow/__init__.py -- diff --git a/python/pyarrow/__init__.py b/python/pyarrow/__init__.py index 87f2352..4d8da9f 100644 --- a/python/pyarrow/__init__.py +++ b/python/pyarrow/__init__.py @@ -31,12 +31,20 @@ from pyarrow._config import cpu_count, set_cpu_count from pyarrow._array import (null, bool_, int8, int16, int32, int64, uint8, uint16, uint32, uint64, -