svn commit: r19908 - in /dev/arrow/apache-arrow-0.4.1-rc0: ./ apache-arrow-0.4.1.tar.gz apache-arrow-0.4.1.tar.gz.asc apache-arrow-0.4.1.tar.gz.md5 apache-arrow-0.4.1.tar.gz.sha

2017-06-06 Thread wesm
Author: wesm
Date: Wed Jun  7 02:23:23 2017
New Revision: 19908

Log:
Apache Arrow 0.4.1 RC0

Added:
dev/arrow/apache-arrow-0.4.1-rc0/
dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz   (with props)
dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.asc
dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.md5
dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.sha

Added: dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz
==
Binary file - no diff available.

Propchange: dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz
--
svn:mime-type = application/octet-stream

Added: dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.asc
==
--- dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.asc (added)
+++ dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.asc Wed Jun  7 
02:23:23 2017
@@ -0,0 +1,17 @@
+-BEGIN PGP SIGNATURE-
+Version: GnuPG v1
+
+iQIcBAABCgAGBQJZN2OSAAoJEPEFiDoXNWI9WVgQAKzC+m6K6F/8x9GAlEh1jZWS
+eFYnbmpsrFg/BWD/TIz9V5NBMLIdbAokqLFzaPXdOLgz+k6RxlN3EVcXs/+sJsZ+
+cxKhvKBRt8sGwMAK7s5Lwf7SyasqgZ8LaDH6THvqYk8DXsqN9MAIPz1ZZrlOEpKN
+Hl5n0A2LnDw/ItsyHv0dQn5r4EDnqZrvpK0XMkFQTkOdyepTi5Bvfnx9+TvLofCN
+uA7/Dc0yNTIQEm0bias0/3wTZtRZzgf0ts8BtZtpg2fzLeHY7hDAZXiZoPsSSrDN
+hWb4rs4pgMBxMGoWGojilHLc0xweh9uR1bago5PPEDaGBWrsAd0Zkb98S9glc5UW
+42oG9A6qBNp0nulsG72gaw9PEnv8Lu9y/DVRkh/upgGU8G2IYXpt9edvi38OVmGc
+k1sy1hlolJ8l+wphueH3a2BTPF6PYAiLVDxCtCM4CT0GzaCqm7r4Xl8/u45RBkZb
+AzobZAZs8Y/ANP8JxejfaOvGR7eqCPJf4l5RLUcQ1CtqNd3WPbtNWzKYNNoiqJ3h
+ej0NbNFdf4eEtCY7aBFkhfmAqj0lCmUdLE6i/M1qbEffZd3GUfYITLBIALZcrpTw
+WIpL25afjW/owveBmZdrjz9JRILaoTWP5a/nVGI7X6iaYtg+qj16w3eRmqD8gxm7
+JTuwc53udHDp9fz0otbU
+=1ON7
+-END PGP SIGNATURE-

Added: dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.md5
==
--- dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.md5 (added)
+++ dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.md5 Wed Jun  7 
02:23:23 2017
@@ -0,0 +1 @@
+apache-arrow-0.4.1.tar.gz: 6B 10 8A 8D F6 3A 6C E0  D1 69 0B 0B FB A8 DC AB

Added: dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.sha
==
--- dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.sha (added)
+++ dev/arrow/apache-arrow-0.4.1-rc0/apache-arrow-0.4.1.tar.gz.sha Wed Jun  7 
02:23:23 2017
@@ -0,0 +1 @@
+290c5c9c6bb0db12ec09c9950a24278899693f8f  apache-arrow-0.4.1.tar.gz




[arrow] Git Push Summary

2017-06-06 Thread wesm
Repository: arrow
Updated Tags:  refs/tags/apache-arrow-0.4.1 [created] ae60e5f3b


arrow git commit: ARROW-1094: [C++] Always truncate buffer read in ReadableFile::Read if actual number of bytes less than request

2017-06-06 Thread wesm
Repository: arrow
Updated Branches:
  refs/heads/master ac540758c -> 2a12482b2


ARROW-1094: [C++] Always truncate buffer read in ReadableFile::Read if actual 
number of bytes less than request

Author: Wes McKinney 

Closes #737 from wesm/ARROW-1094 and squashes the following commits:

fcb613fb [Wes McKinney] Always truncate buffer read in ReadableFile::Read if 
less than requested


Project: http://git-wip-us.apache.org/repos/asf/arrow/repo
Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/2a12482b
Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/2a12482b
Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/2a12482b

Branch: refs/heads/master
Commit: 2a12482b21df0f28bfc53fca114795f4f74d1617
Parents: ac54075
Author: Wes McKinney 
Authored: Tue Jun 6 16:52:45 2017 -0400
Committer: Wes McKinney 
Committed: Tue Jun 6 16:52:45 2017 -0400

--
 cpp/src/arrow/io/file.cc | 5 +
 cpp/src/arrow/io/io-file-test.cc | 9 +
 cpp/src/arrow/ipc/writer.cc  | 4 ++--
 3 files changed, 12 insertions(+), 6 deletions(-)
--


http://git-wip-us.apache.org/repos/asf/arrow/blob/2a12482b/cpp/src/arrow/io/file.cc
--
diff --git a/cpp/src/arrow/io/file.cc b/cpp/src/arrow/io/file.cc
index eb4b9fc..c4c797c 100644
--- a/cpp/src/arrow/io/file.cc
+++ b/cpp/src/arrow/io/file.cc
@@ -412,10 +412,7 @@ class ReadableFile::ReadableFileImpl : public OSFile {
 
 int64_t bytes_read = 0;
 RETURN_NOT_OK(Read(nbytes, &bytes_read, buffer->mutable_data()));
-
-// XXX: heuristic
-if (bytes_read < nbytes / 2) { RETURN_NOT_OK(buffer->Resize(bytes_read)); }
-
+if (bytes_read < nbytes) { RETURN_NOT_OK(buffer->Resize(bytes_read)); }
 *out = buffer;
 return Status::OK();
   }

http://git-wip-us.apache.org/repos/asf/arrow/blob/2a12482b/cpp/src/arrow/io/io-file-test.cc
--
diff --git a/cpp/src/arrow/io/io-file-test.cc b/cpp/src/arrow/io/io-file-test.cc
index a5784de..3450bae 100644
--- a/cpp/src/arrow/io/io-file-test.cc
+++ b/cpp/src/arrow/io/io-file-test.cc
@@ -251,6 +251,15 @@ TEST_F(TestReadableFile, Read) {
   ASSERT_OK(file_->Read(10, &bytes_read, buffer));
   ASSERT_EQ(4, bytes_read);
   ASSERT_EQ(0, std::memcmp(buffer, "data", 4));
+
+  // Test incomplete read, ARROW-1094
+  std::shared_ptr buf;
+  int64_t size;
+  ASSERT_OK(file_->GetSize(&size));
+
+  ASSERT_OK(file_->Seek(1));
+  ASSERT_OK(file_->Read(size, &buf));
+  ASSERT_EQ(size - 1, buf->size());
 }
 
 TEST_F(TestReadableFile, ReadAt) {

http://git-wip-us.apache.org/repos/asf/arrow/blob/2a12482b/cpp/src/arrow/ipc/writer.cc
--
diff --git a/cpp/src/arrow/ipc/writer.cc b/cpp/src/arrow/ipc/writer.cc
index 4f5edf2..5d4b94a 100644
--- a/cpp/src/arrow/ipc/writer.cc
+++ b/cpp/src/arrow/ipc/writer.cc
@@ -757,8 +757,8 @@ class RecordBatchFileWriter::RecordBatchFileWriterImpl
 
   Status Start() override {
 // It is only necessary to align to 8-byte boundary at the start of the 
file
-RETURN_NOT_OK(Write(reinterpret_cast(kArrowMagicBytes),
-strlen(kArrowMagicBytes)));
+RETURN_NOT_OK(Write(
+reinterpret_cast(kArrowMagicBytes), 
strlen(kArrowMagicBytes)));
 RETURN_NOT_OK(Align(8));
 
 // We write the schema at the start of the file (and the end). This also



arrow git commit: ARROW-1088: [Python] Only test unicode filenames if system supports them

2017-06-06 Thread wesm
Repository: arrow
Updated Branches:
  refs/heads/master 402baa4ec -> ac540758c


ARROW-1088: [Python] Only test unicode filenames if system supports them

Author: Jeff Knupp 

Closes #727 from jeffknupp/fmaster and squashes the following commits:

c19b3dec [Jeff Knupp] ARROW-1088: [Python] Only test unicode filenames if 
system supports them


Project: http://git-wip-us.apache.org/repos/asf/arrow/repo
Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/ac540758
Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/ac540758
Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/ac540758

Branch: refs/heads/master
Commit: ac540758c7c013b2ffc7eb3d1e80ce6fb429de03
Parents: 402baa4
Author: Jeff Knupp 
Authored: Tue Jun 6 16:51:49 2017 -0400
Committer: Wes McKinney 
Committed: Tue Jun 6 16:51:49 2017 -0400

--
 python/pyarrow/tests/test_feather.py | 1 +
 1 file changed, 1 insertion(+)
--


http://git-wip-us.apache.org/repos/asf/arrow/blob/ac540758/python/pyarrow/tests/test_feather.py
--
diff --git a/python/pyarrow/tests/test_feather.py 
b/python/pyarrow/tests/test_feather.py
index 287e0da..71e4fee 100644
--- a/python/pyarrow/tests/test_feather.py
+++ b/python/pyarrow/tests/test_feather.py
@@ -355,6 +355,7 @@ class TestFeatherReader(unittest.TestCase):
 expected = df.rename(columns=str)
 self._check_pandas_roundtrip(df, expected)
 
+@pytest.mark.skipif(not os.path.supports_unicode_filenames, 
reason='unicode filenames not supported')
 def test_unicode_filename(self):
 # GH #209
 name = (b'Besa_Kavaj\xc3\xab.feather').decode('utf-8')



arrow git commit: ARROW-1092: More Decimal and scale flipped follow-up

2017-06-06 Thread julien
Repository: arrow
Updated Branches:
  refs/heads/master c3e865d5f -> 402baa4ec


ARROW-1092: More Decimal and scale flipped follow-up

Author: Julien Le Dem 

Closes #736 from julienledem/ARROW-1092 and squashes the following commits:

1bc1ade [Julien Le Dem] ARROW-1092: More Decimal and scale flipped follow-up


Project: http://git-wip-us.apache.org/repos/asf/arrow/repo
Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/402baa4e
Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/402baa4e
Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/402baa4e

Branch: refs/heads/master
Commit: 402baa4ec391b61dd37c770ae7978d51b9b550fa
Parents: c3e865d
Author: Julien Le Dem 
Authored: Tue Jun 6 11:32:39 2017 -0700
Committer: Julien Le Dem 
Committed: Tue Jun 6 11:32:39 2017 -0700

--
 .../vector/src/main/codegen/data/ValueVectorTypes.tdd |  2 +-
 .../src/main/codegen/templates/FixedValueVectors.java |  9 +
 .../src/main/codegen/templates/HolderReaderImpl.java  |  2 +-
 .../vector/src/main/codegen/templates/MapWriters.java |  2 +-
 .../main/codegen/templates/NullableValueVectors.java  | 14 --
 5 files changed, 16 insertions(+), 13 deletions(-)
--


http://git-wip-us.apache.org/repos/asf/arrow/blob/402baa4e/java/vector/src/main/codegen/data/ValueVectorTypes.tdd
--
diff --git a/java/vector/src/main/codegen/data/ValueVectorTypes.tdd 
b/java/vector/src/main/codegen/data/ValueVectorTypes.tdd
index b147c9e..970d887 100644
--- a/java/vector/src/main/codegen/data/ValueVectorTypes.tdd
+++ b/java/vector/src/main/codegen/data/ValueVectorTypes.tdd
@@ -116,7 +116,7 @@
 {
   class: "Decimal",
   maxPrecisionDigits: 38, nDecimalDigits: 4, friendlyType: 
"BigDecimal",
-  typeParams: [ {name: "precision", type: "int"}, { name: "scale", 
type: "int"}],
+  typeParams: [ {name: "scale", type: "int"}, { name: "precision", 
type: "int"}],
   arrowType: "org.apache.arrow.vector.types.pojo.ArrowType.Decimal",
   fields: [{name: "start", type: "int"}, {name: "buffer", type: 
"ArrowBuf"}]
 }

http://git-wip-us.apache.org/repos/asf/arrow/blob/402baa4e/java/vector/src/main/codegen/templates/FixedValueVectors.java
--
diff --git a/java/vector/src/main/codegen/templates/FixedValueVectors.java 
b/java/vector/src/main/codegen/templates/FixedValueVectors.java
index 395417b..5d92cd2 100644
--- a/java/vector/src/main/codegen/templates/FixedValueVectors.java
+++ b/java/vector/src/main/codegen/templates/FixedValueVectors.java
@@ -56,13 +56,14 @@ public final class ${className} extends BaseDataValueVector 
implements FixedWidt
   private int allocationMonitor = 0;
   <#if minor.typeParams??>
 
-<#list minor.typeParams as typeParam>
+<#assign typeParams = minor.typeParams?reverse />
+<#list typeParams as typeParam>
   private final ${typeParam.type} ${typeParam.name};
 
 
-  public ${className}(String name, BufferAllocator allocator<#list 
minor.typeParams as typeParam>, ${typeParam.type} ${typeParam.name}) {
+  public ${className}(String name, BufferAllocator allocator<#list typeParams 
as typeParam>, ${typeParam.type} ${typeParam.name}) {
 super(name, allocator);
-<#list minor.typeParams as typeParam>
+<#list typeParams as typeParam>
 this.${typeParam.name} = ${typeParam.name};
 
   }
@@ -242,7 +243,7 @@ public final class ${className} extends BaseDataValueVector 
implements FixedWidt
 private ${className} to;
 
 public TransferImpl(String name, BufferAllocator allocator){
-  to = new ${className}(name, allocator<#if minor.typeParams??><#list 
minor.typeParams as typeParam>,  
${className}.this.${typeParam.name});
+  to = new ${className}(name, allocator<#if minor.typeParams??><#list 
typeParams as typeParam>,  ${className}.this.${typeParam.name});
 }
 
 public TransferImpl(${className} to) {

http://git-wip-us.apache.org/repos/asf/arrow/blob/402baa4e/java/vector/src/main/codegen/templates/HolderReaderImpl.java
--
diff --git a/java/vector/src/main/codegen/templates/HolderReaderImpl.java 
b/java/vector/src/main/codegen/templates/HolderReaderImpl.java
index 471fe41..c2aa837 100644
--- a/java/vector/src/main/codegen/templates/HolderReaderImpl.java
+++ b/java/vector/src/main/codegen/templates/HolderReaderImpl.java
@@ -29,7 +29,7 @@
 <#assign friendlyType = (minor.friendlyType!minor.boxedType!type.boxedType) />
 <#assign safeType=friendlyType />
 <#if safeType=="byte[]"><#assign safeType="ByteArray" />
-<#assign fields = minor.fields!type.fields + minor.typeParams![]/>
+<#assign fields = (minor.fields!type.fields) + minor.typeParams![]/>
 
 <@pp.changeOutputFile 
name="

arrow git commit: ARROW-1090: Improve build_ext usability with --bundle-arrow-cpp

2017-06-06 Thread wesm
Repository: arrow
Updated Branches:
  refs/heads/master 5589dda50 -> c3e865d5f


ARROW-1090: Improve build_ext usability with --bundle-arrow-cpp

This is based on a blackbox understanding of the build toolchain. It might be 
cleaner to update `FindArrow.cmake`, but I'm not sure what the consequences of 
that would be. This shouldn't be able to do much harm, since this codepath 
would previously crash.

Author: Jacob Scott 

Closes #734 from snakescott/ARROW-1090 and squashes the following commits:

642f9404 [Jacob Scott] Do not attempt to fix cmake on windows
39c8df62 [Jacob Scott] [ARROW-1090] Add doc with instructions for building a 
wheel
9c1d9c2e [Jacob Scott] [ARROW-1090] Improve build_ext usability with 
--bundle-arrow-cpp


Project: http://git-wip-us.apache.org/repos/asf/arrow/repo
Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/c3e865d5
Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/c3e865d5
Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/c3e865d5

Branch: refs/heads/master
Commit: c3e865d5f67fe9059e80e6b59b2b20bd42e7bcc4
Parents: 5589dda
Author: Jacob Scott 
Authored: Tue Jun 6 14:26:36 2017 -0400
Committer: Wes McKinney 
Committed: Tue Jun 6 14:26:36 2017 -0400

--
 python/doc/source/development.rst | 8 
 python/setup.py   | 5 +
 2 files changed, 13 insertions(+)
--


http://git-wip-us.apache.org/repos/asf/arrow/blob/c3e865d5/python/doc/source/development.rst
--
diff --git a/python/doc/source/development.rst 
b/python/doc/source/development.rst
index 410f838..cd24406 100644
--- a/python/doc/source/development.rst
+++ b/python/doc/source/development.rst
@@ -171,6 +171,14 @@ You should be able to run the unit tests with:
 
== 181 passed, 17 skipped in 0.98 seconds ===
 
+You can build a wheel by running:
+
+.. code-block:: shell
+   python setup.py build_ext --build-type=$ARROW_BUILD_TYPE \
+  --with-parquet --with-jemalloc --bundle-arrow-cpp bdist_wheel
+
+Again, if you did not build parquet-cpp, you should omit ``--with-parquet``.
+
 Windows
 ===
 

http://git-wip-us.apache.org/repos/asf/arrow/blob/c3e865d5/python/setup.py
--
diff --git a/python/setup.py b/python/setup.py
index 817c59f..e10b4b8 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -148,6 +148,11 @@ class build_ext(_build_ext):
 
 if self.bundle_arrow_cpp:
 cmake_options.append('-DPYARROW_BUNDLE_ARROW_CPP=ON')
+# ARROW-1090: work around CMake rough edges
+if 'ARROW_HOME' in os.environ and sys.platform != 'win32':
+os.environ['PKG_CONFIG_PATH'] = 
pjoin(os.environ['ARROW_HOME'], 'lib', 'pkgconfig')
+del os.environ['ARROW_HOME']
+
 
 cmake_options.append('-DCMAKE_BUILD_TYPE={0}'
  .format(self.build_type.lower()))



arrow git commit: ARROW-1080: C++: Add tutorial about converting to/from row-wise representation

2017-06-06 Thread wesm
Repository: arrow
Updated Branches:
  refs/heads/master 1a72acdf4 -> 5589dda50


ARROW-1080: C++: Add tutorial about converting to/from row-wise representation

Author: Uwe L. Korn 

Closes #721 from xhochy/ARROW-1080 and squashes the following commits:

556a37b2 [Uwe L. Korn] Fix chunk indices
e7ace72b [Uwe L. Korn] ARROW-1080: C++: Add tutorial about converting to/from 
row-wise representation


Project: http://git-wip-us.apache.org/repos/asf/arrow/repo
Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/5589dda5
Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/5589dda5
Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/5589dda5

Branch: refs/heads/master
Commit: 5589dda50de923abb0ab22b8ca30edb912b992ab
Parents: 1a72acd
Author: Uwe L. Korn 
Authored: Tue Jun 6 14:23:31 2017 -0400
Committer: Wes McKinney 
Committed: Tue Jun 6 14:23:31 2017 -0400

--
 cpp/apidoc/index.md |   2 +
 cpp/apidoc/tutorials/row_wise_conversion.md | 187 +++
 2 files changed, 189 insertions(+)
--


http://git-wip-us.apache.org/repos/asf/arrow/blob/5589dda5/cpp/apidoc/index.md
--
diff --git a/cpp/apidoc/index.md b/cpp/apidoc/index.md
index 923fc5b..4004e1e 100644
--- a/cpp/apidoc/index.md
+++ b/cpp/apidoc/index.md
@@ -32,6 +32,8 @@ Table of Contents
 
  * Instructions on how to build Arrow C++ on [Windows](Windows.md)
  * How to access [HDFS](HDFS.md)
+ * Tutorials
+   * [Convert a vector of row-wise data into an Arrow 
table](tutorials/row_wise_conversion.md)
 
 Getting Started
 ---

http://git-wip-us.apache.org/repos/asf/arrow/blob/5589dda5/cpp/apidoc/tutorials/row_wise_conversion.md
--
diff --git a/cpp/apidoc/tutorials/row_wise_conversion.md 
b/cpp/apidoc/tutorials/row_wise_conversion.md
new file mode 100644
index 000..1486fc2
--- /dev/null
+++ b/cpp/apidoc/tutorials/row_wise_conversion.md
@@ -0,0 +1,187 @@
+
+
+Convert a vector of row-wise data into an Arrow table
+=
+
+While we want to use columnar data structures to build efficient operations, we
+often receive data in a row-wise fashion from other systems. In the following,
+we want to give a brief introduction to the classes provided by Apache Arrow by
+showing how to transform row-wise data into a columnar table.
+
+The data in this example is stored in the following struct:
+
+```
+struct data_row {
+int64_t id;
+double cost;
+std::vector<double> cost_components;
+};
+
+std::vector<data_row> rows;
+```
+
+The final representation should be an `arrow::Table` which in turn is made up 
of
+an `arrow::Schema` and a list of `arrow::Column`. An `arrow::Column` is again a
+named collection of one or more `arrow::Array` instances. As the first step, we
+will iterate over the data and build up the arrays incrementally. For this 
task,
+we provide `arrow::ArrayBuilder` classes that help in the construction of the
+final `arrow::Array` instances.
+
+For each type, Arrow has a specially typed builder class. For the primitive
+values `id` and `cost` we can use the respective `arrow::Int64Builder` and
+`arrow::DoubleBuilder`. For the `cost_components` vector, we need to have two
+builders, a top-level `arrow::ListBuilder` that builds the array of offsets and
+a nested `arrow::DoubleBuilder` that constructs the underlying values array 
that
+is referenced by the offsets in the former array.
+
+```
+// The builders are more efficient using
+// arrow::jemalloc::MemoryPool::default_pool() as this can increase the size of
+// the underlying memory regions in-place. At the moment, arrow::jemalloc is 
only
+// supported on Unix systems, not Windows.
+
+arrow::Int64Builder id_builder(arrow::default_memory_pool());
+arrow::DoubleBuilder cost_builder(arrow::default_memory_pool());
+std::shared_ptr<arrow::DoubleBuilder> components_values_builder =
+std::make_shared<arrow::DoubleBuilder>(arrow::default_memory_pool());
+arrow::ListBuilder components_builder(arrow::default_memory_pool(),
+components_values_builder);
+```
+
+Now we can loop over our existing data and insert it into the builders. The
+`Append` calls here may fail (e.g. we cannot allocate enough additional 
memory).
+Thus we need to check their return values. For more information on these 
values,
+check the documentation about `arrow::Status`.
+
+```
+for (const data_row& row : rows) {
+ARROW_RETURN_NOT_OK(id_builder.Append(row.id));
+ARROW_RETURN_NOT_OK(cost_builder.Append(row.cost));
+
+// Indicate the start of a new list row. This will memorise the current
+// offset in the values builder.
+ARROW_RETURN_NOT_OK(components_builder.Append());
+// Store the actual values. The final nullptr argument tells the underlying
+// builder that all added values ar

arrow git commit: [Doc] Fix a few links for files moved in ARROW-957

2017-06-06 Thread wesm
Repository: arrow
Updated Branches:
  refs/heads/master 44dba7176 -> 1a72acdf4


[Doc] Fix a few links for files moved in ARROW-957

Closes #714

Change-Id: Ic58e7ad6b0b2cf5a7d4d36859bdbffda65e13f79


Project: http://git-wip-us.apache.org/repos/asf/arrow/repo
Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/1a72acdf
Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/1a72acdf
Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/1a72acdf

Branch: refs/heads/master
Commit: 1a72acdf4daa68fe6e7639acde08a0abf795a3fc
Parents: 44dba71
Author: Tony Kelman 
Authored: Wed May 24 02:16:58 2017 -0400
Committer: Wes McKinney 
Committed: Tue Jun 6 14:21:16 2017 -0400

--
 cpp/README.md  | 2 +-
 python/doc/source/development.rst  | 2 +-
 site/_posts/2017-05-08-0.3-release-japanese.md | 2 +-
 site/_posts/2017-05-08-0.3-release.md  | 2 +-
 4 files changed, 4 insertions(+), 4 deletions(-)
--


http://git-wip-us.apache.org/repos/asf/arrow/blob/1a72acdf/cpp/README.md
--
diff --git a/cpp/README.md b/cpp/README.md
index 69c6950..5bb516f 100644
--- a/cpp/README.md
+++ b/cpp/README.md
@@ -126,4 +126,4 @@ both of these options would be used rarely.  Current known 
uses-cases whent hey
 *  Parameterized tests in google test.
 
 [1]: https://brew.sh/
-[2]: https://github.com/apache/arrow/blob/master/cpp/doc/Windows.md
+[2]: https://github.com/apache/arrow/blob/master/cpp/apidoc/Windows.md

http://git-wip-us.apache.org/repos/asf/arrow/blob/1a72acdf/python/doc/source/development.rst
--
diff --git a/python/doc/source/development.rst 
b/python/doc/source/development.rst
index 6ec563e..410f838 100644
--- a/python/doc/source/development.rst
+++ b/python/doc/source/development.rst
@@ -175,7 +175,7 @@ Windows
 ===
 
 First, we bootstrap a conda environment similar to the `C++ build instructions
-`_. This
+`_. This
 includes all the dependencies for Arrow and the Apache Parquet C++ libraries.
 
 First, starting from fresh clones of Apache Arrow and parquet-cpp:

http://git-wip-us.apache.org/repos/asf/arrow/blob/1a72acdf/site/_posts/2017-05-08-0.3-release-japanese.md
--
diff --git a/site/_posts/2017-05-08-0.3-release-japanese.md 
b/site/_posts/2017-05-08-0.3-release-japanese.md
index e49bde1..6bad5ad 100644
--- a/site/_posts/2017-05-08-0.3-release-japanese.md
+++ b/site/_posts/2017-05-08-0.3-release-japanese.md
@@ -162,7 +162,7 @@ $ git shortlog -sn apache-arrow-0.2.0..apache-arrow-0.3.0
 [4]: http://wesmckinney.com/blog/arrow-streaming-columnar/
 [5]: http://github.com/google/flatbuffers
 [6]: http://arrow.apache.org/install
-[7]: https://github.com/apache/arrow/blob/master/cpp/doc/Windows.md
+[7]: https://github.com/apache/arrow/blob/master/cpp/apidoc/Windows.md
 [8]: 
https://github.com/apache/arrow/blob/master/python/doc/source/development.rst
 [9]: http://github.com/kou
 [10]: https://wiki.gnome.org/Projects/GObjectIntrospection

http://git-wip-us.apache.org/repos/asf/arrow/blob/1a72acdf/site/_posts/2017-05-08-0.3-release.md
--
diff --git a/site/_posts/2017-05-08-0.3-release.md 
b/site/_posts/2017-05-08-0.3-release.md
index 39a907d..cf38a8b 100644
--- a/site/_posts/2017-05-08-0.3-release.md
+++ b/site/_posts/2017-05-08-0.3-release.md
@@ -238,7 +238,7 @@ $ git shortlog -sn apache-arrow-0.2.0..apache-arrow-0.3.0
 [4]: http://wesmckinney.com/blog/arrow-streaming-columnar/
 [5]: http://github.com/google/flatbuffers
 [6]: http://arrow.apache.org/install
-[7]: https://github.com/apache/arrow/blob/master/cpp/doc/Windows.md
+[7]: https://github.com/apache/arrow/blob/master/cpp/apidoc/Windows.md
 [8]: 
https://github.com/apache/arrow/blob/master/python/doc/source/development.rst
 [9]: http://github.com/kou
 [10]: https://wiki.gnome.org/Projects/GObjectIntrospection



arrow git commit: ARROW-1020: [Format] Revise language for Timestamp type in Schema.fbs to avoid possible confusion about tz-naive timestamps

2017-06-06 Thread wesm
Repository: arrow
Updated Branches:
  refs/heads/master a367fd437 -> 44dba7176


ARROW-1020: [Format] Revise language for Timestamp type in Schema.fbs to avoid 
possible confusion about tz-naive timestamps

Author: Wes McKinney 

Closes #731 from wesm/ARROW-1020 and squashes the following commits:

5466f417 [Wes McKinney] Revise language for Timestamp type in Schema.fbs to 
avoid possible confusion about time zone naive timestamps (they are not 
necessarily normalized to UTC)


Project: http://git-wip-us.apache.org/repos/asf/arrow/repo
Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/44dba717
Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/44dba717
Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/44dba717

Branch: refs/heads/master
Commit: 44dba7176f078a297b327183593704f939df52a7
Parents: a367fd4
Author: Wes McKinney 
Authored: Tue Jun 6 14:20:06 2017 -0400
Committer: Wes McKinney 
Committed: Tue Jun 6 14:20:06 2017 -0400

--
 format/Schema.fbs | 7 ++-
 1 file changed, 6 insertions(+), 1 deletion(-)
--


http://git-wip-us.apache.org/repos/asf/arrow/blob/44dba717/format/Schema.fbs
--
diff --git a/format/Schema.fbs b/format/Schema.fbs
index 8de5c6d..a7e802b 100644
--- a/format/Schema.fbs
+++ b/format/Schema.fbs
@@ -113,7 +113,12 @@ table Time {
   bitWidth: int = 32;
 }
 
-/// Time elapsed from the Unix epoch, 00:00:00.000 on 1 January 1970, UTC.
+/// Time elapsed from the Unix epoch, 00:00:00.000 on 1 January 1970, excluding
+/// leap seconds, as a 64-bit integer. Note that UNIX time does not include
+/// leap seconds.
+///
+/// The Timestamp metadata supports both "time zone naive" and "time zone
+/// aware" timestamps. Read about the timezone attribute for more detail.
 table Timestamp {
   unit: TimeUnit;
 



arrow git commit: ARROW-1086: include additional pxd files during package build

2017-06-06 Thread wesm
Repository: arrow
Updated Branches:
  refs/heads/master 4e134e5b9 -> a367fd437


ARROW-1086: include additional pxd files during package build

Since this is purely a packaging change, I believe I would need to 
change `travis_script_python.sh` in order to test it (build a wheel, set up a new 
conda environment and install the wheel, etc). Not sure if that's worth doing? 
Happy to take a stab if it is.

Author: Jacob Scott 

Closes #733 from snakescott/ARROW-1086 and squashes the following commits:

6c3e8598 [Jacob Scott] [ARROW-1086] Add more pxd files to package_data


Project: http://git-wip-us.apache.org/repos/asf/arrow/repo
Commit: http://git-wip-us.apache.org/repos/asf/arrow/commit/a367fd43
Tree: http://git-wip-us.apache.org/repos/asf/arrow/tree/a367fd43
Diff: http://git-wip-us.apache.org/repos/asf/arrow/diff/a367fd43

Branch: refs/heads/master
Commit: a367fd437b1fe7797a27be578435abfacf94d052
Parents: 4e134e5
Author: Jacob Scott 
Authored: Tue Jun 6 14:18:05 2017 -0400
Committer: Wes McKinney 
Committed: Tue Jun 6 14:18:05 2017 -0400

--
 python/setup.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)
--


http://git-wip-us.apache.org/repos/asf/arrow/blob/a367fd43/python/setup.py
--
diff --git a/python/setup.py b/python/setup.py
index b64e259..817c59f 100644
--- a/python/setup.py
+++ b/python/setup.py
@@ -349,7 +349,7 @@ setup(
 name="pyarrow",
 packages=['pyarrow', 'pyarrow.tests'],
 zip_safe=False,
-package_data={'pyarrow': ['*.pxd', '*.pyx']},
+package_data={'pyarrow': ['*.pxd', '*.pyx', 'includes/*.pxd']},
 include_package_data=True,
 distclass=BinaryDistribution,
 # Dummy extension to trigger build_ext