This is an automated email from the ASF dual-hosted git repository.
kou pushed a commit to branch master
in repository https://gitbox.apache.org/repos/asf/arrow.git
The following commit(s) were added to refs/heads/master by this push:
new 79810a5491 ARROW-15936 [Ruby] Add test for Arrow::DictionaryArray#raw_records
79810a5491 is described below
commit 79810a54913d328f06c29395ec5a086b3aa90fcc
Author: okadakk <[email protected]>
AuthorDate: Thu May 19 10:53:09 2022 +0900
ARROW-15936 [Ruby] Add test for Arrow::DictionaryArray#raw_records
I added test for Arrow::DictionaryArray#raw_records.
Closes #12904 from okadakk/arrow-ruby-add-test-for-arrow-dictionary-array-raw-records
Authored-by: okadakk <[email protected]>
Signed-off-by: Sutou Kouhei <[email protected]>
---
.../test/raw-records/test-dictionary-array.rb | 311 +++++++++++++++++++++
1 file changed, 311 insertions(+)
diff --git a/ruby/red-arrow/test/raw-records/test-dictionary-array.rb b/ruby/red-arrow/test/raw-records/test-dictionary-array.rb
new file mode 100644
index 0000000000..cac547caf7
--- /dev/null
+++ b/ruby/red-arrow/test/raw-records/test-dictionary-array.rb
@@ -0,0 +1,311 @@
+# Licensed to the Apache Software Foundation (ASF) under one
+# or more contributor license agreements. See the NOTICE file
+# distributed with this work for additional information
+# regarding copyright ownership. The ASF licenses this file
+# to you under the Apache License, Version 2.0 (the
+# "License"); you may not use this file except in compliance
+# with the License. You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing,
+# software distributed under the License is distributed on an
+# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+# KIND, either express or implied. See the License for the
+# specific language governing permissions and limitations
+# under the License.
+
+module RawRecordsDictionaryArrayTests
+ def build_record_batch(array)
+ dictionary = array.dictionary_encode
+ schema = Arrow::Schema.new(column: dictionary.value_data_type)
+ Arrow::RecordBatch.new(schema, array.length, [dictionary])
+ end
+
+ def test_null
+ records = [
+ [nil],
+ [nil],
+ [nil],
+ [nil],
+ ]
+ target = build(Arrow::NullArray.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_boolean
+ records = [
+ [true],
+ [nil],
+ [false],
+ ]
+ target = build(Arrow::BooleanArray.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_int8
+ records = [
+ [-(2 ** 7)],
+ [nil],
+ [(2 ** 7) - 1],
+ ]
+ target = build(Arrow::Int8Array.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_uint8
+ records = [
+ [0],
+ [nil],
+ [(2 ** 8) - 1],
+ ]
+ target = build(Arrow::UInt8Array.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_int16
+ records = [
+ [-(2 ** 15)],
+ [nil],
+ [(2 ** 15) - 1],
+ ]
+ target = build(Arrow::Int16Array.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_uint16
+ records = [
+ [0],
+ [nil],
+ [(2 ** 16) - 1],
+ ]
+ target = build(Arrow::UInt16Array.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_int32
+ records = [
+ [-(2 ** 31)],
+ [nil],
+ [(2 ** 31) - 1],
+ ]
+ target = build(Arrow::Int32Array.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_uint32
+ records = [
+ [0],
+ [nil],
+ [(2 ** 32) - 1],
+ ]
+ target = build(Arrow::UInt32Array.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_int64
+ records = [
+ [-(2 ** 63)],
+ [nil],
+ [(2 ** 63) - 1],
+ ]
+ target = build(Arrow::Int64Array.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_uint64
+ records = [
+ [0],
+ [nil],
+ [(2 ** 64) - 1],
+ ]
+ target = build(Arrow::UInt64Array.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_float
+ records = [
+ [-1.0],
+ [nil],
+ [1.0],
+ ]
+ target = build(Arrow::FloatArray.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_double
+ records = [
+ [-1.0],
+ [nil],
+ [1.0],
+ ]
+ target = build(Arrow::DoubleArray.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_binary
+ records = [
+ ["\x00".b],
+ [nil],
+ ["\xff".b],
+ ]
+ target = build(Arrow::BinaryArray.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_string
+ records = [
+ ["Ruby"],
+ [nil],
+ ["\u3042"], # U+3042 HIRAGANA LETTER A
+ ]
+ target = build(Arrow::StringArray.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_date32
+ records = [
+ [Date.new(1960, 1, 1)],
+ [nil],
+ [Date.new(2017, 8, 23)],
+ ]
+ target = build(Arrow::Date32Array.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_date64
+ records = [
+ [DateTime.new(1960, 1, 1, 2, 9, 30)],
+ [nil],
+ [DateTime.new(2017, 8, 23, 14, 57, 2)],
+ ]
+ target = build(Arrow::Date64Array.new(records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_timestamp_second
+ records = [
+ [Time.parse("1960-01-01T02:09:30Z")],
+ [nil],
+ [Time.parse("2017-08-23T14:57:02Z")],
+ ]
+ target = build(Arrow::TimestampArray.new(:second, records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_timestamp_milli
+ records = [
+ [Time.parse("1960-01-01T02:09:30.123Z")],
+ [nil],
+ [Time.parse("2017-08-23T14:57:02.987Z")],
+ ]
+ target = build(Arrow::TimestampArray.new(:milli, records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_timestamp_micro
+ records = [
+ [Time.parse("1960-01-01T02:09:30.123456Z")],
+ [nil],
+ [Time.parse("2017-08-23T14:57:02.987654Z")],
+ ]
+ target = build(Arrow::TimestampArray.new(:micro, records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_timestamp_nano
+ records = [
+ [Time.parse("1960-01-01T02:09:30.123456789Z")],
+ [nil],
+ [Time.parse("2017-08-23T14:57:02.987654321Z")],
+ ]
+ target = build(Arrow::TimestampArray.new(:nano, records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_time32_second
+ unit = Arrow::TimeUnit::SECOND
+ records = [
+ [Arrow::Time.new(unit, 60 * 10)], # 00:10:00
+ [nil],
+ [Arrow::Time.new(unit, 60 * 60 * 2 + 9)], # 02:00:09
+ ]
+ target = build(Arrow::Time32Array.new(unit, records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_time32_milli
+ unit = Arrow::TimeUnit::MILLI
+ records = [
+ [Arrow::Time.new(unit, (60 * 10) * 1000 + 123)], # 00:10:00.123
+ [nil],
+ [Arrow::Time.new(unit, (60 * 60 * 2 + 9) * 1000 + 987)], # 02:00:09.987
+ ]
+ target = build(Arrow::Time32Array.new(unit, records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_time64_micro
+ unit = Arrow::TimeUnit::MICRO
+ records = [
+ # 00:10:00.123456
+ [Arrow::Time.new(unit, (60 * 10) * 1_000_000 + 123_456)],
+ [nil],
+ # 02:00:09.987654
+ [Arrow::Time.new(unit, (60 * 60 * 2 + 9) * 1_000_000 + 987_654)],
+ ]
+ target = build(Arrow::Time64Array.new(unit, records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_time64_nano
+ unit = Arrow::TimeUnit::NANO
+ records = [
+ # 00:10:00.123456789
+ [Arrow::Time.new(unit, (60 * 10) * 1_000_000_000 + 123_456_789)],
+ [nil],
+ # 02:00:09.987654321
+ [Arrow::Time.new(unit, (60 * 60 * 2 + 9) * 1_000_000_000 + 987_654_321)],
+ ]
+ target = build(Arrow::Time64Array.new(unit, records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_decimal128
+ records = [
+ [BigDecimal("92.92")],
+ [nil],
+ [BigDecimal("29.29")],
+ ]
+ data_type = Arrow::Decimal128DataType.new(8, 2)
+ target = build(Arrow::Decimal128Array.new(data_type, records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+
+ def test_decimal256
+ records = [
+ [BigDecimal("92.92")],
+ [nil],
+ [BigDecimal("29.29")],
+ ]
+ data_type = Arrow::Decimal256DataType.new(38, 2)
+ target = build(Arrow::Decimal256Array.new(data_type, records.collect(&:first)))
+ assert_equal(records, target.raw_records)
+ end
+end
+
+class RawRecordsRecordBatchDictionaryArraysTest < Test::Unit::TestCase
+ include RawRecordsDictionaryArrayTests
+
+ def build(array)
+ build_record_batch(array)
+ end
+end
+
+class RawRecordsTableDictionaryArraysTest < Test::Unit::TestCase
+ include RawRecordsDictionaryArrayTests
+
+ def build(array)
+ build_record_batch(array).to_table
+ end
+end