[
https://issues.apache.org/jira/browse/ASTERIXDB-3620?page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel&focusedCommentId=17956800#comment-17956800
]
ASF subversion and git services commented on ASTERIXDB-3620:
------------------------------------------------------------
Commit a013fb7a89580a1c90f82e6d01dc0078ac4bcd93 in asterixdb's branch
refs/heads/master from Peeyush Gupta
[ https://gitbox.apache.org/repos/asf?p=asterixdb.git;h=a013fb7a89 ]
[ASTERIXDB-3620][STO] Fix writing null values to columnar storage
- user model changes: no
- storage format changes: no
- interface changes: no
Ext-ref: MB-67051
Change-Id: I32f8c19c80c5ac898781a4931a30459b3a801e4d
Reviewed-on: https://asterix-gerrit.ics.uci.edu/c/asterixdb/+/19873
Reviewed-by: Ritik Raj <[email protected]>
Tested-by: Jenkins <[email protected]>
Integration-Tests: Jenkins <[email protected]>
> Exception on querying on columnar data
> --------------------------------------
>
> Key: ASTERIXDB-3620
> URL: https://issues.apache.org/jira/browse/ASTERIXDB-3620
> Project: Apache AsterixDB
> Issue Type: Bug
> Components: STO - Storage
> Reporter: Peeyush Gupta
> Priority: Major
>
> Steps to reproduce:
> Create a collection:
>
> {{CREATE COLLECTION Events PRIMARY KEY (id:string)}}
> Get GitHub Events data using:
>
> {{wget https://data.gharchive.org/2015-01-01-15.json.gz}}
> Load this JSONL data into the Events collection.
> Run the following query:
>
> {{SELECT * FROM Events}}
> This causes the following exception:
>
> {{2025-06-03T16:30:01.510+00:00 WARN CBAS.apache.asterix
> [Executor-29:ClusterController]
> org.apache.parquet.io.ParquetDecodingException: no more value to read, total
> value count is 1
> org.apache.hyracks.api.exceptions.HyracksDataException:
> org.apache.parquet.io.ParquetDecodingException: no more value to read, total
> value count is 1
> at
> org.apache.hyracks.api.exceptions.HyracksDataException.create(HyracksDataException.java:70)
> ~[hyracks-api-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.hyracks.api.util.ExceptionUtils.setNodeIds(ExceptionUtils.java:74)
> ~[hyracks-api-1.1.1-1302.jar:1.1.1-1302]
> at org.apache.hyracks.control.nc.Task.run(Task.java:399)
> ~[hyracks-control-nc-1.1.1-1302.jar:1.1.1-1302]
> at
> java.base/java.util.concurrent.ThreadPoolExecutor.runWorker(ThreadPoolExecutor.java:1144)
> ~[?:?]
> at
> java.base/java.util.concurrent.ThreadPoolExecutor$Worker.run(ThreadPoolExecutor.java:642)
> ~[?:?]
> at java.base/java.lang.Thread.run(Thread.java:1583) [?:?]
> Caused by: org.apache.parquet.io.ParquetDecodingException: no more value to
> read, total value count is 1
> at
> org.apache.asterix.column.bytes.decoder.ParquetDeltaBinaryPackingValuesReader.checkRead(ParquetDeltaBinaryPackingValuesReader.java:127)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.asterix.column.bytes.decoder.ParquetDeltaBinaryPackingValuesReader.readLong(ParquetDeltaBinaryPackingValuesReader.java:120)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.asterix.column.bytes.decoder.ParquetDeltaBinaryPackingValuesReader.readInteger(ParquetDeltaBinaryPackingValuesReader.java:115)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.asterix.column.bytes.decoder.ParquetDeltaByteArrayReader.readBytes(ParquetDeltaByteArrayReader.java:69)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.asterix.column.values.reader.value.StringValueReader.nextValue(StringValueReader.java:44)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.asterix.column.values.reader.PrimitiveColumnValuesReader.next(PrimitiveColumnValuesReader.java:60)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.asterix.column.assembler.PrimitiveValueAssembler.next(PrimitiveValueAssembler.java:49)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.asterix.column.operation.query.ColumnAssembler.nextValue(ColumnAssembler.java:87)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.asterix.column.tuple.QueryColumnTupleReference.getAssembledValue(QueryColumnTupleReference.java:165)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.asterix.column.operation.query.QueryColumnTupleProjector.getAssembledValue(QueryColumnTupleProjector.java:115)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.asterix.column.operation.query.QueryColumnTupleProjector.project(QueryColumnTupleProjector.java:93)
> ~[asterix-column-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.hyracks.storage.am.common.dataflow.IndexSearchOperatorNodePushable.writeTupleToOutput(IndexSearchOperatorNodePushable.java:401)
> ~[hyracks-storage-am-common-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.hyracks.storage.am.common.dataflow.IndexSearchOperatorNodePushable.writeSearchResults(IndexSearchOperatorNodePushable.java:274)
> ~[hyracks-storage-am-common-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.hyracks.storage.am.common.dataflow.IndexSearchOperatorNodePushable.searchAllPartitions(IndexSearchOperatorNodePushable.java:470)
> ~[hyracks-storage-am-common-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.hyracks.storage.am.common.dataflow.IndexSearchOperatorNodePushable.nextFrame(IndexSearchOperatorNodePushable.java:316)
> ~[hyracks-storage-am-common-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.hyracks.dataflow.common.comm.io.AbstractFrameAppender.write(AbstractFrameAppender.java:94)
> ~[hyracks-dataflow-common-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.hyracks.algebricks.runtime.operators.std.EmptyTupleSourceRuntimeFactory$1.open(EmptyTupleSourceRuntimeFactory.java:55)
> ~[algebricks-runtime-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.hyracks.algebricks.runtime.operators.meta.AlgebricksMetaOperatorDescriptor$SourcePushRuntime.initialize(AlgebricksMetaOperatorDescriptor.java:176)
> ~[algebricks-runtime-1.1.1-1302.jar:1.1.1-1302]
> at
> org.apache.hyracks.api.rewriter.runtime.SuperActivityOperatorNodePushable.lambda$runInParallel$0(SuperActivityOperatorNodePushable.java:245)
> ~[hyracks-api-1.1.1-1302.jar:1.1.1-1302]
> at java.base/java.util.concurrent.FutureTask.run(FutureTask.java:317)
> ~[?:?]
> ... 3 more}}
>
--
This message was sent by Atlassian Jira
(v8.20.10#820010)