rdblue commented on code in PR #3197: URL: https://github.com/apache/parquet-java/pull/3197#discussion_r2056641009
########## parquet-variant/src/main/java/org/apache/parquet/variant/Variant.java: ########## @@ -0,0 +1,313 @@ +/* + * Licensed to the Apache Software Foundation (ASF) under one + * or more contributor license agreements. See the NOTICE file + * distributed with this work for additional information + * regarding copyright ownership. The ASF licenses this file + * to you under the Apache License, Version 2.0 (the + * "License"); you may not use this file except in compliance + * with the License. You may obtain a copy of the License at + * + * http://www.apache.org/licenses/LICENSE-2.0 + * + * Unless required by applicable law or agreed to in writing, + * software distributed under the License is distributed on an + * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY + * KIND, either express or implied. See the License for the + * specific language governing permissions and limitations + * under the License. + */ +package org.apache.parquet.variant; + +import java.math.BigDecimal; +import java.nio.ByteBuffer; +import java.util.UUID; + +/** + * This Variant class holds the Variant-encoded value and metadata binary values. + */ +public final class Variant { + /** The buffer that contains the Variant value. */ + final ByteBuffer value; + + /** The buffer that contains the Variant metadata. */ + final ByteBuffer metadata; + + /** + * The threshold to switch from linear search to binary search when looking up a field by key in + * an object. This is a performance optimization to avoid the overhead of binary search for a + * short list. 
+ */ + static final int BINARY_SEARCH_THRESHOLD = 32; + + public Variant(byte[] value, byte[] metadata) { + this(value, 0, value.length, metadata, 0, metadata.length); + } + + public Variant(byte[] value, int valuePos, int valueLength, byte[] metadata, int metadataPos, int metadataLength) { + this(ByteBuffer.wrap(value, valuePos, valueLength), ByteBuffer.wrap(metadata, metadataPos, metadataLength)); + } + + public Variant(ByteBuffer value, ByteBuffer metadata) { + // The buffers are read single-byte at a time, so the endianness of the input buffers + // is not important. + this.value = value.asReadOnlyBuffer(); + this.metadata = metadata.asReadOnlyBuffer(); + + // There is currently only one allowed version. + if ((metadata.get(metadata.position()) & VariantUtil.VERSION_MASK) != VariantUtil.VERSION) { + throw new UnsupportedOperationException(String.format( + "Unsupported variant metadata version: %d", + metadata.get(metadata.position()) & VariantUtil.VERSION_MASK)); + } + } + + /** + * @return the boolean value + */ + public boolean getBoolean() { + return VariantUtil.getBoolean(value); + } + + /** + * @return the byte value + */ + public byte getByte() { + long longValue = VariantUtil.getLong(value); + if (longValue < Byte.MIN_VALUE || longValue > Byte.MAX_VALUE) { + throw new IllegalStateException("Value out of range for byte: " + longValue); + } + return (byte) longValue; + } + + /** + * @return the short value + */ + public short getShort() { + long longValue = VariantUtil.getLong(value); + if (longValue < Short.MIN_VALUE || longValue > Short.MAX_VALUE) { + throw new IllegalStateException("Value out of range for short: " + longValue); + } + return (short) longValue; + } + + /** + * @return the int value + */ + public int getInt() { + long longValue = VariantUtil.getLong(value); + if (longValue < Integer.MIN_VALUE || longValue > Integer.MAX_VALUE) { + throw new IllegalStateException("Value out of range for int: " + longValue); + } + return (int) longValue; + } 
+ + /** + * @return the long value + */ + public long getLong() { + return VariantUtil.getLong(value); + } + + /** + * @return the double value + */ + public double getDouble() { + return VariantUtil.getDouble(value); + } + + /** + * @return the decimal value + */ + public BigDecimal getDecimal() { + return VariantUtil.getDecimal(value); + } + + /** + * @return the float value + */ + public float getFloat() { + return VariantUtil.getFloat(value); + } + + /** + * @return the binary value + */ + public ByteBuffer getBinary() { + return VariantUtil.getBinary(value); + } + + /** + * @return the UUID value + */ + public UUID getUUID() { + return VariantUtil.getUUID(value); + } + + /** + * @return the string value + */ + public String getString() { + return VariantUtil.getString(value); + } + + /** + * The value type of Variant value. It is determined by the header byte. + */ + public enum Type { + OBJECT, + ARRAY, + NULL, + BOOLEAN, + BYTE, + SHORT, + INT, + LONG, + STRING, + DOUBLE, + DECIMAL4, + DECIMAL8, + DECIMAL16, + DATE, + TIMESTAMP_TZ, + TIMESTAMP_NTZ, + FLOAT, + BINARY, + TIME, + TIMESTAMP_NANOS, Review Comment: This should also have a `_TZ` suffix. -- This is an automated message from the Apache Git Service. To respond to the message, please log on to GitHub and use the URL above to go to the specific comment. To unsubscribe, e-mail: [email protected] For queries about this service, please contact Infrastructure at: [email protected] --------------------------------------------------------------------- To unsubscribe, e-mail: [email protected] For additional commands, e-mail: [email protected]
