TestValidateVectorFull.java

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.arrow.vector.validate;

import static org.apache.arrow.vector.testing.ValueVectorDataPopulator.setVector;
import static org.apache.arrow.vector.util.ValueVectorUtility.validateFull;
import static org.junit.jupiter.api.Assertions.assertEquals;
import static org.junit.jupiter.api.Assertions.assertThrows;
import static org.junit.jupiter.api.Assertions.assertTrue;

import java.nio.charset.StandardCharsets;
import java.util.Arrays;
import org.apache.arrow.memory.ArrowBuf;
import org.apache.arrow.memory.BufferAllocator;
import org.apache.arrow.memory.RootAllocator;
import org.apache.arrow.vector.Decimal256Vector;
import org.apache.arrow.vector.DecimalVector;
import org.apache.arrow.vector.Float4Vector;
import org.apache.arrow.vector.IntVector;
import org.apache.arrow.vector.LargeVarCharVector;
import org.apache.arrow.vector.ValueVector;
import org.apache.arrow.vector.VarCharVector;
import org.apache.arrow.vector.complex.DenseUnionVector;
import org.apache.arrow.vector.complex.LargeListVector;
import org.apache.arrow.vector.complex.ListVector;
import org.apache.arrow.vector.complex.StructVector;
import org.apache.arrow.vector.complex.UnionVector;
import org.apache.arrow.vector.holders.NullableFloat4Holder;
import org.apache.arrow.vector.holders.NullableFloat8Holder;
import org.apache.arrow.vector.testing.ValueVectorDataPopulator;
import org.apache.arrow.vector.types.Types;
import org.apache.arrow.vector.types.pojo.ArrowType;
import org.apache.arrow.vector.types.pojo.Field;
import org.apache.arrow.vector.types.pojo.FieldType;
import org.junit.jupiter.api.AfterEach;
import org.junit.jupiter.api.BeforeEach;
import org.junit.jupiter.api.Test;

public class TestValidateVectorFull {

  private BufferAllocator allocator;

  @BeforeEach
  public void init() {
    allocator = new RootAllocator(Long.MAX_VALUE);
  }

  @AfterEach
  public void terminate() throws Exception {
    allocator.close();
  }

  @Test
  public void testBaseVariableWidthVector() {
    try (final VarCharVector vector = new VarCharVector("v", allocator)) {
      validateFull(vector);
      setVector(vector, "aaa", "bbb", "ccc");
      validateFull(vector);

      ArrowBuf offsetBuf = vector.getOffsetBuffer();
      offsetBuf.setInt(0, 100);
      offsetBuf.setInt(4, 50);

      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, () -> validateFull(vector));
      assertTrue(
          e.getMessage()
              .contains("The values in positions 0 and 1 of the offset buffer are decreasing"));
    }
  }

  @Test
  public void testBaseLargeVariableWidthVector() {
    try (final LargeVarCharVector vector = new LargeVarCharVector("v", allocator)) {
      validateFull(vector);
      setVector(vector, "aaa", "bbb", null, "ccc");
      validateFull(vector);

      ArrowBuf offsetBuf = vector.getOffsetBuffer();
      offsetBuf.setLong(0, 100);
      offsetBuf.setLong(8, 50);

      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, () -> validateFull(vector));
      assertTrue(
          e.getMessage()
              .contains(
                  "The values in positions 0 and 1 of the large offset buffer are decreasing"));
    }
  }

  @Test
  public void testListVector() {
    try (final ListVector vector = ListVector.empty("v", allocator)) {
      validateFull(vector);
      setVector(vector, Arrays.asList(1, 2, 3), Arrays.asList(4, 5), Arrays.asList(6, 7, 8, 9));
      validateFull(vector);

      ArrowBuf offsetBuf = vector.getOffsetBuffer();
      offsetBuf.setInt(0, 100);
      offsetBuf.setInt(8, 50);

      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, () -> validateFull(vector));
      assertTrue(
          e.getMessage()
              .contains("The values in positions 0 and 1 of the offset buffer are decreasing"));
    }
  }

  @Test
  public void testLargeListVector() {
    try (final LargeListVector vector = LargeListVector.empty("v", allocator)) {
      validateFull(vector);
      setVector(vector, Arrays.asList(1, 2, 3), Arrays.asList(4, 5), Arrays.asList(6, 7, 8, 9));
      validateFull(vector);

      ArrowBuf offsetBuf = vector.getOffsetBuffer();
      offsetBuf.setLong(0, 100);
      offsetBuf.setLong(16, 50);

      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, () -> validateFull(vector));
      assertTrue(
          e.getMessage()
              .contains(
                  "The values in positions 0 and 1 of the large offset buffer are decreasing"));
    }
  }

  @Test
  public void testStructVectorRangeEquals() {
    try (final StructVector vector = StructVector.empty("struct", allocator)) {
      IntVector intVector =
          vector.addOrGet("f0", FieldType.nullable(new ArrowType.Int(32, true)), IntVector.class);
      VarCharVector strVector =
          vector.addOrGet("f1", FieldType.nullable(new ArrowType.Utf8()), VarCharVector.class);

      validateFull(vector);
      validateFull(intVector);
      validateFull(strVector);

      ValueVectorDataPopulator.setVector(intVector, 1, 2, 3, 4, 5);
      ValueVectorDataPopulator.setVector(strVector, "a", "b", "c", "d", "e");
      vector.setValueCount(5);

      validateFull(vector);
      validateFull(intVector);
      validateFull(strVector);

      ArrowBuf offsetBuf = strVector.getOffsetBuffer();
      offsetBuf.setInt(0, 100);
      offsetBuf.setInt(8, 50);

      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, () -> validateFull(strVector));
      assertTrue(
          e.getMessage()
              .contains("The values in positions 0 and 1 of the offset buffer are decreasing"));

      e = assertThrows(ValidateUtil.ValidateException.class, () -> validateFull(vector));
      assertTrue(
          e.getMessage()
              .contains("The values in positions 0 and 1 of the offset buffer are decreasing"));
    }
  }

  @Test
  public void testUnionVector() {
    try (final UnionVector vector = UnionVector.empty("union", allocator)) {
      validateFull(vector);

      final NullableFloat4Holder float4Holder = new NullableFloat4Holder();
      float4Holder.value = 1.01f;
      float4Holder.isSet = 1;

      final NullableFloat8Holder float8Holder = new NullableFloat8Holder();
      float8Holder.value = 2.02f;
      float8Holder.isSet = 1;

      vector.setType(0, Types.MinorType.FLOAT4);
      vector.setSafe(0, float4Holder);
      vector.setType(1, Types.MinorType.FLOAT8);
      vector.setSafe(1, float8Holder);
      vector.setValueCount(2);

      validateFull(vector);

      // negative type id
      vector.getTypeBuffer().setByte(0, -1);

      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, () -> validateFull(vector));
      assertTrue(e.getMessage().contains("The type id at position 0 is negative"));
    }
  }

  @Test
  public void testDenseUnionVector() {
    try (final DenseUnionVector vector = DenseUnionVector.empty("union", allocator)) {
      validateFull(vector);

      final NullableFloat4Holder float4Holder = new NullableFloat4Holder();
      float4Holder.value = 1.01f;
      float4Holder.isSet = 1;

      final NullableFloat8Holder float8Holder = new NullableFloat8Holder();
      float8Holder.value = 2.02f;
      float8Holder.isSet = 1;

      byte float4TypeId =
          vector.registerNewTypeId(Field.nullable("", Types.MinorType.FLOAT4.getType()));
      byte float8TypeId =
          vector.registerNewTypeId(Field.nullable("", Types.MinorType.FLOAT8.getType()));

      vector.setTypeId(0, float4TypeId);
      vector.setSafe(0, float4Holder);
      vector.setTypeId(1, float8TypeId);
      vector.setSafe(1, float8Holder);
      vector.setValueCount(2);

      validateFull(vector);

      ValueVector subVector = vector.getVectorByType(float4TypeId);
      assertTrue(subVector instanceof Float4Vector);
      assertEquals(1, subVector.getValueCount());

      // shrink sub-vector
      subVector.setValueCount(0);

      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, () -> validateFull(vector));
      assertTrue(e.getMessage().contains("Dense union vector offset exceeds sub-vector boundary"));
    }
  }

  @Test
  public void testBaseVariableWidthVectorInstanceMethod() {
    try (final VarCharVector vector = new VarCharVector("v", allocator)) {
      vector.validateFull();
      setVector(vector, "aaa", "bbb", "ccc");
      vector.validateFull();

      ArrowBuf offsetBuf = vector.getOffsetBuffer();
      offsetBuf.setInt(0, 100);
      offsetBuf.setInt(4, 50);

      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, vector::validateFull);
      assertTrue(
          e.getMessage()
              .contains("The values in positions 0 and 1 of the offset buffer are decreasing"));
    }
  }

  @Test
  public void testValidateVarCharUTF8() {
    try (final VarCharVector vector = new VarCharVector("v", allocator)) {
      vector.validateFull();
      setVector(
          vector,
          "aaa".getBytes(StandardCharsets.UTF_8),
          "bbb".getBytes(StandardCharsets.UTF_8),
          new byte[] {(byte) 0xFF, (byte) 0xFE});
      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, vector::validateFull);
      assertTrue(e.getMessage().contains("UTF"));
    }
  }

  @Test
  public void testValidateLargeVarCharUTF8() {
    try (final LargeVarCharVector vector = new LargeVarCharVector("v", allocator)) {
      vector.validateFull();
      setVector(
          vector,
          "aaa".getBytes(StandardCharsets.UTF_8),
          "bbb".getBytes(StandardCharsets.UTF_8),
          new byte[] {(byte) 0xFF, (byte) 0xFE});
      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, vector::validateFull);
      assertTrue(e.getMessage().contains("UTF"));
    }
  }

  @Test
  public void testValidateDecimal() {
    try (final DecimalVector vector =
        new DecimalVector(
            Field.nullable("v", new ArrowType.Decimal(2, 0, DecimalVector.TYPE_WIDTH * 8)),
            allocator)) {
      vector.validateFull();
      setVector(vector, 1L);
      vector.validateFull();
      vector.clear();
      setVector(vector, Long.MAX_VALUE);
      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, vector::validateFull);
      assertTrue(e.getMessage().contains("Decimal"));
    }
  }

  @Test
  public void testValidateDecimal256() {
    try (final Decimal256Vector vector =
        new Decimal256Vector(
            Field.nullable("v", new ArrowType.Decimal(2, 0, DecimalVector.TYPE_WIDTH * 8)),
            allocator)) {
      vector.validateFull();
      setVector(vector, 1L);
      vector.validateFull();
      vector.clear();
      setVector(vector, Long.MAX_VALUE);
      ValidateUtil.ValidateException e =
          assertThrows(ValidateUtil.ValidateException.class, vector::validateFull);
      assertTrue(e.getMessage().contains("Decimal"));
    }
  }
}