From 1cc49ad4cba8b6eaf8d1709da49b2a25cb1c9034 Mon Sep 17 00:00:00 2001
From: eadwright
Date: Tue, 4 May 2021 14:24:01 +0100
Subject: [PATCH 1/7] PARQUET-1633 Fix integer overflow

---
 .../apache/parquet/hadoop/ParquetFileReader.java | 16 ++++++++--------
 1 file changed, 8 insertions(+), 8 deletions(-)

diff --git a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java
index 1fa9c1f44d..c2b27f88bf 100644
--- a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java
+++ b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java
@@ -944,7 +944,7 @@ private ColumnChunkPageReadStore internalReadRowGroup(int blockIndex) throws IOE
           currentParts = new ConsecutivePartList(startingPos);
           allParts.add(currentParts);
         }
-        currentParts.addChunk(new ChunkDescriptor(columnDescriptor, mc, startingPos, (int)mc.getTotalSize()));
+        currentParts.addChunk(new ChunkDescriptor(columnDescriptor, mc, startingPos, mc.getTotalSize()));
       }
     }
     // actually read all the chunks
@@ -1066,7 +1066,7 @@ private ColumnChunkPageReadStore internalReadFilteredRowGroup(BlockMetaData bloc
             allParts.add(currentParts);
           }
           ChunkDescriptor chunkDescriptor = new ChunkDescriptor(columnDescriptor, mc, startingPos,
-              Math.toIntExact(range.getLength()));
+              range.getLength());
           currentParts.addChunk(chunkDescriptor);
           builder.setOffsetIndex(chunkDescriptor, filteredOffsetIndex);
         }
@@ -1464,7 +1464,7 @@ protected PageHeader readPageHeader(BlockCipher.Decryptor blockDecryptor, byte[]
    */
   private void verifyCrc(int referenceCrc, byte[] bytes, String exceptionMsg) {
     crc.reset();
-    crc.update(bytes);
+    crc.update(bytes, 0, bytes.length);
     if (crc.getValue() != ((long) referenceCrc & 0xffffffffL)) {
       throw new ParquetDecodingException(exceptionMsg);
     }
@@ -1691,7 +1691,7 @@ private static class ChunkDescriptor {
     private final ColumnDescriptor col;
     private final ColumnChunkMetaData metadata;
     private final long fileOffset;
-    private final int size;
+    private final long size;
 
     /**
      * @param col column this chunk is part of
@@ -1703,7 +1703,7 @@ private ChunkDescriptor(
         ColumnDescriptor col,
         ColumnChunkMetaData metadata,
         long fileOffset,
-        int size) {
+        long size) {
       super();
       this.col = col;
       this.metadata = metadata;
@@ -1735,7 +1735,7 @@ public boolean equals(Object obj) {
   private class ConsecutivePartList {
 
     private final long offset;
-    private int length;
+    private long length;
     private final List<ChunkDescriptor> chunks = new ArrayList<>();
 
     /**
@@ -1763,8 +1763,8 @@ public void addChunk(ChunkDescriptor descriptor) {
     public void readAll(SeekableInputStream f, ChunkListBuilder builder) throws IOException {
       f.seek(offset);
 
-      int fullAllocations = length / options.getMaxAllocationSize();
-      int lastAllocationSize = length % options.getMaxAllocationSize();
+      int fullAllocations = (int)(length / options.getMaxAllocationSize());
+      int lastAllocationSize = (int)(length % options.getMaxAllocationSize());
 
       int numAllocations = fullAllocations + (lastAllocationSize > 0 ? 1 : 0);
       List<ByteBuffer> buffers = new ArrayList<>(numAllocations);

From 481b348d9f55376dbbf16ad650dc74759d30fcdf Mon Sep 17 00:00:00 2001
From: eadwright
Date: Tue, 18 May 2021 22:17:37 +0100
Subject: [PATCH 2/7] PARQUET-1633 Undo Java 8 change

---
 .../main/java/org/apache/parquet/hadoop/ParquetFileReader.java | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java
index c2b27f88bf..32f38b747f 100644
--- a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java
+++ b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java
@@ -1464,7 +1464,7 @@ protected PageHeader readPageHeader(BlockCipher.Decryptor blockDecryptor, byte[]
    */
   private void verifyCrc(int referenceCrc, byte[] bytes, String exceptionMsg) {
     crc.reset();
-    crc.update(bytes, 0, bytes.length);
+    crc.update(bytes);
     if (crc.getValue() != ((long) referenceCrc & 0xffffffffL)) {
       throw new ParquetDecodingException(exceptionMsg);
     }

From 4dd697793c0ab148c4a37c7185a9ac6937dd0977 Mon Sep 17 00:00:00 2001
From: eadwright
Date: Wed, 19 May 2021 09:18:34 +0100
Subject: [PATCH 3/7] PARQUET-1633 Use Math.toIntExact()

---
 .../java/org/apache/parquet/hadoop/ParquetFileReader.java | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java
index 32f38b747f..3a68e0133b 100644
--- a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java
+++ b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetFileReader.java
@@ -1763,8 +1763,8 @@ public void addChunk(ChunkDescriptor descriptor) {
     public void readAll(SeekableInputStream f, ChunkListBuilder builder) throws IOException {
       f.seek(offset);
 
-      int fullAllocations = (int)(length / options.getMaxAllocationSize());
-      int lastAllocationSize = (int)(length % options.getMaxAllocationSize());
+      int fullAllocations = Math.toIntExact(length / options.getMaxAllocationSize());
+      int lastAllocationSize = Math.toIntExact(length % options.getMaxAllocationSize());
 
       int numAllocations = fullAllocations + (lastAllocationSize > 0 ? 1 : 0);
       List<ByteBuffer> buffers = new ArrayList<>(numAllocations);
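The point of the three patches above is that a column chunk's total size no longer has to fit in an int; only each individual buffer allocation does. The standalone sketch below (not part of the patch series; the AllocationPlan class and the 8 MiB maximum allocation size are illustrative assumptions) shows the same arithmetic in isolation:

```java
import java.util.ArrayList;
import java.util.List;

// Hypothetical illustration only; not a class from parquet-mr.
public class AllocationPlan {

  // Split a chunk length that may exceed Integer.MAX_VALUE into per-buffer sizes
  // that each fit in an int, mirroring the long-based arithmetic in readAll().
  static List<Integer> bufferSizes(long length, int maxAllocationSize) {
    int fullAllocations = Math.toIntExact(length / maxAllocationSize);
    int lastAllocationSize = Math.toIntExact(length % maxAllocationSize);
    int numAllocations = fullAllocations + (lastAllocationSize > 0 ? 1 : 0);

    List<Integer> sizes = new ArrayList<>(numAllocations);
    for (int i = 0; i < fullAllocations; i++) {
      sizes.add(maxAllocationSize);
    }
    if (lastAllocationSize > 0) {
      sizes.add(lastAllocationSize);
    }
    return sizes;
  }

  public static void main(String[] args) {
    long chunkLength = 3L * 1024 * 1024 * 1024;  // a 3 GiB column chunk
    System.out.println((int) chunkLength);       // the old int cast wraps to -1073741824
    System.out.println(bufferSizes(chunkLength, 8 * 1024 * 1024).size()); // 384 buffer sizes
  }
}
```

Math.toIntExact throws ArithmeticException instead of silently wrapping, which is why patch 3 prefers it over the plain (int) casts introduced in patch 1.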
From fcaf41269470c03c088b7eb5598558d44013f59d Mon Sep 17 00:00:00 2001
From: Gabor Szadovszky
Date: Wed, 26 May 2021 18:36:56 +0200
Subject: [PATCH 4/7] PARQUET-1633: Unit test

- Updated ParquetWriter to support setting row group size in long
- Removed Xmx settings in the pom to allow more memory for the tests
---
 .../apache/parquet/hadoop/ParquetWriter.java  |  16 +-
 .../parquet/hadoop/TestLargeColumnChunk.java  | 146 ++++++++++++++++++
 pom.xml                                       |   3 +-
 3 files changed, 161 insertions(+), 4 deletions(-)
 create mode 100644 parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java

diff --git a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetWriter.java b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetWriter.java
index 696fec3140..b9953a57f3 100644
--- a/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetWriter.java
+++ b/parquet-hadoop/src/main/java/org/apache/parquet/hadoop/ParquetWriter.java
@@ -269,7 +269,7 @@ public ParquetWriter(Path file, Configuration conf, WriteSupport<T> writeSupport
       ParquetFileWriter.Mode mode,
       WriteSupport<T> writeSupport,
       CompressionCodecName compressionCodecName,
-      int rowGroupSize,
+      long rowGroupSize,
       boolean validating,
       Configuration conf,
       int maxPaddingSize,
@@ -355,7 +355,7 @@ public abstract static class Builder<T, SELF extends Builder<T, SELF>> {
     private Configuration conf = new Configuration();
     private ParquetFileWriter.Mode mode;
     private CompressionCodecName codecName = DEFAULT_COMPRESSION_CODEC_NAME;
-    private int rowGroupSize = DEFAULT_BLOCK_SIZE;
+    private long rowGroupSize = DEFAULT_BLOCK_SIZE;
     private int maxPaddingSize = MAX_PADDING_SIZE_DEFAULT;
     private boolean enableValidation = DEFAULT_IS_VALIDATING_ENABLED;
     private ParquetProperties.Builder encodingPropsBuilder =
@@ -432,8 +432,20 @@ public SELF withEncryption (FileEncryptionProperties encryptionProperties) {
      *
      * @param rowGroupSize an integer size in bytes
      * @return this builder for method chaining.
+     * @deprecated Use {@link #withRowGroupSize(long)} instead
      */
+    @Deprecated
     public SELF withRowGroupSize(int rowGroupSize) {
+      return withRowGroupSize((long) rowGroupSize);
+    }
+
+    /**
+     * Set the Parquet format row group size used by the constructed writer.
+     *
+     * @param rowGroupSize an integer size in bytes
+     * @return this builder for method chaining.
+     */
+    public SELF withRowGroupSize(long rowGroupSize) {
       this.rowGroupSize = rowGroupSize;
       return self();
     }
diff --git a/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java b/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
new file mode 100644
index 0000000000..0ccb9f6d01
--- /dev/null
+++ b/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
@@ -0,0 +1,146 @@
+/*
+ * Licensed to the Apache Software Foundation (ASF) under one
+ * or more contributor license agreements.  See the NOTICE file
+ * distributed with this work for additional information
+ * regarding copyright ownership.  The ASF licenses this file
+ * to you under the Apache License, Version 2.0 (the
+ * "License"); you may not use this file except in compliance
+ * with the License.  You may obtain a copy of the License at
+ *
+ *   http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing,
+ * software distributed under the License is distributed on an
+ * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
+ * KIND, either express or implied.  See the License for the
+ * specific language governing permissions and limitations
+ * under the License.
+ */
+
+package org.apache.parquet.hadoop;
+
+import static org.apache.parquet.filter2.predicate.FilterApi.binaryColumn;
+import static org.apache.parquet.filter2.predicate.FilterApi.eq;
+import static org.apache.parquet.hadoop.ParquetFileWriter.Mode.OVERWRITE;
+import static org.apache.parquet.hadoop.metadata.CompressionCodecName.UNCOMPRESSED;
+import static org.apache.parquet.schema.LogicalTypeAnnotation.stringType;
+import static org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName.BINARY;
+import static org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName.INT64;
+import static org.apache.parquet.schema.Types.buildMessage;
+import static org.apache.parquet.schema.Types.required;
+import static org.junit.Assert.assertEquals;
+import static org.junit.Assert.assertNull;
+
+import java.io.IOException;
+import java.util.Random;
+
+import org.apache.hadoop.conf.Configuration;
+import org.apache.hadoop.fs.Path;
+import org.apache.parquet.example.data.Group;
+import org.apache.parquet.example.data.GroupFactory;
+import org.apache.parquet.example.data.simple.SimpleGroupFactory;
+import org.apache.parquet.filter2.compat.FilterCompat;
+import org.apache.parquet.hadoop.example.ExampleParquetWriter;
+import org.apache.parquet.hadoop.example.GroupReadSupport;
+import org.apache.parquet.hadoop.example.GroupWriteSupport;
+import org.apache.parquet.hadoop.util.HadoopOutputFile;
+import org.apache.parquet.io.api.Binary;
+import org.apache.parquet.schema.MessageType;
+import org.junit.BeforeClass;
+import org.junit.Rule;
+import org.junit.Test;
+import org.junit.rules.TemporaryFolder;
+
+/**
+ * This test is to test parquet-mr working with potential int overflows (when the sizes are greater than
+ * Integer.MAX_VALUE).
+ *
+ * TODO: Check if CI environment can handle the memory consumption and time of this test.
+ */
+public class TestLargeColumnChunk {
+  private static final MessageType SCHEMA = buildMessage().addFields(
+      required(INT64).named("id"),
+      required(BINARY).named("data"))
+      .named("schema");
+  private static final int DATA_SIZE = 256;
+  // Ensure that the size of the column chunk would overflow an int
+  private static final int ROW_COUNT = Integer.MAX_VALUE / DATA_SIZE + 1;
+  private static final long RANDOM_SEED = 42;
+  private static final int ID_INDEX = SCHEMA.getFieldIndex("id");
+  private static final int DATA_INDEX = SCHEMA.getFieldIndex("data");
+
+  private static final long ID_OF_FILTERED_DATA = ROW_COUNT / 2;
+  private static Binary VALUE_IN_DATA;
+  private static Binary VALUE_NOT_IN_DATA;
+  private static Path file;
+
+  @Rule
+  public TemporaryFolder folder = new TemporaryFolder();
+
+  @BeforeClass
+  public static void createFile() throws IOException {
+// TODO: file = new Path(folder.newFile().getAbsolutePath());
+    file = new Path("/tmp/test.parquet");
+
+    GroupFactory factory = new SimpleGroupFactory(SCHEMA);
+    Random random = new Random(RANDOM_SEED);
+    Configuration conf = new Configuration();
+    GroupWriteSupport.setSchema(SCHEMA, conf);
+    try (ParquetWriter<Group> writer = ExampleParquetWriter
+        .builder(HadoopOutputFile.fromPath(file, conf))
+        .withWriteMode(OVERWRITE)
+        .withConf(conf)
+        .withCompressionCodec(UNCOMPRESSED)
+        .withRowGroupSize(4L * 1024 * 1024 * 1024) // 4G to ensure all data goes to one row group
+        .withBloomFilterEnabled(true)
+        .build()) {
+      for (long id = 0; id < ROW_COUNT; ++id) {
+        Group group = factory.newGroup();
+        group.add(ID_INDEX, id);
+        Binary data = nextBinary(random);
+        group.add(DATA_INDEX, data);
+        writer.write(group);
+        if (id == ID_OF_FILTERED_DATA) {
+          VALUE_IN_DATA = data;
+        }
+      }
+    }
+    VALUE_NOT_IN_DATA = nextBinary(random);
+  }
+
+  private static Binary nextBinary(Random random) {
+    byte[] bytes = new byte[DATA_SIZE];
+    random.nextBytes(bytes);
+    return Binary.fromConstantByteArray(bytes);
+  }
+
+  @Test
+  public void validateAllData() throws IOException {
+    Random random = new Random(RANDOM_SEED);
+    try (ParquetReader<Group> reader = ParquetReader.builder(new GroupReadSupport(), file).build()) {
+      for (long id = 0; id < ROW_COUNT; ++id) {
+        Group group = reader.read();
+        assertEquals(id, group.getLong(ID_INDEX, 0));
+        assertEquals(nextBinary(random), group.getBinary(DATA_INDEX, 0));
+      }
+      assertNull("No more record should be read", reader.read());
+    }
+  }
+
+  @Test
+  public void validateFiltering() throws IOException {
+    try (ParquetReader<Group> reader = ParquetReader.builder(new GroupReadSupport(), file)
+        .withFilter(FilterCompat.get(eq(binaryColumn("data"), VALUE_IN_DATA)))
+        .build()) {
+      Group group = reader.read();
+      assertEquals(ID_OF_FILTERED_DATA, group.getLong(ID_INDEX, 0));
+      assertEquals(VALUE_IN_DATA, group.getBinary(DATA_INDEX, 0));
+      assertNull("No more record should be read", reader.read());
+    }
+    try (ParquetReader<Group> reader = ParquetReader.builder(new GroupReadSupport(), file)
+        .withFilter(FilterCompat.get(eq(binaryColumn("data"), VALUE_NOT_IN_DATA)))
+        .build()) {
+      assertNull("No record should be read", reader.read());
+    }
+  }
+}
diff --git a/pom.xml b/pom.xml
index 24f122935f..ecfd17f49f 100644
--- a/pom.xml
+++ b/pom.xml
@@ -109,7 +109,6 @@
 
     1.8
 
-    -Xmx512m
     INFO
 
 
@@ -558,7 +557,7 @@
 
       ci-test
 
         WARN
-        -Xmx512m -XX:MaxJavaStackTraceDepth=10
+        -XX:MaxJavaStackTraceDepth=10
 
 
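Patch 4 widens the builder's row-group size from int to long while keeping the old setter as a deprecated delegate. The same widening pattern, reduced to a self-contained sketch (the SizeBuilder class and its default value below are illustrative, not part of parquet-mr), looks like this:

```java
// Minimal illustration of the int-to-long widening pattern used in ParquetWriter.Builder:
// keep the old int-based setter as a deprecated delegate so existing callers still compile,
// and make the long-based overload the real implementation.
public class SizeBuilder {
  private long rowGroupSize = 128L * 1024 * 1024; // illustrative 128 MiB default

  /** @deprecated Use {@link #withRowGroupSize(long)} instead */
  @Deprecated
  public SizeBuilder withRowGroupSize(int rowGroupSize) {
    return withRowGroupSize((long) rowGroupSize); // widen and delegate
  }

  public SizeBuilder withRowGroupSize(long rowGroupSize) {
    this.rowGroupSize = rowGroupSize;
    return this;
  }

  public long rowGroupSize() {
    return rowGroupSize;
  }

  public static void main(String[] args) {
    // Callers can now request row groups past the old int ceiling, e.g. the 4 GiB used in the test.
    System.out.println(new SizeBuilder().withRowGroupSize(4L * 1024 * 1024 * 1024).rowGroupSize());
  }
}
```

Delegating the int overload to the long one keeps existing callers source-compatible while still allowing sizes larger than Integer.MAX_VALUE.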
From 631eb6bf76067ca31a0a7bf13a0835a5ce41aac6 Mon Sep 17 00:00:00 2001
From: eadwright
Date: Thu, 10 Jun 2021 10:28:25 +0100
Subject: [PATCH 5/7] Test updates from @gszadovszky

---
 .../parquet/hadoop/TestLargeColumnChunk.java | 20 ++++++++++++-------
 1 file changed, 13 insertions(+), 7 deletions(-)

diff --git a/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java b/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
index 0ccb9f6d01..8cb6577bc2 100644
--- a/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
+++ b/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
@@ -23,7 +23,6 @@
 import static org.apache.parquet.filter2.predicate.FilterApi.eq;
 import static org.apache.parquet.hadoop.ParquetFileWriter.Mode.OVERWRITE;
 import static org.apache.parquet.hadoop.metadata.CompressionCodecName.UNCOMPRESSED;
-import static org.apache.parquet.schema.LogicalTypeAnnotation.stringType;
 import static org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName.BINARY;
 import static org.apache.parquet.schema.PrimitiveType.PrimitiveTypeName.INT64;
 import static org.apache.parquet.schema.Types.buildMessage;
@@ -46,6 +45,7 @@
 import org.apache.parquet.hadoop.util.HadoopOutputFile;
 import org.apache.parquet.io.api.Binary;
 import org.apache.parquet.schema.MessageType;
+import org.junit.Assume;
 import org.junit.BeforeClass;
 import org.junit.Rule;
 import org.junit.Test;
@@ -53,9 +53,8 @@
 
 /**
  * This test is to test parquet-mr working with potential int overflows (when the sizes are greater than
- * Integer.MAX_VALUE).
- *
- * TODO: Check if CI environment can handle the memory consumption and time of this test.
+ * Integer.MAX_VALUE). The test requires ~3GB memory so it is likely to fail in the CI environment. Because of that the
+ * OOM errors are caught and the test is skipped to ensure it'll not break our regular testing.
  */
 public class TestLargeColumnChunk {
   private static final MessageType SCHEMA = buildMessage().addFields(
@@ -75,12 +74,11 @@ public class TestLargeColumnChunk {
   private static Path file;
 
   @Rule
-  public TemporaryFolder folder = new TemporaryFolder();
+  public static TemporaryFolder folder = new TemporaryFolder();
 
   @BeforeClass
   public static void createFile() throws IOException {
-// TODO: file = new Path(folder.newFile().getAbsolutePath());
-    file = new Path("/tmp/test.parquet");
+    file = new Path(folder.newFile().getAbsolutePath());
 
     GroupFactory factory = new SimpleGroupFactory(SCHEMA);
     Random random = new Random(RANDOM_SEED);
@@ -104,6 +102,8 @@ public static void createFile() throws IOException {
           VALUE_IN_DATA = data;
         }
       }
+    } catch (OutOfMemoryError e) {
+      Assume.assumeNoException("This test is skipped due to not enough memory", e);
     }
     VALUE_NOT_IN_DATA = nextBinary(random);
   }
@@ -124,6 +124,8 @@ public void validateAllData() throws IOException {
         assertEquals(nextBinary(random), group.getBinary(DATA_INDEX, 0));
       }
       assertNull("No more record should be read", reader.read());
+    } catch (OutOfMemoryError e) {
+      Assume.assumeNoException("This test is skipped due to not enough memory", e);
     }
   }
 
@@ -136,11 +138,15 @@ public void validateFiltering() throws IOException {
       assertEquals(ID_OF_FILTERED_DATA, group.getLong(ID_INDEX, 0));
       assertEquals(VALUE_IN_DATA, group.getBinary(DATA_INDEX, 0));
       assertNull("No more record should be read", reader.read());
+    } catch (OutOfMemoryError e) {
+      Assume.assumeNoException("This test is skipped due to not enough memory", e);
     }
     try (ParquetReader<Group> reader = ParquetReader.builder(new GroupReadSupport(), file)
         .withFilter(FilterCompat.get(eq(binaryColumn("data"), VALUE_NOT_IN_DATA)))
         .build()) {
       assertNull("No record should be read", reader.read());
+    } catch (OutOfMemoryError e) {
+      Assume.assumeNoException("This test is skipped due to not enough memory", e);
     }
   }
 }
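Patch 5 converts OutOfMemoryError into a skipped test via JUnit 4's Assume, so a memory-starved machine reports the test as ignored rather than failed. A minimal, self-contained sketch of the same pattern follows; the class name and the ~2 GB allocation are illustrative stand-ins for writing and reading the large column chunk:

```java
import org.junit.Assume;
import org.junit.Test;

// Illustrative only: shows the skip-on-OOM pattern, not the Parquet test itself.
public class SkipOnOomExample {

  @Test
  public void heavyTest() {
    try {
      // Stand-in for the memory-hungry work; may or may not fit the configured heap.
      byte[] big = new byte[Integer.MAX_VALUE - 8];
      big[0] = 1;
    } catch (OutOfMemoryError e) {
      // assumeNoException throws an AssumptionViolatedException,
      // which JUnit reports as a skipped test instead of a failure.
      Assume.assumeNoException("This test is skipped due to not enough memory", e);
    }
  }
}
```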
From c29b0c8b5a45f6cfc2c04c0b80140cb4b21902e2 Mon Sep 17 00:00:00 2001
From: eadwright
Date: Thu, 10 Jun 2021 10:32:14 +0100
Subject: [PATCH 6/7] Fix merging mistake

---
 .../org/apache/parquet/hadoop/TestLargeColumnChunk.java | 7 ++-----
 1 file changed, 2 insertions(+), 5 deletions(-)

diff --git a/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java b/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
index 8cb6577bc2..a5e95549fa 100644
--- a/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
+++ b/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
@@ -45,10 +45,7 @@
 import org.apache.parquet.hadoop.util.HadoopOutputFile;
 import org.apache.parquet.io.api.Binary;
 import org.apache.parquet.schema.MessageType;
-import org.junit.Assume;
-import org.junit.BeforeClass;
-import org.junit.Rule;
-import org.junit.Test;
+import org.junit.*;
 import org.junit.rules.TemporaryFolder;
 
 /**
@@ -73,7 +70,7 @@ public class TestLargeColumnChunk {
   private static Binary VALUE_NOT_IN_DATA;
   private static Path file;
 
-  @Rule
+  @ClassRule
   public static TemporaryFolder folder = new TemporaryFolder();
 
   @BeforeClass

From 03a2e0ef5fbe557cb49e67d98b2c713de99fcbf3 Mon Sep 17 00:00:00 2001
From: eadwright
Date: Thu, 10 Jun 2021 15:10:37 +0100
Subject: [PATCH 7/7] Ignore test, remove OOM checks

---
 .../parquet/hadoop/TestLargeColumnChunk.java | 15 ++++-----------
 1 file changed, 4 insertions(+), 11 deletions(-)

diff --git a/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java b/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
index a5e95549fa..90015f57e1 100644
--- a/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
+++ b/parquet-hadoop/src/test/java/org/apache/parquet/hadoop/TestLargeColumnChunk.java
@@ -50,9 +50,10 @@
 
 /**
  * This test is to test parquet-mr working with potential int overflows (when the sizes are greater than
- * Integer.MAX_VALUE). The test requires ~3GB memory so it is likely to fail in the CI environment. Because of that the
- * OOM errors are caught and the test is skipped to ensure it'll not break our regular testing.
+ * Integer.MAX_VALUE). The test requires ~3GB memory so it is likely to fail in the CI environment, so these
+ * tests are flagged to be ignored.
  */
+@Ignore
 public class TestLargeColumnChunk {
   private static final MessageType SCHEMA = buildMessage().addFields(
       required(INT64).named("id"),
@@ -60,7 +61,7 @@ public class TestLargeColumnChunk {
       .named("schema");
   private static final int DATA_SIZE = 256;
   // Ensure that the size of the column chunk would overflow an int
-  private static final int ROW_COUNT = Integer.MAX_VALUE / DATA_SIZE + 1;
+  private static final int ROW_COUNT = Integer.MAX_VALUE / DATA_SIZE + 1000;
   private static final long RANDOM_SEED = 42;
   private static final int ID_INDEX = SCHEMA.getFieldIndex("id");
   private static final int DATA_INDEX = SCHEMA.getFieldIndex("data");
@@ -99,8 +100,6 @@ public static void createFile() throws IOException {
           VALUE_IN_DATA = data;
         }
       }
-    } catch (OutOfMemoryError e) {
-      Assume.assumeNoException("This test is skipped due to not enough memory", e);
     }
     VALUE_NOT_IN_DATA = nextBinary(random);
   }
@@ -121,8 +120,6 @@ public void validateAllData() throws IOException {
         assertEquals(nextBinary(random), group.getBinary(DATA_INDEX, 0));
       }
       assertNull("No more record should be read", reader.read());
-    } catch (OutOfMemoryError e) {
-      Assume.assumeNoException("This test is skipped due to not enough memory", e);
     }
   }
 
@@ -135,15 +132,11 @@ public void validateFiltering() throws IOException {
       assertEquals(ID_OF_FILTERED_DATA, group.getLong(ID_INDEX, 0));
       assertEquals(VALUE_IN_DATA, group.getBinary(DATA_INDEX, 0));
       assertNull("No more record should be read", reader.read());
-    } catch (OutOfMemoryError e) {
-      Assume.assumeNoException("This test is skipped due to not enough memory", e);
     }
     try (ParquetReader<Group> reader = ParquetReader.builder(new GroupReadSupport(), file)
         .withFilter(FilterCompat.get(eq(binaryColumn("data"), VALUE_NOT_IN_DATA)))
         .build()) {
       assertNull("No record should be read", reader.read());
     }
   }
 }
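The last two patches rely on two pieces of JUnit 4 wiring: a TemporaryFolder must be a static @ClassRule before a @BeforeClass method may use it, and a class-level @Ignore keeps the expensive suite out of regular CI runs while leaving it runnable by hand. A minimal sketch under those assumptions (the class name, reason string, and file check are illustrative only):

```java
import static org.junit.Assert.assertTrue;

import java.io.File;
import java.io.IOException;

import org.junit.BeforeClass;
import org.junit.ClassRule;
import org.junit.Ignore;
import org.junit.Test;
import org.junit.rules.TemporaryFolder;

// Illustrative only: shows the @ClassRule + @BeforeClass + class-level @Ignore wiring.
@Ignore("Requires ~3GB of heap; run manually when needed")
public class ClassRuleIgnoreExample {

  // @ClassRule (rather than @Rule) is what makes the folder usable from a static context.
  @ClassRule
  public static TemporaryFolder folder = new TemporaryFolder();

  private static File file;

  @BeforeClass
  public static void createFile() throws IOException {
    file = folder.newFile();
  }

  @Test
  public void fileWasCreated() {
    assertTrue(file.exists());
  }
}
```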