apache · dongjoon-hyun · Mar 8, 2022 · Mar 4, 2022 · Mar 7, 2022 · stiga-huang
diff --git a/java/core/src/java/org/apache/orc/impl/SchemaEvolution.java b/java/core/src/java/org/apache/orc/impl/SchemaEvolution.java
@@ -38,6 +38,8 @@
 public class SchemaEvolution {
   // indexed by reader column id
   private final TypeDescription[] readerFileTypes;
+  // key: file column id, value: reader column id (only reader columns that have a file type)
+  private final Map<Integer, Integer> typeIdsMap = new HashMap<>();
   // indexed by reader column id
   private final boolean[] readerIncluded;
   // the offset to the first column id ignoring any ACID columns
@@ -126,6 +128,11 @@ public SchemaEvolution(TypeDescription fileSchema,
       }
     }
     buildConversion(fileSchema, this.readerSchema, positionalLevels);
+    for (int i = 0; i < readerFileTypes.length; i++) {
+      if (readerFileTypes[i] != null) {
+        this.typeIdsMap.put(readerFileTypes[i].getId(), i);
+      }
+    }
     this.positionalColumns = options.getForcePositionalEvolution();
     this.ppdSafeConversion = populatePpdSafeConversion();
   }
@@ -296,13 +303,13 @@ private boolean typesAreImplicitConversion(final TypeDescription fileType,
 
   /**
    * Check if column is safe for ppd evaluation
-   * @param colId reader column id
+   * @param colId file column id
    * @return true if the specified column is safe for ppd evaluation else false
    */
   public boolean isPPDSafeConversion(final int colId) {
     if (hasConversion()) {
-      return !(colId < 0 || colId >= ppdSafeConversion.length) &&
-          ppdSafeConversion[colId];
+      Integer readerTypeId = typeIdsMap.get(colId);
+      return readerTypeId != null && ppdSafeConversion[readerTypeId];
     }
 
     // when there is no schema evolution PPD is safe

diff --git a/java/core/src/test/org/apache/orc/impl/TestSchemaEvolution.java b/java/core/src/test/org/apache/orc/impl/TestSchemaEvolution.java
@@ -853,6 +853,16 @@ public void testSafePpdEvaluation() throws IOException {
     assertTrue(both1.isPPDSafeConversion(2));
     assertTrue(both1.isPPDSafeConversion(3));
     assertFalse(both1.isPPDSafeConversion(4));
+
+    // column pruning: the reader keeps only f2; isPPDSafeConversion is looked up by file column id
+    readerStruct1 = TypeDescription.createStruct()
+        .addField("f2", TypeDescription.createString());
+    both1 = new SchemaEvolution(fileStruct1, readerStruct1, options);
+    assertTrue(both1.hasConversion());
+    assertFalse(both1.isPPDSafeConversion(0));
+    assertFalse(both1.isPPDSafeConversion(1));
+    assertTrue(both1.isPPDSafeConversion(2));
+    assertFalse(both1.isPPDSafeConversion(3));
   }
 
   @Test