Skip to content

Commit

Permalink
Update comments for ORC and Parquet extensions
Browse files Browse the repository at this point in the history
  • Loading branch information
HyukjinKwon committed Mar 10, 2016
1 parent 0e9b003 commit 7568744
Show file tree
Hide file tree
Showing 2 changed files with 6 additions and 0 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -379,6 +379,9 @@ private[sql] class ParquetOutputWriter(
val taskAttemptId = context.getTaskAttemptID
val split = taskAttemptId.getTaskID.getId
val bucketString = bucketId.map(BucketingUtils.bucketIdToString).getOrElse("")
// The file name ends with the `.parquet` extension because compression is
// applied to each "page" in the Parquet format rather than to the whole file,
// so (de)compression tools such as gunzip would not be able to decompress it.
new Path(path, f"part-r-$split%05d-$uniqueWriteJobId$bucketString$extension")
}
}
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -165,6 +165,9 @@ private[orc] class OrcOutputWriter(
val name = conf.get(OrcTableProperties.COMPRESSION.getPropName)
OrcRelation.extensionsForCompressionCodecNames.getOrElse(name, "")
}
// The file name ends with the `.orc` extension because compression is
// applied to each "stream" in the ORC format rather than to the whole file,
// so (de)compression tools such as gunzip would not be able to decompress it.
val filename = f"part-r-$partition%05d-$uniqueWriteJobId$bucketString$compressionExtension.orc"

new OrcOutputFormat().getRecordWriter(
Expand Down

0 comments on commit 7568744

Please sign in to comment.