From d1af60ed20dfd4eeb3570c9bb562639164080915 Mon Sep 17 00:00:00 2001
From: Wenchen Fan
Date: Sat, 16 Jan 2016 22:19:19 -0800
Subject: [PATCH] speed up hashcode for UTF8String

---
 .../java/org/apache/spark/unsafe/types/UTF8String.java | 7 ++-----
 1 file changed, 2 insertions(+), 5 deletions(-)

diff --git a/unsafe/src/main/java/org/apache/spark/unsafe/types/UTF8String.java b/unsafe/src/main/java/org/apache/spark/unsafe/types/UTF8String.java
index 5b61386808769..87706d0b68388 100644
--- a/unsafe/src/main/java/org/apache/spark/unsafe/types/UTF8String.java
+++ b/unsafe/src/main/java/org/apache/spark/unsafe/types/UTF8String.java
@@ -31,6 +31,7 @@
 
 import org.apache.spark.unsafe.Platform;
 import org.apache.spark.unsafe.array.ByteArrayMethods;
+import org.apache.spark.unsafe.hash.Murmur3_x86_32;
 
 import static org.apache.spark.unsafe.Platform.*;
 
@@ -935,11 +936,7 @@ public int levenshteinDistance(UTF8String other) {
 
   @Override
   public int hashCode() {
-    int result = 1;
-    for (int i = 0; i < numBytes; i ++) {
-      result = 31 * result + getByte(i);
-    }
-    return result;
+    return Murmur3_x86_32.hashUnsafeBytes(base, offset, numBytes, 42);
   }
 
   /**