From ff9bd8d363b317674e78000a1b7f44f7282ca6de Mon Sep 17 00:00:00 2001 From: Andrew Tang Date: Tue, 27 Jun 2023 23:23:46 -0700 Subject: [PATCH] fix: use native hashing algorithm and fix bug --- .../linkedin/feathr/offline/swa/SlidingWindowFeatureUtils.scala | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/feathr-impl/src/main/scala/com/linkedin/feathr/offline/swa/SlidingWindowFeatureUtils.scala b/feathr-impl/src/main/scala/com/linkedin/feathr/offline/swa/SlidingWindowFeatureUtils.scala index 42b24bcc2..0ca62dbf6 100644 --- a/feathr-impl/src/main/scala/com/linkedin/feathr/offline/swa/SlidingWindowFeatureUtils.scala +++ b/feathr-impl/src/main/scala/com/linkedin/feathr/offline/swa/SlidingWindowFeatureUtils.scala @@ -187,7 +187,7 @@ private[offline] object SlidingWindowFeatureUtils { val rewrittenDef = s"CASE WHEN ${featureDef} IS NOT NULL THEN 1 ELSE 0 END" new CountAggregate(rewrittenDef) case AggregationType.COUNT_DISTINCT => - var rewrittenDef = s"CASE WHEN ${featureDef} IS NOT NULL THEN CAST(CONV(MD5(${featureDef}), 16, 10) AS INT) ELSE 0 END" + val rewrittenDef = s"CASE WHEN ${featureDef} IS NOT NULL THEN hash(${featureDef}) ELSE 0 END" new CountDistinctAggregate(rewrittenDef) case AggregationType.AVG => new AvgAggregate(featureDef) case AggregationType.MAX => new MaxAggregate(featureDef)