From 17a18cb2d11c918064e94a7b054a2c0b783e2a9f Mon Sep 17 00:00:00 2001 From: Yuhao Yang Date: Sat, 25 Jul 2015 02:59:44 -0400 Subject: [PATCH] add ut for word2vec --- .../org/apache/spark/mllib/feature/Word2VecSuite.scala | 10 ++++++++++ 1 file changed, 10 insertions(+) diff --git a/mllib/src/test/scala/org/apache/spark/mllib/feature/Word2VecSuite.scala b/mllib/src/test/scala/org/apache/spark/mllib/feature/Word2VecSuite.scala index b6818369208d7..77a9f0f872473 100644 --- a/mllib/src/test/scala/org/apache/spark/mllib/feature/Word2VecSuite.scala +++ b/mllib/src/test/scala/org/apache/spark/mllib/feature/Word2VecSuite.scala @@ -39,6 +39,16 @@ class Word2VecSuite extends SparkFunSuite with MLlibTestSparkContext { assert(syms(1)._1 == "c") } + test("Word2Vec throws exception when vocabulary is empty") { + intercept[IllegalArgumentException] { + val sentence = "a b c" + val localDoc = Seq(sentence, sentence) + val doc = sc.parallelize(localDoc) + .map(line => line.split(" ").toSeq) + new Word2Vec().setMinCount(10).fit(doc) + } + } + test("Word2VecModel") { val num = 2 val word2VecMap = Map(