Skip to content

Commit a594382

Browse files
committed
Initial test
1 parent 4ee3721 commit a594382

File tree

2 files changed

+101
-0
lines changed

2 files changed

+101
-0
lines changed
Lines changed: 41 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,41 @@
1+
/*
2+
* Licensed to the Apache Software Foundation (ASF) under one or more
3+
* contributor license agreements. See the NOTICE file distributed with
4+
* this work for additional information regarding copyright ownership.
5+
* The ASF licenses this file to You under the Apache License, Version 2.0
6+
* (the "License"); you may not use this file except in compliance with
7+
* the License. You may obtain a copy of the License at
8+
*
9+
* http://www.apache.org/licenses/LICENSE-2.0
10+
*
11+
* Unless required by applicable law or agreed to in writing, software
12+
* distributed under the License is distributed on an "AS IS" BASIS,
13+
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14+
* See the License for the specific language governing permissions and
15+
* limitations under the License.
16+
*/
17+
18+
package com.sparklingpandas.sparklingml.feature
19+
20+
import org.apache.spark.ml.param._
21+
22+
import org.apache.lucene.analysis.Analyzer
23+
24+
import com.sparklingpandas.sparklingml.param._
25+
26+
// DO NOT MODIFY THIS FILE! It was auto generated by LuceneAnalyzerGenerators
27+
28+
/**
 * Runs the shared [[LuceneTransformerTest]] suite against a freshly
 * constructed [[WhitespaceAnalyzerLucene]].
 */
class WhitespaceAnalyzerLuceneTest
    extends LuceneTransformerTest[WhitespaceAnalyzerLucene] {

  // Instance under test; the inherited suite configures and runs it.
  override val transformer: WhitespaceAnalyzerLucene =
    new WhitespaceAnalyzerLucene()
}
34+
35+
36+
/**
 * Runs the shared [[LuceneStopwordTransformerTest]] suite (and, through it,
 * the base [[LuceneTransformerTest]] suite) against a freshly constructed
 * [[FinnishAnalyzerLucene]].
 */
class FinnishAnalyzerLuceneTest
    extends LuceneStopwordTransformerTest[FinnishAnalyzerLucene] {

  // Instance under test; the inherited suites configure and run it.
  override val transformer: FinnishAnalyzerLucene =
    new FinnishAnalyzerLucene()
}
Lines changed: 60 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,60 @@
1+
/*
2+
* Licensed to the Apache Software Foundation (ASF) under one or more
3+
* contributor license agreements. See the NOTICE file distributed with
4+
* this work for additional information regarding copyright ownership.
5+
* The ASF licenses this file to You under the Apache License, Version 2.0
6+
* (the "License"); you may not use this file except in compliance with
7+
* the License. You may obtain a copy of the License at
8+
*
9+
* http://www.apache.org/licenses/LICENSE-2.0
10+
*
11+
* Unless required by applicable law or agreed to in writing, software
12+
* distributed under the License is distributed on an "AS IS" BASIS,
13+
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14+
* See the License for the specific language governing permissions and
15+
* limitations under the License.
16+
*/
17+
18+
package com.sparklingpandas.sparklingml.feature
19+
20+
import org.apache.spark.ml.param._
21+
22+
import org.apache.lucene.analysis.Analyzer
23+
24+
import org.scalatest.FunSuite
25+
26+
import com.holdenkarau.spark.testing.DataFrameSuiteBase
27+
28+
import com.sparklingpandas.sparklingml.param._
29+
30+
/**
 * Single-column row used as the fixture for the Lucene transformer suites.
 *
 * The field name doubles as the Dataset column name, so it must stay in sync
 * with the `"input"` string the suites pass to `setInputCol`.
 *
 * @param input the raw text to be analyzed
 */
final case class InputData(input: String)
31+
32+
/**
 * Base suite shared by every Lucene transformer test.
 *
 * Concrete suites only supply the `transformer` instance; this class
 * contributes a smoke test that feeds three one-word rows through it and
 * checks that three rows come back.
 *
 * @tparam T the concrete transformer type under test
 */
abstract class LuceneTransformerTest[T <: LuceneTransformer[_]]
    extends FunSuite with DataFrameSuiteBase {

  /** The transformer instance under test, provided by the concrete suite. */
  val transformer: T

  test("verify that the transformer runs") {
    import spark.implicits._
    val rows = List("hi", "boo", "boop").map(InputData(_))
    val dataset = spark.createDataset(rows)
    // "input" is the column name derived from InputData's single field.
    transformer.setInputCol("input")
    val collected = transformer.transform(dataset).collect()
    assert(collected.size === 3)
  }
}
45+
46+
/**
 * Suite for Lucene transformers that additionally mix in [[HasStopwords]].
 *
 * Inherits the smoke test from [[LuceneTransformerTest]] and adds a check
 * that a configured stopword produces an empty token sequence for the row
 * consisting solely of that word.
 *
 * @tparam T the concrete transformer type under test; it must also be a
 *           [[HasStopwords]], which the type bound here does not express, so
 *           it is checked at runtime
 */
abstract class LuceneStopwordTransformerTest[T <: LuceneTransformer[_]] extends
    LuceneTransformerTest[T] {
  test("verify stopword is dropped, nothing else") {
    import spark.implicits._
    val input = spark.createDataset(
      List(InputData("hi"), InputData("boo"), InputData("boop")))
    // Narrow to HasStopwords with a readable failure instead of an unchecked
    // cast that would surface as a bare ClassCastException.
    val thst = transformer match {
      case withStopwords: HasStopwords => withStopwords
      case other =>
        fail(s"${other.getClass.getName} does not mix in HasStopwords")
    }
    thst.setStopwords(Array("boop"))
    // Configure the input column through the generic transformer, exactly as
    // the parent suite does, so this suite works for any stopword-capable
    // transformer rather than only FinnishAnalyzerLucene.
    transformer.setInputCol("input")
    val result = transformer.transform(input).collect()
    assert(result.size === 3)
    // Row 2 is "boop", the configured stopword. Column 0 is `input`, so
    // column 1 is presumably the transformer's output column.
    assert(result(2).getSeq(1).isEmpty)
    // NOTE(review): the "nothing else" half of the test name is not asserted;
    // consider checking that rows 0 and 1 keep their tokens once the
    // analyzers' handling of "hi" and "boo" is confirmed.
  }
}

0 commit comments

Comments
 (0)