Skip to content

Commit 74c7d52

Browse files
mawiesnerzo1
authored and committed
OPENNLP-1631 Convert existing ModelLoader tests to integration tests
- converts the three existing test classes to the "IT" suffix so that they are executed during the failsafe plugin phase
- adds 18 new languages for each model type (sent, pos, tokens)
- fixes the missing language check for "nl" (Dutch) in DownloadParserTest
1 parent 3c8bd72 commit 74c7d52

File tree

4 files changed

+28
-16
lines changed

4 files changed

+28
-16
lines changed

opennlp-tools/src/test/java/opennlp/tools/cmdline/postag/POSModelLoaderTest.java opennlp-tools/src/test/java/opennlp/tools/cmdline/postag/POSModelLoaderIT.java

+8-4
Original file line numberDiff line numberDiff line change
@@ -33,15 +33,16 @@
3333
import opennlp.tools.util.DownloadUtil;
3434

3535
@EnabledWhenCDNAvailable(hostname = "dlcdn.apache.org")
36-
public class POSModelLoaderTest extends AbstractModelLoaderTest {
36+
public class POSModelLoaderIT extends AbstractModelLoaderTest {
3737

3838
// SUT
3939
private POSModelLoader loader;
4040

4141
@BeforeAll
4242
public static void initResources() {
43-
List<String> resources = List.of("en", "de");
44-
resources.forEach(lang -> {
43+
List<String> langs = List.of("en", "fr", "de", "it", "nl", "bg", "cs", "da",
44+
"es", "et", "fi", "hr", "lv", "no", "pl", "pt", "ro", "ru", "sk", "sl", "sr", "sv", "uk");
45+
langs.forEach(lang -> {
4546
try {
4647
DownloadUtil.downloadModel(lang,
4748
DownloadUtil.ModelType.POS, POSModel.class);
@@ -57,7 +58,10 @@ public void setup() {
5758
}
5859

5960
@ParameterizedTest(name = "Verify \"{0}\" POS model loading")
60-
@ValueSource(strings = {"en-ud-ewt", "de-ud-gsd"})
61+
@ValueSource(strings = {"en-ud-ewt", "fr-ud-gsd", "de-ud-gsd", "it-ud-vit", "nl-ud-alpino",
62+
"bg-ud-btb", "cs-ud-pdt", "da-ud-ddt", "es-ud-gsd", "et-ud-edt", "fi-ud-tdt", "hr-ud-set",
63+
"lv-ud-lvtb", "no-ud-bokmaal", "pl-ud-pdb", "pt-ud-gsd", "ro-ud-rrt", "ru-ud-gsd",
64+
"sr-ud-set", "sk-ud-snk", "sl-ud-ssj", "sv-ud-talbanken", "uk-ud-iu"})
6165
public void testLoadModelByLanguage(String langModel) throws IOException {
6266
String modelName = "opennlp-" + langModel + "-pos-1.1-2.4.0.bin";
6367
POSModel model = loader.loadModel(Files.newInputStream(OPENNLP_DIR.resolve(modelName)));

opennlp-tools/src/test/java/opennlp/tools/cmdline/sentdetect/SentenceModelLoaderTest.java opennlp-tools/src/test/java/opennlp/tools/cmdline/sentdetect/SentenceModelLoaderIT.java

+8-4
Original file line numberDiff line numberDiff line change
@@ -33,15 +33,16 @@
3333
import opennlp.tools.util.DownloadUtil;
3434

3535
@EnabledWhenCDNAvailable(hostname = "dlcdn.apache.org")
36-
public class SentenceModelLoaderTest extends AbstractModelLoaderTest {
36+
public class SentenceModelLoaderIT extends AbstractModelLoaderTest {
3737

3838
// SUT
3939
private SentenceModelLoader loader;
4040

4141
@BeforeAll
4242
public static void initResources() {
43-
List<String> resources = List.of("en", "de");
44-
resources.forEach(lang -> {
43+
List<String> langs = List.of("en", "fr", "de", "it", "nl", "bg", "cs", "da",
44+
"es", "et", "fi", "hr", "lv", "no", "pl", "pt", "ro", "ru", "sk", "sl", "sr", "sv", "uk");
45+
langs.forEach(lang -> {
4546
try {
4647
DownloadUtil.downloadModel(lang,
4748
DownloadUtil.ModelType.SENTENCE_DETECTOR, SentenceModel.class);
@@ -57,7 +58,10 @@ public void setup() {
5758
}
5859

5960
@ParameterizedTest(name = "Verify \"{0}\" sentence model loading")
60-
@ValueSource(strings = {"en-ud-ewt", "de-ud-gsd"})
61+
@ValueSource(strings = {"en-ud-ewt", "fr-ud-gsd", "de-ud-gsd", "it-ud-vit", "nl-ud-alpino",
62+
"bg-ud-btb", "cs-ud-pdt", "da-ud-ddt", "es-ud-gsd", "et-ud-edt", "fi-ud-tdt", "hr-ud-set",
63+
"lv-ud-lvtb", "no-ud-bokmaal", "pl-ud-pdb", "pt-ud-gsd", "ro-ud-rrt", "ru-ud-gsd",
64+
"sr-ud-set", "sk-ud-snk", "sl-ud-ssj", "sv-ud-talbanken", "uk-ud-iu"})
6165
public void testLoadModelByLanguage(String langModel) throws IOException {
6266
String modelName = "opennlp-" + langModel + "-sentence-1.1-2.4.0.bin";
6367
SentenceModel model = loader.loadModel(Files.newInputStream(OPENNLP_DIR.resolve(modelName)));

opennlp-tools/src/test/java/opennlp/tools/cmdline/tokenizer/TokenizerModelLoaderTest.java opennlp-tools/src/test/java/opennlp/tools/cmdline/tokenizer/TokenizerModelLoaderIT.java

+8-4
Original file line numberDiff line numberDiff line change
@@ -33,15 +33,16 @@
3333
import opennlp.tools.util.DownloadUtil;
3434

3535
@EnabledWhenCDNAvailable(hostname = "dlcdn.apache.org")
36-
public class TokenizerModelLoaderTest extends AbstractModelLoaderTest {
36+
public class TokenizerModelLoaderIT extends AbstractModelLoaderTest {
3737

3838
// SUT
3939
private TokenizerModelLoader loader;
4040

4141
@BeforeAll
4242
public static void initResources() {
43-
List<String> resources = List.of("en", "de");
44-
resources.forEach(lang -> {
43+
List<String> langs = List.of("en", "fr", "de", "it", "nl", "bg", "cs", "da",
44+
"es", "et", "fi", "hr", "lv", "no", "pl", "pt", "ro", "ru", "sk", "sl", "sr", "sv", "uk");
45+
langs.forEach(lang -> {
4546
try {
4647
DownloadUtil.downloadModel(lang,
4748
DownloadUtil.ModelType.TOKENIZER, TokenizerModel.class);
@@ -57,7 +58,10 @@ public void setup() {
5758
}
5859

5960
@ParameterizedTest(name = "Verify \"{0}\" tokenizer model loading")
60-
@ValueSource(strings = {"en-ud-ewt", "de-ud-gsd"})
61+
@ValueSource(strings = {"en-ud-ewt", "fr-ud-gsd", "de-ud-gsd", "it-ud-vit", "nl-ud-alpino",
62+
"bg-ud-btb", "cs-ud-pdt", "da-ud-ddt", "es-ud-gsd", "et-ud-edt", "fi-ud-tdt", "hr-ud-set",
63+
"lv-ud-lvtb", "no-ud-bokmaal", "pl-ud-pdb", "pt-ud-gsd", "ro-ud-rrt", "ru-ud-gsd",
64+
"sr-ud-set", "sk-ud-snk", "sl-ud-ssj", "sv-ud-talbanken", "uk-ud-iu"})
6165
public void testLoadModelByLanguage(String langModel) throws IOException {
6266
String modelName = "opennlp-" + langModel + "-tokens-1.1-2.4.0.bin";
6367
TokenizerModel model = loader.loadModel(Files.newInputStream(OPENNLP_DIR.resolve(modelName)));

opennlp-tools/src/test/java/opennlp/tools/util/DownloadParserTest.java

+4-4
Original file line numberDiff line numberDiff line change
@@ -105,6 +105,10 @@ public static Stream<Arguments> expectedModels() {
105105
DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "it-ud-vit-" + MODEL_SENT + VER + BIN,
106106
DownloadUtil.ModelType.TOKENIZER, OPENNLP + "it-ud-vit-" + MODEL_TOK + VER + BIN,
107107
DownloadUtil.ModelType.POS, OPENNLP + "it-ud-vit-" + MODEL_POS + VER + BIN)),
108+
Arguments.of("nl", Map.of(
109+
DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "nl-ud-alpino-" + MODEL_SENT + VER + BIN,
110+
DownloadUtil.ModelType.TOKENIZER, OPENNLP + "nl-ud-alpino-" + MODEL_TOK + VER + BIN,
111+
DownloadUtil.ModelType.POS, OPENNLP + "nl-ud-alpino-" + MODEL_POS + VER + BIN)),
108112
Arguments.of("bg", Map.of(
109113
DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "bg-ud-btb-" + MODEL_SENT + VER + BIN,
110114
DownloadUtil.ModelType.TOKENIZER, OPENNLP + "bg-ud-btb-" + MODEL_TOK + VER + BIN,
@@ -137,10 +141,6 @@ public static Stream<Arguments> expectedModels() {
137141
DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "lv-ud-lvtb-" + MODEL_SENT + VER + BIN,
138142
DownloadUtil.ModelType.TOKENIZER, OPENNLP + "lv-ud-lvtb-" + MODEL_TOK + VER + BIN,
139143
DownloadUtil.ModelType.POS, OPENNLP + "lv-ud-lvtb-" + MODEL_POS + VER + BIN)),
140-
Arguments.of("lv", Map.of(
141-
DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "lv-ud-lvtb-" + MODEL_SENT + VER + BIN,
142-
DownloadUtil.ModelType.TOKENIZER, OPENNLP + "lv-ud-lvtb-" + MODEL_TOK + VER + BIN,
143-
DownloadUtil.ModelType.POS, OPENNLP + "lv-ud-lvtb-" + MODEL_POS + VER + BIN)),
144144
Arguments.of("no", Map.of(
145145
DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "no-ud-bokmaal-" + MODEL_SENT + VER + BIN,
146146
DownloadUtil.ModelType.TOKENIZER, OPENNLP + "no-ud-bokmaal-" + MODEL_TOK + VER + BIN,

0 commit comments

Comments
 (0)