From f4d8316ea633cfe438fe69105bee7520362da8c6 Mon Sep 17 00:00:00 2001 From: Martin Wiesner Date: Mon, 28 Oct 2024 16:17:53 +0100 Subject: [PATCH] OPENNLP-1629 Update DownloadUtil to support more languages via new UD models - updates opennlp-models dependency to 1.1 - adapts DownloadUtil to work with ud-models-1.1 release, adding 18 new supported languages - adapts JUnit tests accordingly to include the new model files - replaces content of 'index.html' copy of the released model list (v 1.1.0) for DownloadParserTest --- .../java/opennlp/tools/util/DownloadUtil.java | 56 ++- .../cmdline/postag/POSModelLoaderTest.java | 2 +- .../sentdetect/SentenceModelLoaderTest.java | 2 +- .../tokenizer/TokenizerModelLoaderTest.java | 2 +- .../tools/util/DownloadParserTest.java | 126 ++++-- .../opennlp/tools/util/DownloadUtilTest.java | 43 +- .../resources/opennlp/tools/util/index.html | 366 ++++++++++++++---- pom.xml | 2 +- 8 files changed, 471 insertions(+), 128 deletions(-) diff --git a/opennlp-tools/src/main/java/opennlp/tools/util/DownloadUtil.java b/opennlp-tools/src/main/java/opennlp/tools/util/DownloadUtil.java index b0f979e54..986801bd5 100644 --- a/opennlp-tools/src/main/java/opennlp/tools/util/DownloadUtil.java +++ b/opennlp-tools/src/main/java/opennlp/tools/util/DownloadUtil.java @@ -72,13 +72,13 @@ public enum ModelType { } private static final String BASE_URL = "https://dlcdn.apache.org/opennlp/"; - private static final String MODELS_UD_MODELS_1_0 = "models/ud-models-1.0/"; + private static final String MODELS_UD_MODELS_1_1 = "models/ud-models-1.1/"; public static final Map> available_models; static { try { - available_models = new DownloadParser(new URL(BASE_URL + MODELS_UD_MODELS_1_0)).getAvailableModels(); + available_models = new DownloadParser(new URL(BASE_URL + MODELS_UD_MODELS_1_1)).getAvailableModels(); } catch (MalformedURLException e) { throw new RuntimeException(e); } @@ -214,7 +214,6 @@ static class DownloadParser { } Map> getAvailableModels() { - final 
Matcher matcher = LINK_PATTERN.matcher(fetchPageIndex()); final List links = new ArrayList<>(); @@ -226,27 +225,58 @@ Map> getAvailableModels() { } private Map> toMap(List links) { - final Map> result = new HashMap<>(); - for (String link : links) { - if (link.endsWith(".bin")) { - if (link.contains("de-ud")) { + if (link.contains("de-ud")) { // German addModel("de", link, result); - } else if (link.contains("en-ud")) { + } else if (link.contains("en-ud")) { // English addModel("en", link, result); - } else if (link.contains("it-ud")) { + } else if (link.contains("it-ud")) { // Italian addModel("it", link, result); - } else if (link.contains("nl-ud")) { + } else if (link.contains("nl-ud")) { // Dutch addModel("nl", link, result); - } else if (link.contains("fr-ud")) { + } else if (link.contains("fr-ud")) { // French addModel("fr", link, result); + } else if (link.contains("bg-ud")) { // Bulgarian + addModel("bg", link, result); + } else if (link.contains("cs-ud")) { // Czech + addModel("cs", link, result); + } else if (link.contains("hr-ud")) { // Croatian + addModel("hr", link, result); + } else if (link.contains("da-ud")) { // Danish + addModel("da", link, result); + } else if (link.contains("es-ud")) { // Spanish + addModel("es", link, result); + } else if (link.contains("et-ud")) { // Estonian + addModel("et", link, result); + } else if (link.contains("fi-ud")) { // Finnish + addModel("fi", link, result); + } else if (link.contains("lv-ud")) { // Latvian + addModel("lv", link, result); + } else if (link.contains("no-ud")) { // Norwegian + addModel("no", link, result); + } else if (link.contains("pl-ud")) { // Polish + addModel("pl", link, result); + } else if (link.contains("pt-ud")) { // Portuguese + addModel("pt", link, result); + } else if (link.contains("ro-ud")) { // Romanian + addModel("ro", link, result); + } else if (link.contains("ru-ud")) { // Russian + addModel("ru", link, result); + } else if (link.contains("sr-ud")) { // Serbian + addModel("sr", 
link, result); + } else if (link.contains("sk-ud")) { // Slovak + addModel("sk", link, result); + } else if (link.contains("sl-ud")) { // Slovenian + addModel("sl", link, result); + } else if (link.contains("sv-ud")) { // Swedish + addModel("sv", link, result); + } else if (link.contains("uk-ud")) { // Ukrainian + addModel("uk", link, result); } } - } - return result; } diff --git a/opennlp-tools/src/test/java/opennlp/tools/cmdline/postag/POSModelLoaderTest.java b/opennlp-tools/src/test/java/opennlp/tools/cmdline/postag/POSModelLoaderTest.java index 473b00d52..9c1f65a52 100644 --- a/opennlp-tools/src/test/java/opennlp/tools/cmdline/postag/POSModelLoaderTest.java +++ b/opennlp-tools/src/test/java/opennlp/tools/cmdline/postag/POSModelLoaderTest.java @@ -59,7 +59,7 @@ public void setup() { @ParameterizedTest(name = "Verify \"{0}\" POS model loading") @ValueSource(strings = {"en-ud-ewt", "de-ud-gsd"}) public void testLoadModelByLanguage(String langModel) throws IOException { - String modelName = "opennlp-" + langModel + "-pos-1.0-1.9.3.bin"; + String modelName = "opennlp-" + langModel + "-pos-1.1-2.4.0.bin"; POSModel model = loader.loadModel(Files.newInputStream(OPENNLP_DIR.resolve(modelName))); Assertions.assertNotNull(model); Assertions.assertTrue(model.isLoadedFromSerialized()); diff --git a/opennlp-tools/src/test/java/opennlp/tools/cmdline/sentdetect/SentenceModelLoaderTest.java b/opennlp-tools/src/test/java/opennlp/tools/cmdline/sentdetect/SentenceModelLoaderTest.java index 632557b9a..b7d3b48a0 100644 --- a/opennlp-tools/src/test/java/opennlp/tools/cmdline/sentdetect/SentenceModelLoaderTest.java +++ b/opennlp-tools/src/test/java/opennlp/tools/cmdline/sentdetect/SentenceModelLoaderTest.java @@ -59,7 +59,7 @@ public void setup() { @ParameterizedTest(name = "Verify \"{0}\" sentence model loading") @ValueSource(strings = {"en-ud-ewt", "de-ud-gsd"}) public void testLoadModelByLanguage(String langModel) throws IOException { - String modelName = "opennlp-" + langModel + 
"-sentence-1.0-1.9.3.bin"; + String modelName = "opennlp-" + langModel + "-sentence-1.1-2.4.0.bin"; SentenceModel model = loader.loadModel(Files.newInputStream(OPENNLP_DIR.resolve(modelName))); Assertions.assertNotNull(model); Assertions.assertTrue(model.isLoadedFromSerialized()); diff --git a/opennlp-tools/src/test/java/opennlp/tools/cmdline/tokenizer/TokenizerModelLoaderTest.java b/opennlp-tools/src/test/java/opennlp/tools/cmdline/tokenizer/TokenizerModelLoaderTest.java index 118311bf5..c678071d1 100644 --- a/opennlp-tools/src/test/java/opennlp/tools/cmdline/tokenizer/TokenizerModelLoaderTest.java +++ b/opennlp-tools/src/test/java/opennlp/tools/cmdline/tokenizer/TokenizerModelLoaderTest.java @@ -59,7 +59,7 @@ public void setup() { @ParameterizedTest(name = "Verify \"{0}\" tokenizer model loading") @ValueSource(strings = {"en-ud-ewt", "de-ud-gsd"}) public void testLoadModelByLanguage(String langModel) throws IOException { - String modelName = "opennlp-" + langModel + "-tokens-1.0-1.9.3.bin"; + String modelName = "opennlp-" + langModel + "-tokens-1.1-2.4.0.bin"; TokenizerModel model = loader.loadModel(Files.newInputStream(OPENNLP_DIR.resolve(modelName))); Assertions.assertNotNull(model); Assertions.assertTrue(model.isLoadedFromSerialized()); diff --git a/opennlp-tools/src/test/java/opennlp/tools/util/DownloadParserTest.java b/opennlp-tools/src/test/java/opennlp/tools/util/DownloadParserTest.java index c867f8de5..cfcb0219e 100644 --- a/opennlp-tools/src/test/java/opennlp/tools/util/DownloadParserTest.java +++ b/opennlp-tools/src/test/java/opennlp/tools/util/DownloadParserTest.java @@ -45,7 +45,7 @@ void testAvailableModels(String language, Map ex Map> result = downloadParser.getAvailableModels(); assertNotNull(result); - assertEquals(5, result.size()); + assertEquals(23, result.size()); final Map availableModels = result.get(language); assertNotNull(availableModels); @@ -78,35 +78,109 @@ private URL fromClasspath(String file) { return 
Thread.currentThread().getContextClassLoader().getResource(file); } + private static final String OPENNLP = "opennlp-"; + private static final String MODEL_SENT = "sentence-"; + private static final String MODEL_TOK = "tokens-"; + private static final String MODEL_POS = "pos-"; + private static final String VER = "1.1-2.4.0"; + private static final String BIN = ".bin"; + // Note: This needs to be public as JUnit 5 requires it like this. public static Stream expectedModels() { // Data as defined in "test/resources/opennlp/tools/util/index.html" return Stream.of( - Arguments.of("en", - Map.of( - DownloadUtil.ModelType.SENTENCE_DETECTOR, "opennlp-en-ud-ewt-sentence-1.0-1.9.3.bin", - DownloadUtil.ModelType.TOKENIZER, "opennlp-en-ud-ewt-tokens-1.0-1.9.3.bin", - DownloadUtil.ModelType.POS, "opennlp-en-ud-ewt-pos-1.0-1.9.3.bin")), - Arguments.of("fr", - Map.of( - DownloadUtil.ModelType.SENTENCE_DETECTOR, "opennlp-1.0-1.9.3fr-ud-ftb-sentence-1.0-1.9.3.bin", - DownloadUtil.ModelType.TOKENIZER, "opennlp-fr-ud-ftb-tokens-1.0-1.9.3.bin", - DownloadUtil.ModelType.POS, "opennlp-fr-ud-ftb-pos-1.0-1.9.3.bin")), - Arguments.of("de", - Map.of( - DownloadUtil.ModelType.SENTENCE_DETECTOR, "opennlp-de-ud-gsd-sentence-1.0-1.9.3.bin", - DownloadUtil.ModelType.TOKENIZER, "opennlp-de-ud-gsd-tokens-1.0-1.9.3.bin", - DownloadUtil.ModelType.POS, "opennlp-de-ud-gsd-pos-1.0-1.9.3.bin")), - Arguments.of("it", - Map.of( - DownloadUtil.ModelType.SENTENCE_DETECTOR, "opennlp-it-ud-vit-sentence-1.0-1.9.3.bin", - DownloadUtil.ModelType.TOKENIZER, "opennlp-it-ud-vit-tokens-1.0-1.9.3.bin", - DownloadUtil.ModelType.POS, "opennlp-it-ud-vit-pos-1.0-1.9.3.bin")), - Arguments.of("nl", - Map.of( - DownloadUtil.ModelType.SENTENCE_DETECTOR, "opennlp-nl-ud-alpino-sentence-1.0-1.9.3.bin", - DownloadUtil.ModelType.TOKENIZER, "opennlp-nl-ud-alpino-tokens-1.0-1.9.3.bin", - DownloadUtil.ModelType.POS, "opennlp-nl-ud-alpino-pos-1.0-1.9.3.bin")) + Arguments.of("en",Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, 
OPENNLP + "en-ud-ewt-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "en-ud-ewt-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "en-ud-ewt-" + MODEL_POS + VER + BIN)), + Arguments.of("fr", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "fr-ud-gsd-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "fr-ud-gsd-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "fr-ud-gsd-" + MODEL_POS + VER + BIN)), + Arguments.of("de", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "de-ud-gsd-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "de-ud-gsd-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "de-ud-gsd-" + MODEL_POS + VER + BIN)), + Arguments.of("it", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "it-ud-vit-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "it-ud-vit-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "it-ud-vit-" + MODEL_POS + VER + BIN)), + Arguments.of("bg", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "bg-ud-btb-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "bg-ud-btb-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "bg-ud-btb-" + MODEL_POS + VER + BIN)), + Arguments.of("cs", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "cs-ud-pdt-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "cs-ud-pdt-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "cs-ud-pdt-" + MODEL_POS + VER + BIN)), + Arguments.of("da", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "da-ud-ddt-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "da-ud-ddt-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "da-ud-ddt-" + MODEL_POS + VER + BIN)), + Arguments.of("es", Map.of( + 
DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "es-ud-gsd-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "es-ud-gsd-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "es-ud-gsd-" + MODEL_POS + VER + BIN)), + Arguments.of("et", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "et-ud-edt-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "et-ud-edt-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "et-ud-edt-" + MODEL_POS + VER + BIN)), + Arguments.of("fi", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "fi-ud-tdt-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "fi-ud-tdt-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "fi-ud-tdt-" + MODEL_POS + VER + BIN)), + Arguments.of("hr", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "hr-ud-set-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "hr-ud-set-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "hr-ud-set-" + MODEL_POS + VER + BIN)), + Arguments.of("lv", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "lv-ud-lvtb-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "lv-ud-lvtb-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "lv-ud-lvtb-" + MODEL_POS + VER + BIN)), + Arguments.of("nl", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "nl-ud-alpino-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "nl-ud-alpino-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "nl-ud-alpino-" + MODEL_POS + VER + BIN)), + Arguments.of("no", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "no-ud-bokmaal-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "no-ud-bokmaal-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "no-ud-bokmaal-" + MODEL_POS + VER + BIN)), +
Arguments.of("pl", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "pl-ud-pdb-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "pl-ud-pdb-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "pl-ud-pdb-" + MODEL_POS + VER + BIN)), + Arguments.of("pt", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "pt-ud-gsd-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "pt-ud-gsd-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "pt-ud-gsd-" + MODEL_POS + VER + BIN)), + Arguments.of("ro", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "ro-ud-rrt-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "ro-ud-rrt-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "ro-ud-rrt-" + MODEL_POS + VER + BIN)), + Arguments.of("ru", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "ru-ud-gsd-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "ru-ud-gsd-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "ru-ud-gsd-" + MODEL_POS + VER + BIN)), + Arguments.of("sr", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "sr-ud-set-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "sr-ud-set-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "sr-ud-set-" + MODEL_POS + VER + BIN)), + Arguments.of("sk", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "sk-ud-snk-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "sk-ud-snk-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "sk-ud-snk-" + MODEL_POS + VER + BIN)), + Arguments.of("sl", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "sl-ud-ssj-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "sl-ud-ssj-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "sl-ud-ssj-" + MODEL_POS + VER + BIN)), 
+ Arguments.of("sv", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "sv-ud-talbanken-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "sv-ud-talbanken-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "sv-ud-talbanken-" + MODEL_POS + VER + BIN)), + Arguments.of("uk", Map.of( + DownloadUtil.ModelType.SENTENCE_DETECTOR, OPENNLP + "uk-ud-iu-" + MODEL_SENT + VER + BIN, + DownloadUtil.ModelType.TOKENIZER, OPENNLP + "uk-ud-iu-" + MODEL_TOK + VER + BIN, + DownloadUtil.ModelType.POS, OPENNLP + "uk-ud-iu-" + MODEL_POS + VER + BIN)) ); } } diff --git a/opennlp-tools/src/test/java/opennlp/tools/util/DownloadUtilTest.java b/opennlp-tools/src/test/java/opennlp/tools/util/DownloadUtilTest.java index 1de5558bd..0afbd3067 100644 --- a/opennlp-tools/src/test/java/opennlp/tools/util/DownloadUtilTest.java +++ b/opennlp-tools/src/test/java/opennlp/tools/util/DownloadUtilTest.java @@ -27,7 +27,6 @@ import java.nio.file.Path; import java.util.stream.Stream; -import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.params.ParameterizedTest; import org.junit.jupiter.params.provider.Arguments; @@ -39,6 +38,10 @@ import opennlp.tools.sentdetect.SentenceModel; import opennlp.tools.tokenize.TokenizerModel; +import static org.junit.jupiter.api.Assertions.assertEquals; +import static org.junit.jupiter.api.Assertions.assertNotNull; +import static org.junit.jupiter.api.Assertions.assertThrows; +import static org.junit.jupiter.api.Assertions.assertTrue; import static org.junit.jupiter.api.Assertions.fail; public class DownloadUtilTest { @@ -83,14 +86,16 @@ private static void wipeExistingModelFiles(final String fragment) { } @ParameterizedTest(name = "Verify \"{0}\" sentence model") - @ValueSource(strings = {"en", "fr", "de", "it", "nl"}) + @ValueSource(strings = {"en", "fr", "de", "it", "nl", "bg", "cs", "da", "es", "et", + "fi", "hr", "lv", "no", "pl", "pt", "ro", "ru", "sk", "sl", + "sr", 
"sv", "uk"}) @EnabledWhenCDNAvailable(hostname = "dlcdn.apache.org") public void testDownloadModelByLanguage(String lang) throws IOException { SentenceModel model = DownloadUtil.downloadModel(lang, DownloadUtil.ModelType.SENTENCE_DETECTOR, SentenceModel.class); - Assertions.assertNotNull(model); - Assertions.assertEquals(lang, model.getLanguage()); - Assertions.assertTrue(model.isLoadedFromSerialized()); + assertNotNull(model); + assertEquals(lang, model.getLanguage()); + assertTrue(model.isLoadedFromSerialized()); } @ParameterizedTest(name = "Verify \"{0}\" tokenizer model") @@ -98,16 +103,16 @@ public void testDownloadModelByLanguage(String lang) throws IOException { @EnabledWhenCDNAvailable(hostname = "dlcdn.apache.org") public void testDownloadModelByURL(String language, URL url) throws IOException { TokenizerModel model = DownloadUtil.downloadModel(url, TokenizerModel.class); - Assertions.assertNotNull(model); - Assertions.assertEquals(language, model.getLanguage()); - Assertions.assertTrue(model.isLoadedFromSerialized()); + assertNotNull(model); + assertEquals(language, model.getLanguage()); + assertTrue(model.isLoadedFromSerialized()); } @ParameterizedTest(name = "Detect invalid input: \"{0}\"") @NullAndEmptySource @ValueSource(strings = {" ", "\t", "\n"}) public void testDownloadModelInvalid(String input) { - Assertions.assertThrows(IOException.class, () -> DownloadUtil.downloadModel( + assertThrows(IOException.class, () -> DownloadUtil.downloadModel( input, DownloadUtil.ModelType.SENTENCE_DETECTOR, SentenceModel.class), "Invalid model"); } @@ -121,7 +126,25 @@ public static Stream provideURLs() { Arguments.of("fr", DownloadUtil.available_models.get("fr").get(MT_TOKENIZER)), Arguments.of("de", DownloadUtil.available_models.get("de").get(MT_TOKENIZER)), Arguments.of("it", DownloadUtil.available_models.get("it").get(MT_TOKENIZER)), - Arguments.of("nl", DownloadUtil.available_models.get("nl").get(MT_TOKENIZER)) + Arguments.of("nl", 
DownloadUtil.available_models.get("nl").get(MT_TOKENIZER)), + Arguments.of("bg", DownloadUtil.available_models.get("bg").get(MT_TOKENIZER)), + Arguments.of("cs", DownloadUtil.available_models.get("cs").get(MT_TOKENIZER)), + Arguments.of("da", DownloadUtil.available_models.get("da").get(MT_TOKENIZER)), + Arguments.of("es", DownloadUtil.available_models.get("es").get(MT_TOKENIZER)), + Arguments.of("et", DownloadUtil.available_models.get("et").get(MT_TOKENIZER)), + Arguments.of("fi", DownloadUtil.available_models.get("fi").get(MT_TOKENIZER)), + Arguments.of("hr", DownloadUtil.available_models.get("hr").get(MT_TOKENIZER)), + Arguments.of("lv", DownloadUtil.available_models.get("lv").get(MT_TOKENIZER)), + Arguments.of("no", DownloadUtil.available_models.get("no").get(MT_TOKENIZER)), + Arguments.of("pl", DownloadUtil.available_models.get("pl").get(MT_TOKENIZER)), + Arguments.of("pt", DownloadUtil.available_models.get("pt").get(MT_TOKENIZER)), + Arguments.of("ro", DownloadUtil.available_models.get("ro").get(MT_TOKENIZER)), + Arguments.of("ru", DownloadUtil.available_models.get("ru").get(MT_TOKENIZER)), + Arguments.of("sk", DownloadUtil.available_models.get("sk").get(MT_TOKENIZER)), + Arguments.of("sl", DownloadUtil.available_models.get("sl").get(MT_TOKENIZER)), + Arguments.of("sr", DownloadUtil.available_models.get("sr").get(MT_TOKENIZER)), + Arguments.of("sv", DownloadUtil.available_models.get("sv").get(MT_TOKENIZER)), + Arguments.of("uk", DownloadUtil.available_models.get("uk").get(MT_TOKENIZER)) ); } } diff --git a/opennlp-tools/src/test/resources/opennlp/tools/util/index.html b/opennlp-tools/src/test/resources/opennlp/tools/util/index.html index fd77cfd66..57c688ed9 100644 --- a/opennlp-tools/src/test/resources/opennlp/tools/util/index.html +++ b/opennlp-tools/src/test/resources/opennlp/tools/util/index.html @@ -17,83 +17,299 @@ under the License. --> - - Index of /opennlp/models/ud-models-1.0 - - -

Index of /opennlp/models/ud-models-1.0

-
Icon  Name                                                     Last modified      Size  Description
[PARENTDIR] Parent Directory - -[   ] CHANGES 2021-05-29 13:55 581 -[   ] LICENSE 2021-05-29 13:55 13K -[   ] NOTICE 2021-05-29 13:55 376 -[   ] opennlp-1.0-1.9.3fr-ud-ftb-sentence-1.0-1.9.3.bin 2021-05-29 13:55 846 -[TXT] opennlp-1.0-1.9.3fr-ud-ftb-sentence-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-1.0-1.9.3fr-ud-ftb-sentence-1.0-1.9.3.bin.sha256 2021-05-29 13:55 118 -[TXT] opennlp-1.0-1.9.3fr-ud-ftb-sentence-1.0-1.9.3.bin.sha512 2021-05-29 13:55 182 -[   ] opennlp-de-ud-gsd-pos-1.0-1.9.3.bin 2021-05-29 13:55 1.2M -[TXT] opennlp-de-ud-gsd-pos-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-de-ud-gsd-pos-1.0-1.9.3.bin.sha256 2021-05-29 13:55 104 -[TXT] opennlp-de-ud-gsd-pos-1.0-1.9.3.bin.sha512 2021-05-29 13:55 168 -[   ] opennlp-de-ud-gsd-sentence-1.0-1.9.3.bin 2021-05-29 13:55 15K -[TXT] opennlp-de-ud-gsd-sentence-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-de-ud-gsd-sentence-1.0-1.9.3.bin.sha256 2021-05-29 13:55 109 -[TXT] opennlp-de-ud-gsd-sentence-1.0-1.9.3.bin.sha512 2021-05-29 13:55 173 -[   ] opennlp-de-ud-gsd-tokens-1.0-1.9.3.bin 2021-05-29 13:55 553K -[TXT] opennlp-de-ud-gsd-tokens-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-de-ud-gsd-tokens-1.0-1.9.3.bin.sha256 2021-05-29 13:55 107 -[TXT] opennlp-de-ud-gsd-tokens-1.0-1.9.3.bin.sha512 2021-05-29 13:55 171 -[   ] opennlp-en-ud-ewt-pos-1.0-1.9.3.bin 2021-05-29 13:55 1.1M -[TXT] opennlp-en-ud-ewt-pos-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-en-ud-ewt-pos-1.0-1.9.3.bin.sha256 2021-05-29 13:55 104 -[TXT] opennlp-en-ud-ewt-pos-1.0-1.9.3.bin.sha512 2021-05-29 13:55 168 -[   ] opennlp-en-ud-ewt-sentence-1.0-1.9.3.bin 2021-05-29 13:55 20K -[TXT] opennlp-en-ud-ewt-sentence-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-en-ud-ewt-sentence-1.0-1.9.3.bin.sha256 2021-05-29 13:55 109 -[TXT] opennlp-en-ud-ewt-sentence-1.0-1.9.3.bin.sha512 2021-05-29 13:55 173 -[   ] opennlp-en-ud-ewt-tokens-1.0-1.9.3.bin 2021-05-29 13:55 338K -[TXT] 
opennlp-en-ud-ewt-tokens-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-en-ud-ewt-tokens-1.0-1.9.3.bin.sha256 2021-05-29 13:55 107 -[TXT] opennlp-en-ud-ewt-tokens-1.0-1.9.3.bin.sha512 2021-05-29 13:55 171 -[   ] opennlp-fr-ud-ftb-pos-1.0-1.9.3.bin 2021-05-29 13:55 72K -[TXT] opennlp-fr-ud-ftb-pos-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-fr-ud-ftb-pos-1.0-1.9.3.bin.sha256 2021-05-29 13:55 104 -[TXT] opennlp-fr-ud-ftb-pos-1.0-1.9.3.bin.sha512 2021-05-29 13:55 168 -[   ] opennlp-fr-ud-ftb-tokens-1.0-1.9.3.bin 2021-05-29 13:55 35K -[TXT] opennlp-fr-ud-ftb-tokens-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-fr-ud-ftb-tokens-1.0-1.9.3.bin.sha256 2021-05-29 13:55 107 -[TXT] opennlp-fr-ud-ftb-tokens-1.0-1.9.3.bin.sha512 2021-05-29 13:55 171 -[   ] opennlp-it-ud-vit-pos-1.0-1.9.3.bin 2021-05-29 13:55 1.1M -[TXT] opennlp-it-ud-vit-pos-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-it-ud-vit-pos-1.0-1.9.3.bin.sha256 2021-05-29 13:55 104 -[TXT] opennlp-it-ud-vit-pos-1.0-1.9.3.bin.sha512 2021-05-29 13:55 168 -[   ] opennlp-it-ud-vit-sentence-1.0-1.9.3.bin 2021-05-29 13:55 9.4K -[TXT] opennlp-it-ud-vit-sentence-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-it-ud-vit-sentence-1.0-1.9.3.bin.sha256 2021-05-29 13:55 109 -[TXT] opennlp-it-ud-vit-sentence-1.0-1.9.3.bin.sha512 2021-05-29 13:55 173 -[   ] opennlp-it-ud-vit-tokens-1.0-1.9.3.bin 2021-05-29 13:55 387K -[TXT] opennlp-it-ud-vit-tokens-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-it-ud-vit-tokens-1.0-1.9.3.bin.sha256 2021-05-29 13:55 107 -[TXT] opennlp-it-ud-vit-tokens-1.0-1.9.3.bin.sha512 2021-05-29 13:55 171 -[   ] opennlp-nl-ud-alpino-pos-1.0-1.9.3.bin 2021-05-29 13:55 897K -[TXT] opennlp-nl-ud-alpino-pos-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-nl-ud-alpino-pos-1.0-1.9.3.bin.sha256 2021-05-29 13:55 107 -[TXT] opennlp-nl-ud-alpino-pos-1.0-1.9.3.bin.sha512 2021-05-29 13:55 171 -[   ] opennlp-nl-ud-alpino-sentence-1.0-1.9.3.bin 2021-05-29 13:55 13K -[TXT] 
opennlp-nl-ud-alpino-sentence-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-nl-ud-alpino-sentence-1.0-1.9.3.bin.sha256 2021-05-29 13:55 112 -[TXT] opennlp-nl-ud-alpino-sentence-1.0-1.9.3.bin.sha512 2021-05-29 13:55 176 -[   ] opennlp-nl-ud-alpino-tokens-1.0-1.9.3.bin 2021-05-29 13:55 340K -[TXT] opennlp-nl-ud-alpino-tokens-1.0-1.9.3.bin.asc 2021-05-29 13:55 833 -[TXT] opennlp-nl-ud-alpino-tokens-1.0-1.9.3.bin.sha256 2021-05-29 13:55 110 -[TXT] opennlp-nl-ud-alpino-tokens-1.0-1.9.3.bin.sha512 2021-05-29 13:55 174 -[   ] opennlp-training-eval-logs-1.0-1.9.3.zip 2021-05-29 13:55 40K -[TXT] opennlp-training-eval-logs-1.0-1.9.3.zip.asc 2021-05-29 13:55 833 -[TXT] opennlp-training-eval-logs-1.0-1.9.3.zip.sha256 2021-05-29 13:55 109 -[TXT] opennlp-training-eval-logs-1.0-1.9.3.zip.sha512 2021-05-29 13:55 173 + + Index of /opennlp/models/ud-models-1.1 + + +

Index of /opennlp/models/ud-models-1.1

+
Icon  Name                                                  Last modified      Size  Description
[PARENTDIR] Parent Directory - +[   ] CHANGES 2024-10-11 13:41 1.8K +[   ] LICENSE 2024-10-11 13:41 13K +[   ] NOTICE 2024-10-11 13:41 79 +[   ] README 2024-10-11 13:41 635 +[   ] opennlp-bg-ud-btb-pos-1.1-2.4.0.bin 2024-10-11 13:41 676K +[TXT] opennlp-bg-ud-btb-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-bg-ud-btb-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-bg-ud-btb-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-bg-ud-btb-sentence-1.1-2.4.0.bin 2024-10-11 13:41 11K +[TXT] opennlp-bg-ud-btb-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-bg-ud-btb-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-bg-ud-btb-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-bg-ud-btb-tokens-1.1-2.4.0.bin 2024-10-11 13:41 299K +[TXT] opennlp-bg-ud-btb-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-bg-ud-btb-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-bg-ud-btb-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-cs-ud-pdt-pos-1.1-2.4.0.bin 2024-10-11 13:41 5.2M +[TXT] opennlp-cs-ud-pdt-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-cs-ud-pdt-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-cs-ud-pdt-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-cs-ud-pdt-sentence-1.1-2.4.0.bin 2024-10-11 13:41 85K +[TXT] opennlp-cs-ud-pdt-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-cs-ud-pdt-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-cs-ud-pdt-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-cs-ud-pdt-tokens-1.1-2.4.0.bin 2024-10-11 13:41 1.5M +[TXT] opennlp-cs-ud-pdt-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-cs-ud-pdt-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-cs-ud-pdt-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-da-ud-ddt-pos-1.1-2.4.0.bin 2024-10-11 13:41 439K +[TXT] opennlp-da-ud-ddt-pos-1.1-2.4.0.bin.asc 
2024-10-11 13:41 833 +[TXT] opennlp-da-ud-ddt-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-da-ud-ddt-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-da-ud-ddt-sentence-1.1-2.4.0.bin 2024-10-11 13:41 6.3K +[TXT] opennlp-da-ud-ddt-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-da-ud-ddt-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-da-ud-ddt-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-da-ud-ddt-tokens-1.1-2.4.0.bin 2024-10-11 13:41 170K +[TXT] opennlp-da-ud-ddt-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-da-ud-ddt-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-da-ud-ddt-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-de-ud-gsd-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.2M +[TXT] opennlp-de-ud-gsd-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-de-ud-gsd-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-de-ud-gsd-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-de-ud-gsd-sentence-1.1-2.4.0.bin 2024-10-11 13:41 15K +[TXT] opennlp-de-ud-gsd-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-de-ud-gsd-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-de-ud-gsd-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-de-ud-gsd-tokens-1.1-2.4.0.bin 2024-10-11 13:41 510K +[TXT] opennlp-de-ud-gsd-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-de-ud-gsd-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-de-ud-gsd-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-en-ud-ewt-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.1M +[TXT] opennlp-en-ud-ewt-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-en-ud-ewt-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-en-ud-ewt-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-en-ud-ewt-sentence-1.1-2.4.0.bin 2024-10-11 13:41 20K +[TXT] opennlp-en-ud-ewt-sentence-1.1-2.4.0.bin.asc 
2024-10-11 13:41 833 +[TXT] opennlp-en-ud-ewt-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-en-ud-ewt-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-en-ud-ewt-tokens-1.1-2.4.0.bin 2024-10-11 13:41 318K +[TXT] opennlp-en-ud-ewt-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-en-ud-ewt-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-en-ud-ewt-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-es-ud-gsd-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.7M +[TXT] opennlp-es-ud-gsd-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-es-ud-gsd-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-es-ud-gsd-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-es-ud-gsd-sentence-1.1-2.4.0.bin 2024-10-11 13:41 14K +[TXT] opennlp-es-ud-gsd-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-es-ud-gsd-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-es-ud-gsd-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-es-ud-gsd-tokens-1.1-2.4.0.bin 2024-10-11 13:41 525K +[TXT] opennlp-es-ud-gsd-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-es-ud-gsd-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-es-ud-gsd-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-et-ud-edt-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.8M +[TXT] opennlp-et-ud-edt-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-et-ud-edt-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-et-ud-edt-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-et-ud-edt-sentence-1.1-2.4.0.bin 2024-10-11 13:41 29K +[TXT] opennlp-et-ud-edt-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-et-ud-edt-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-et-ud-edt-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-et-ud-edt-tokens-1.1-2.4.0.bin 2024-10-11 13:41 718K +[TXT] 
opennlp-et-ud-edt-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-et-ud-edt-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-et-ud-edt-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-fi-ud-tdt-pos-1.1-2.4.0.bin 2024-10-11 13:41 921K +[TXT] opennlp-fi-ud-tdt-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-fi-ud-tdt-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-fi-ud-tdt-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-fi-ud-tdt-sentence-1.1-2.4.0.bin 2024-10-11 13:41 12K +[TXT] opennlp-fi-ud-tdt-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-fi-ud-tdt-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-fi-ud-tdt-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-fi-ud-tdt-tokens-1.1-2.4.0.bin 2024-10-11 13:41 452K +[TXT] opennlp-fi-ud-tdt-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-fi-ud-tdt-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-fi-ud-tdt-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-fr-ud-gsd-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.5M +[TXT] opennlp-fr-ud-gsd-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-fr-ud-gsd-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-fr-ud-gsd-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-fr-ud-gsd-sentence-1.1-2.4.0.bin 2024-10-11 13:41 12K +[TXT] opennlp-fr-ud-gsd-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-fr-ud-gsd-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-fr-ud-gsd-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-fr-ud-gsd-tokens-1.1-2.4.0.bin 2024-10-11 13:41 530K +[TXT] opennlp-fr-ud-gsd-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-fr-ud-gsd-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-fr-ud-gsd-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-hr-ud-set-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.0M +[TXT] 
opennlp-hr-ud-set-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-hr-ud-set-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-hr-ud-set-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-hr-ud-set-sentence-1.1-2.4.0.bin 2024-10-11 13:41 9.2K +[TXT] opennlp-hr-ud-set-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-hr-ud-set-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-hr-ud-set-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-hr-ud-set-tokens-1.1-2.4.0.bin 2024-10-11 13:41 346K +[TXT] opennlp-hr-ud-set-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-hr-ud-set-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-hr-ud-set-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-it-ud-vit-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.1M +[TXT] opennlp-it-ud-vit-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-it-ud-vit-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-it-ud-vit-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-it-ud-vit-sentence-1.1-2.4.0.bin 2024-10-11 13:41 10K +[TXT] opennlp-it-ud-vit-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-it-ud-vit-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-it-ud-vit-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-it-ud-vit-tokens-1.1-2.4.0.bin 2024-10-11 13:41 356K +[TXT] opennlp-it-ud-vit-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-it-ud-vit-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-it-ud-vit-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-lv-ud-lvtb-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.4M +[TXT] opennlp-lv-ud-lvtb-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-lv-ud-lvtb-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 103 +[TXT] opennlp-lv-ud-lvtb-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 167 +[   ] opennlp-lv-ud-lvtb-sentence-1.1-2.4.0.bin 2024-10-11 13:41 19K +[TXT] 
opennlp-lv-ud-lvtb-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-lv-ud-lvtb-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 108 +[TXT] opennlp-lv-ud-lvtb-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 172 +[   ] opennlp-lv-ud-lvtb-tokens-1.1-2.4.0.bin 2024-10-11 13:41 515K +[TXT] opennlp-lv-ud-lvtb-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-lv-ud-lvtb-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 106 +[TXT] opennlp-lv-ud-lvtb-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 170 +[   ] opennlp-nl-ud-alpino-pos-1.1-2.4.0.bin 2024-10-11 13:41 890K +[TXT] opennlp-nl-ud-alpino-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-nl-ud-alpino-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-nl-ud-alpino-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-nl-ud-alpino-sentence-1.1-2.4.0.bin 2024-10-11 13:41 12K +[TXT] opennlp-nl-ud-alpino-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-nl-ud-alpino-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 110 +[TXT] opennlp-nl-ud-alpino-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 174 +[   ] opennlp-nl-ud-alpino-tokens-1.1-2.4.0.bin 2024-10-11 13:41 319K +[TXT] opennlp-nl-ud-alpino-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-nl-ud-alpino-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 108 +[TXT] opennlp-nl-ud-alpino-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 172 +[   ] opennlp-no-ud-bokmaal-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.1M +[TXT] opennlp-no-ud-bokmaal-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-no-ud-bokmaal-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 106 +[TXT] opennlp-no-ud-bokmaal-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 170 +[   ] opennlp-no-ud-bokmaal-sentence-1.1-2.4.0.bin 2024-10-11 13:41 16K +[TXT] opennlp-no-ud-bokmaal-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-no-ud-bokmaal-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 111 +[TXT] opennlp-no-ud-bokmaal-sentence-1.1-2.4.0.bin.sha512 2024-10-11 
13:41 175 +[   ] opennlp-no-ud-bokmaal-tokens-1.1-2.4.0.bin 2024-10-11 13:41 394K +[TXT] opennlp-no-ud-bokmaal-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-no-ud-bokmaal-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 109 +[TXT] opennlp-no-ud-bokmaal-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 173 +[   ] opennlp-pl-ud-pdb-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.5M +[TXT] opennlp-pl-ud-pdb-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-pl-ud-pdb-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-pl-ud-pdb-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-pl-ud-pdb-sentence-1.1-2.4.0.bin 2024-10-11 13:41 21K +[TXT] opennlp-pl-ud-pdb-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-pl-ud-pdb-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-pl-ud-pdb-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-pl-ud-pdb-tokens-1.1-2.4.0.bin 2024-10-11 13:41 589K +[TXT] opennlp-pl-ud-pdb-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-pl-ud-pdb-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-pl-ud-pdb-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-pt-ud-gsd-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.2M +[TXT] opennlp-pt-ud-gsd-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-pt-ud-gsd-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-pt-ud-gsd-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-pt-ud-gsd-sentence-1.1-2.4.0.bin 2024-10-11 13:41 19K +[TXT] opennlp-pt-ud-gsd-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-pt-ud-gsd-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-pt-ud-gsd-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-pt-ud-gsd-tokens-1.1-2.4.0.bin 2024-10-11 13:41 390K +[TXT] opennlp-pt-ud-gsd-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-pt-ud-gsd-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] 
opennlp-pt-ud-gsd-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-ro-ud-rrt-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.0M +[TXT] opennlp-ro-ud-rrt-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-ro-ud-rrt-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-ro-ud-rrt-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-ro-ud-rrt-sentence-1.1-2.4.0.bin 2024-10-11 13:41 10K +[TXT] opennlp-ro-ud-rrt-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-ro-ud-rrt-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-ro-ud-rrt-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-ro-ud-rrt-tokens-1.1-2.4.0.bin 2024-10-11 13:41 368K +[TXT] opennlp-ro-ud-rrt-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-ro-ud-rrt-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-ro-ud-rrt-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-ru-ud-gsd-pos-1.1-2.4.0.bin 2024-10-11 13:41 433K +[TXT] opennlp-ru-ud-gsd-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-ru-ud-gsd-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-ru-ud-gsd-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-ru-ud-gsd-sentence-1.1-2.4.0.bin 2024-10-11 13:41 4.1K +[TXT] opennlp-ru-ud-gsd-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-ru-ud-gsd-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-ru-ud-gsd-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-ru-ud-gsd-tokens-1.1-2.4.0.bin 2024-10-11 13:41 246K +[TXT] opennlp-ru-ud-gsd-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-ru-ud-gsd-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-ru-ud-gsd-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-sk-ud-snk-pos-1.1-2.4.0.bin 2024-10-11 13:41 475K +[TXT] opennlp-sk-ud-snk-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sk-ud-snk-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] 
opennlp-sk-ud-snk-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-sk-ud-snk-sentence-1.1-2.4.0.bin 2024-10-11 13:41 9.9K +[TXT] opennlp-sk-ud-snk-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sk-ud-snk-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-sk-ud-snk-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-sk-ud-snk-tokens-1.1-2.4.0.bin 2024-10-11 13:41 203K +[TXT] opennlp-sk-ud-snk-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sk-ud-snk-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-sk-ud-snk-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-sl-ud-ssj-pos-1.1-2.4.0.bin 2024-10-11 13:41 1.2M +[TXT] opennlp-sl-ud-ssj-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sl-ud-ssj-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-sl-ud-ssj-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-sl-ud-ssj-sentence-1.1-2.4.0.bin 2024-10-11 13:41 12K +[TXT] opennlp-sl-ud-ssj-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sl-ud-ssj-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 +[TXT] opennlp-sl-ud-ssj-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-sl-ud-ssj-tokens-1.1-2.4.0.bin 2024-10-11 13:41 414K +[TXT] opennlp-sl-ud-ssj-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sl-ud-ssj-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-sl-ud-ssj-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-sr-ud-set-pos-1.1-2.4.0.bin 2024-10-11 13:41 515K +[TXT] opennlp-sr-ud-set-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sr-ud-set-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 102 +[TXT] opennlp-sr-ud-set-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 166 +[   ] opennlp-sr-ud-set-sentence-1.1-2.4.0.bin 2024-10-11 13:41 5.1K +[TXT] opennlp-sr-ud-set-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sr-ud-set-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 107 
+[TXT] opennlp-sr-ud-set-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 171 +[   ] opennlp-sr-ud-set-tokens-1.1-2.4.0.bin 2024-10-11 13:41 198K +[TXT] opennlp-sr-ud-set-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sr-ud-set-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 105 +[TXT] opennlp-sr-ud-set-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 169 +[   ] opennlp-sv-ud-talbanken-pos-1.1-2.4.0.bin 2024-10-11 13:41 417K +[TXT] opennlp-sv-ud-talbanken-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sv-ud-talbanken-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 108 +[TXT] opennlp-sv-ud-talbanken-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 172 +[   ] opennlp-sv-ud-talbanken-sentence-1.1-2.4.0.bin 2024-10-11 13:41 5.8K +[TXT] opennlp-sv-ud-talbanken-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sv-ud-talbanken-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 113 +[TXT] opennlp-sv-ud-talbanken-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 177 +[   ] opennlp-sv-ud-talbanken-tokens-1.1-2.4.0.bin 2024-10-11 13:41 167K +[TXT] opennlp-sv-ud-talbanken-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-sv-ud-talbanken-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 111 +[TXT] opennlp-sv-ud-talbanken-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 175 +[   ] opennlp-training-eval-logs-1.1-2.4.0.zip 2024-10-11 13:41 204K +[TXT] opennlp-training-eval-logs-1.1-2.4.0.zip.asc 2024-10-11 13:41 833 +[TXT] opennlp-training-eval-logs-1.1-2.4.0.zip.sha256 2024-10-11 13:41 107 +[TXT] opennlp-training-eval-logs-1.1-2.4.0.zip.sha512 2024-10-11 13:41 171 +[   ] opennlp-uk-ud-iu-pos-1.1-2.4.0.bin 2024-10-11 13:41 559K +[TXT] opennlp-uk-ud-iu-pos-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-uk-ud-iu-pos-1.1-2.4.0.bin.sha256 2024-10-11 13:41 101 +[TXT] opennlp-uk-ud-iu-pos-1.1-2.4.0.bin.sha512 2024-10-11 13:41 165 +[   ] opennlp-uk-ud-iu-sentence-1.1-2.4.0.bin 2024-10-11 13:41 6.2K +[TXT] opennlp-uk-ud-iu-sentence-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 
+[TXT] opennlp-uk-ud-iu-sentence-1.1-2.4.0.bin.sha256 2024-10-11 13:41 106 +[TXT] opennlp-uk-ud-iu-sentence-1.1-2.4.0.bin.sha512 2024-10-11 13:41 170 +[   ] opennlp-uk-ud-iu-tokens-1.1-2.4.0.bin 2024-10-11 13:41 249K +[TXT] opennlp-uk-ud-iu-tokens-1.1-2.4.0.bin.asc 2024-10-11 13:41 833 +[TXT] opennlp-uk-ud-iu-tokens-1.1-2.4.0.bin.sha256 2024-10-11 13:41 104 +[TXT] opennlp-uk-ud-iu-tokens-1.1-2.4.0.bin.sha512 2024-10-11 13:41 168
- diff --git a/pom.xml b/pom.xml index 73c39ecff..d2b234c7c 100644 --- a/pom.xml +++ b/pom.xml @@ -179,7 +179,7 @@ 2.23.1 1.37 4.8.176 - 1.0.1 + 1.1.0 1.0C 4.3.0 0.8.12