From 6870433231c22822bcdf291f24917a254d0275bd Mon Sep 17 00:00:00 2001 From: Richard Eckart de Castilho Date: Sun, 17 Nov 2024 14:02:29 +0100 Subject: [PATCH] #1604 - Drop IXA module - Removed IXA module --- dkpro-core-asl/pom.xml | 1 - dkpro-core-bom-asl/pom.xml | 5 - dkpro-core-ixa-asl/LICENSE.txt | 202 ------ dkpro-core-ixa-asl/pom.xml | 439 ------------ .../org/dkpro/core/ixa/IxaLemmatizer.java | 184 ----- .../java/org/dkpro/core/ixa/IxaPosTagger.java | 54 -- ...xaLemmatizerTagsetDescriptionProvider.java | 85 --- .../ixa/lib/lemmatizer-default-variants.map | 8 - .../core/ixa/lib/tagger-default-variants.map | 8 - dkpro-core-ixa-asl/src/scripts/build.xml | 658 ------------------ .../org/dkpro/core/ixa/IxaLemmatizerTest.java | 235 ------- .../org/dkpro/core/ixa/IxaPosTaggerTest.java | 337 --------- .../src/test/resources/log4j2.xml | 16 - 13 files changed, 2232 deletions(-) delete mode 100644 dkpro-core-ixa-asl/LICENSE.txt delete mode 100644 dkpro-core-ixa-asl/pom.xml delete mode 100644 dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/IxaLemmatizer.java delete mode 100644 dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/IxaPosTagger.java delete mode 100644 dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/internal/IxaLemmatizerTagsetDescriptionProvider.java delete mode 100644 dkpro-core-ixa-asl/src/main/resources/org/dkpro/core/ixa/lib/lemmatizer-default-variants.map delete mode 100644 dkpro-core-ixa-asl/src/main/resources/org/dkpro/core/ixa/lib/tagger-default-variants.map delete mode 100644 dkpro-core-ixa-asl/src/scripts/build.xml delete mode 100644 dkpro-core-ixa-asl/src/test/java/org/dkpro/core/ixa/IxaLemmatizerTest.java delete mode 100644 dkpro-core-ixa-asl/src/test/java/org/dkpro/core/ixa/IxaPosTaggerTest.java delete mode 100644 dkpro-core-ixa-asl/src/test/resources/log4j2.xml diff --git a/dkpro-core-asl/pom.xml b/dkpro-core-asl/pom.xml index a5f82bf462..7e1ac5eb77 100644 --- a/dkpro-core-asl/pom.xml +++ b/dkpro-core-asl/pom.xml @@ -120,7 +120,6 @@ ../dkpro-core-hunpos-asl ../dkpro-core-icu-asl ../dkpro-core-ivy-resolver-asl - ../dkpro-core-ixa-asl ../dkpro-core-jazzy-asl ../dkpro-core-jtok-asl ../dkpro-core-jieba-asl diff --git a/dkpro-core-bom-asl/pom.xml b/dkpro-core-bom-asl/pom.xml index a31e044063..f7a4380b4b 100644 --- a/dkpro-core-bom-asl/pom.xml +++ b/dkpro-core-bom-asl/pom.xml @@ -409,11 +409,6 @@ dkpro-core-io-xces-asl 3.0.0-SNAPSHOT - - org.dkpro.core - dkpro-core-ixa-asl - 3.0.0-SNAPSHOT - org.dkpro.core dkpro-core-jazzy-asl diff --git a/dkpro-core-ixa-asl/LICENSE.txt b/dkpro-core-ixa-asl/LICENSE.txt deleted file mode 100644 index d645695673..0000000000 --- a/dkpro-core-ixa-asl/LICENSE.txt +++ /dev/null @@ -1,202 +0,0 @@ - - Apache License - Version 2.0, January 2004 - http://www.apache.org/licenses/ - - TERMS AND CONDITIONS FOR USE, REPRODUCTION, AND DISTRIBUTION - - 1. Definitions. - - "License" shall mean the terms and conditions for use, reproduction, - and distribution as defined by Sections 1 through 9 of this document. - - "Licensor" shall mean the copyright owner or entity authorized by - the copyright owner that is granting the License. - - "Legal Entity" shall mean the union of the acting entity and all - other entities that control, are controlled by, or are under common - control with that entity. For the purposes of this definition, - "control" means (i) the power, direct or indirect, to cause the - direction or management of such entity, whether by contract or - otherwise, or (ii) ownership of fifty percent (50%) or more of the - outstanding shares, or (iii) beneficial ownership of such entity. - - "You" (or "Your") shall mean an individual or Legal Entity - exercising permissions granted by this License. - - "Source" form shall mean the preferred form for making modifications, - including but not limited to software source code, documentation - source, and configuration files. - - "Object" form shall mean any form resulting from mechanical - transformation or translation of a Source form, including but - not limited to compiled object code, generated documentation, - and conversions to other media types. - - "Work" shall mean the work of authorship, whether in Source or - Object form, made available under the License, as indicated by a - copyright notice that is included in or attached to the work - (an example is provided in the Appendix below). - - "Derivative Works" shall mean any work, whether in Source or Object - form, that is based on (or derived from) the Work and for which the - editorial revisions, annotations, elaborations, or other modifications - represent, as a whole, an original work of authorship. For the purposes - of this License, Derivative Works shall not include works that remain - separable from, or merely link (or bind by name) to the interfaces of, - the Work and Derivative Works thereof. - - "Contribution" shall mean any work of authorship, including - the original version of the Work and any modifications or additions - to that Work or Derivative Works thereof, that is intentionally - submitted to Licensor for inclusion in the Work by the copyright owner - or by an individual or Legal Entity authorized to submit on behalf of - the copyright owner. For the purposes of this definition, "submitted" - means any form of electronic, verbal, or written communication sent - to the Licensor or its representatives, including but not limited to - communication on electronic mailing lists, source code control systems, - and issue tracking systems that are managed by, or on behalf of, the - Licensor for the purpose of discussing and improving the Work, but - excluding communication that is conspicuously marked or otherwise - designated in writing by the copyright owner as "Not a Contribution." - - "Contributor" shall mean Licensor and any individual or Legal Entity - on behalf of whom a Contribution has been received by Licensor and - subsequently incorporated within the Work. - - 2. Grant of Copyright License. Subject to the terms and conditions of - this License, each Contributor hereby grants to You a perpetual, - worldwide, non-exclusive, no-charge, royalty-free, irrevocable - copyright license to reproduce, prepare Derivative Works of, - publicly display, publicly perform, sublicense, and distribute the - Work and such Derivative Works in Source or Object form. - - 3. Grant of Patent License. Subject to the terms and conditions of - this License, each Contributor hereby grants to You a perpetual, - worldwide, non-exclusive, no-charge, royalty-free, irrevocable - (except as stated in this section) patent license to make, have made, - use, offer to sell, sell, import, and otherwise transfer the Work, - where such license applies only to those patent claims licensable - by such Contributor that are necessarily infringed by their - Contribution(s) alone or by combination of their Contribution(s) - with the Work to which such Contribution(s) was submitted. If You - institute patent litigation against any entity (including a - cross-claim or counterclaim in a lawsuit) alleging that the Work - or a Contribution incorporated within the Work constitutes direct - or contributory patent infringement, then any patent licenses - granted to You under this License for that Work shall terminate - as of the date such litigation is filed. - - 4. Redistribution. You may reproduce and distribute copies of the - Work or Derivative Works thereof in any medium, with or without - modifications, and in Source or Object form, provided that You - meet the following conditions: - - (a) You must give any other recipients of the Work or - Derivative Works a copy of this License; and - - (b) You must cause any modified files to carry prominent notices - stating that You changed the files; and - - (c) You must retain, in the Source form of any Derivative Works - that You distribute, all copyright, patent, trademark, and - attribution notices from the Source form of the Work, - excluding those notices that do not pertain to any part of - the Derivative Works; and - - (d) If the Work includes a "NOTICE" text file as part of its - distribution, then any Derivative Works that You distribute must - include a readable copy of the attribution notices contained - within such NOTICE file, excluding those notices that do not - pertain to any part of the Derivative Works, in at least one - of the following places: within a NOTICE text file distributed - as part of the Derivative Works; within the Source form or - documentation, if provided along with the Derivative Works; or, - within a display generated by the Derivative Works, if and - wherever such third-party notices normally appear. The contents - of the NOTICE file are for informational purposes only and - do not modify the License. You may add Your own attribution - notices within Derivative Works that You distribute, alongside - or as an addendum to the NOTICE text from the Work, provided - that such additional attribution notices cannot be construed - as modifying the License. - - You may add Your own copyright statement to Your modifications and - may provide additional or different license terms and conditions - for use, reproduction, or distribution of Your modifications, or - for any such Derivative Works as a whole, provided Your use, - reproduction, and distribution of the Work otherwise complies with - the conditions stated in this License. - - 5. Submission of Contributions. Unless You explicitly state otherwise, - any Contribution intentionally submitted for inclusion in the Work - by You to the Licensor shall be under the terms and conditions of - this License, without any additional terms or conditions. - Notwithstanding the above, nothing herein shall supersede or modify - the terms of any separate license agreement you may have executed - with Licensor regarding such Contributions. - - 6. Trademarks. This License does not grant permission to use the trade - names, trademarks, service marks, or product names of the Licensor, - except as required for reasonable and customary use in describing the - origin of the Work and reproducing the content of the NOTICE file. - - 7. Disclaimer of Warranty. Unless required by applicable law or - agreed to in writing, Licensor provides the Work (and each - Contributor provides its Contributions) on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or - implied, including, without limitation, any warranties or conditions - of TITLE, NON-INFRINGEMENT, MERCHANTABILITY, or FITNESS FOR A - PARTICULAR PURPOSE. You are solely responsible for determining the - appropriateness of using or redistributing the Work and assume any - risks associated with Your exercise of permissions under this License. - - 8. Limitation of Liability. In no event and under no legal theory, - whether in tort (including negligence), contract, or otherwise, - unless required by applicable law (such as deliberate and grossly - negligent acts) or agreed to in writing, shall any Contributor be - liable to You for damages, including any direct, indirect, special, - incidental, or consequential damages of any character arising as a - result of this License or out of the use or inability to use the - Work (including but not limited to damages for loss of goodwill, - work stoppage, computer failure or malfunction, or any and all - other commercial damages or losses), even if such Contributor - has been advised of the possibility of such damages. - - 9. Accepting Warranty or Additional Liability. While redistributing - the Work or Derivative Works thereof, You may choose to offer, - and charge a fee for, acceptance of support, warranty, indemnity, - or other liability obligations and/or rights consistent with this - License. However, in accepting such obligations, You may act only - on Your own behalf and on Your sole responsibility, not on behalf - of any other Contributor, and only if You agree to indemnify, - defend, and hold each Contributor harmless for any liability - incurred by, or claims asserted against, such Contributor by reason - of your accepting any such warranty or additional liability. - - END OF TERMS AND CONDITIONS - - APPENDIX: How to apply the Apache License to your work. - - To apply the Apache License to your work, attach the following - boilerplate notice, with the fields enclosed by brackets "[]" - replaced with your own identifying information. (Don't include - the brackets!) The text should be enclosed in the appropriate - comment syntax for the file format. We also recommend that a - file or class name and description of purpose be included on the - same "printed page" as the copyright notice for easier - identification within third-party archives. - - Copyright [yyyy] [name of copyright owner] - - Licensed under the Apache License, Version 2.0 (the "License"); - you may not use this file except in compliance with the License. - You may obtain a copy of the License at - - http://www.apache.org/licenses/LICENSE-2.0 - - Unless required by applicable law or agreed to in writing, software - distributed under the License is distributed on an "AS IS" BASIS, - WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - See the License for the specific language governing permissions and - limitations under the License. diff --git a/dkpro-core-ixa-asl/pom.xml b/dkpro-core-ixa-asl/pom.xml deleted file mode 100644 index 536d5e56b3..0000000000 --- a/dkpro-core-ixa-asl/pom.xml +++ /dev/null @@ -1,439 +0,0 @@ - - - 4.0.0 - - org.dkpro.core - dkpro-core-asl - 3.0.0-SNAPSHOT - ../dkpro-core-asl - - - dkpro-core-ixa-asl - jar - DKPro Core ASL - IXA - https://dkpro.github.io/dkpro-core/ - - - - org.apache.uima - uimaj-core - - - org.apache.uima - uimafit-core - - - org.apache.commons - commons-lang3 - - - org.apache.opennlp - opennlp-tools - - 2.1.0 - - - eus.ixa - ixa-pipe-pos - 1.5.3 - - - - - org.dkpro.core - dkpro-core-api-lexmorph-asl - ${project.version} - - - org.dkpro.core - dkpro-core-api-resources-asl - ${project.version} - - - org.dkpro.core - dkpro-core-api-parameter-asl - ${project.version} - - - org.dkpro.core - dkpro-core-api-metadata-asl - ${project.version} - - - org.dkpro.core - dkpro-core-api-segmentation-asl - ${project.version} - - - - org.dkpro.core - dkpro-core-opennlp-asl - ${project.version} - - - eu.openminted.share.annotations - omtd-share-annotations-api - - - org.dkpro.core - dkpro-core-testing-asl - ${project.version} - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-perceptron-autodict01-conll09 - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-en-perceptron-conll09 - test - - - - - - - org.dkpro.core - dkpro-core-opennlp-asl - ${project.version} - pom - import - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-de-perceptron-autodict01-conll09 - 20160213.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-de-perceptron-perceptron-autodict01-conll09 - 20160213.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-perceptron-autodict01-conll09 - 20160211.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-maxent-100-c5-baseline-autodict01-conll09 - 20160211.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-perceptron-autodict01-ud - 20160214.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-xpos-perceptron-autodict01-ud - 20160214.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-es-perceptron-autodict01-ancora-2.0 - 20160212.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-eu-perceptron-ud - 20160212.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-fr-perceptron-autodict01-sequoia - 20160215.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-gl-perceptron-autdict05-ctag - 20160212.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-it-perceptron-autodict01-ud - 20160213.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-nl-maxent-100-c5-autodict01-alpino - 20160214.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-nl-perceptron-autodict01-alpino - 20160214.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-de-perceptron-conll09 - 20160213.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-en-perceptron-conll09 - 20160211.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-en-perceptron-ud - 20160214.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-en-xlemma-perceptron-ud - 20160214.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-es-perceptron-ancora-2.0 - 20160211.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-eu-perceptron-ud - 20160212.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-fr-perceptron-sequoia - 20160215.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-gl-perceptron-autodict05-ctag - 20160212.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-it-perceptron-ud - 20160213.1 - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-nl-perceptron-alpino - 20160215.1 - - - - - - - - - org.apache.maven.plugins - maven-dependency-plugin - - - - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-perceptron-autodict01-conll09 - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-en-perceptron-conll09 - - - - - - - - - - use-full-resources - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-de-perceptron-autodict01-conll09 - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-perceptron-autodict01-conll09 - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-maxent-100-c5-baseline-autodict01-conll09 - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-perceptron-autodict01-ud - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-xpos-perceptron-autodict01-ud - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-es-perceptron-autodict01-ancora-2.0 - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-eu-perceptron-ud - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-fr-perceptron-autodict01-sequoia - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-gl-perceptron-autdict05-ctag - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-it-perceptron-autodict01-ud - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-nl-maxent-100-c5-autodict01-alpino - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-nl-perceptron-autodict01-alpino - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-de-perceptron-conll09 - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-en-perceptron-ud - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-en-xlemma-perceptron-ud - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-es-perceptron-ancora-2.0 - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-eu-perceptron-ud - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-fr-perceptron-sequoia - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-gl-perceptron-autodict05-ctag - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-it-perceptron-ud - test - - - de.tudarmstadt.ukp.dkpro.core - de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-nl-perceptron-alpino - test - - - - - - - org.apache.maven.plugins - maven-dependency-plugin - - - - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-de-perceptron-autodict01-conll09 - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-maxent-100-c5-baseline-autodict01-conll09 - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-perceptron-autodict01-ud - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-en-xpos-perceptron-autodict01-ud - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-es-perceptron-autodict01-ancora-2.0 - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-eu-perceptron-ud - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-fr-perceptron-autodict01-sequoia - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-gl-perceptron-autdict05-ctag - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-it-perceptron-autodict01-ud - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-nl-maxent-100-c5-autodict01-alpino - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-tagger-nl-perceptron-autodict01-alpino - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-de-perceptron-conll09 - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-en-perceptron-ud - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-en-xlemma-perceptron-ud - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-es-perceptron-ancora-2.0 - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-eu-perceptron-ud - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-fr-perceptron-sequoia - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-gl-perceptron-autodict05-ctag - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-it-perceptron-ud - de.tudarmstadt.ukp.dkpro.core:de.tudarmstadt.ukp.dkpro.core.ixa-model-lemmatizer-nl-perceptron-alpino - - - - - - - - - \ No newline at end of file diff --git a/dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/IxaLemmatizer.java b/dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/IxaLemmatizer.java deleted file mode 100644 index 1b637b3f79..0000000000 --- a/dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/IxaLemmatizer.java +++ /dev/null @@ -1,184 +0,0 @@ -/* - * Copyright 2017 - * Ubiquitous Knowledge Processing (UKP) Lab - * Technische Universität Darmstadt - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -package org.dkpro.core.ixa; - -import static org.apache.uima.fit.util.JCasUtil.indexCovered; -import static org.apache.uima.fit.util.JCasUtil.select; -import static org.apache.uima.fit.util.JCasUtil.toText; -import static org.apache.uima.util.Level.INFO; - -import java.io.InputStream; -import java.util.Collection; -import java.util.List; -import java.util.Map; - -import org.apache.uima.UimaContext; -import org.apache.uima.analysis_engine.AnalysisEngineProcessException; -import org.apache.uima.fit.component.JCasAnnotator_ImplBase; -import org.apache.uima.fit.descriptor.ConfigurationParameter; -import org.apache.uima.fit.descriptor.ResourceMetaData; -import org.apache.uima.fit.descriptor.TypeCapability; -import org.apache.uima.jcas.JCas; -import org.apache.uima.resource.ResourceInitializationException; -import org.dkpro.core.api.parameter.ComponentParameters; -import org.dkpro.core.api.resources.CasConfigurableProviderBase; -import org.dkpro.core.api.resources.ModelProviderBase; -import org.dkpro.core.ixa.internal.IxaLemmatizerTagsetDescriptionProvider; - -import de.tudarmstadt.ukp.dkpro.core.api.lexmorph.type.pos.POS; -import de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Lemma; -import de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Sentence; -import de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Token; -import eu.openminted.share.annotations.api.Component; -import eu.openminted.share.annotations.api.DocumentationResource; -import eu.openminted.share.annotations.api.constants.OperationType; -import eus.ixa.ixa.pipe.lemma.LemmatizerME; -import eus.ixa.ixa.pipe.lemma.LemmatizerModel; - -/** - * Lemmatizer using the OpenNLP-based Ixa implementation. - */ -@Component(OperationType.LEMMATIZER) -@ResourceMetaData(name = "IXA Lemmatizer") -@DocumentationResource("${docbase}/component-reference.html#engine-${shortClassName}") -@TypeCapability( - inputs = { - "de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Sentence", - "de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Token", - "de.tudarmstadt.ukp.dkpro.core.api.lexmorph.type.pos.POS" }, - outputs = { - "de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Lemma" }) -public class IxaLemmatizer - extends JCasAnnotator_ImplBase -{ - /** - * Use this language instead of the document language to resolve the model. - */ - public static final String PARAM_LANGUAGE = ComponentParameters.PARAM_LANGUAGE; - @ConfigurationParameter(name = PARAM_LANGUAGE, mandatory = false) - protected String language; - - /** - * Override the default variant used to locate the model. - */ - public static final String PARAM_VARIANT = ComponentParameters.PARAM_VARIANT; - @ConfigurationParameter(name = PARAM_VARIANT, mandatory = false) - protected String variant; - - /** - * URI of the model artifact. This can be used to override the default model resolving - * mechanism and directly address a particular model. - * - *

The URI format is {@code mvn:${groupId}:${artifactId}:${version}}. Remember to set - * the variant parameter to match the artifact. If the artifact contains the model in - * a non-default location, you also have to specify the model location parameter, e.g. - * {@code classpath:/model/path/in/artifact/model.bin}.

- */ - public static final String PARAM_MODEL_ARTIFACT_URI = - ComponentParameters.PARAM_MODEL_ARTIFACT_URI; - @ConfigurationParameter(name = PARAM_MODEL_ARTIFACT_URI, mandatory = false) - protected String modelArtifactUri; - - /** - * Load the model from this location instead of locating the model automatically. - */ - public static final String PARAM_MODEL_LOCATION = ComponentParameters.PARAM_MODEL_LOCATION; - @ConfigurationParameter(name = PARAM_MODEL_LOCATION, mandatory = false) - protected String modelLocation; - - /** - * Log the tag set(s) when a model is loaded. - */ - public static final String PARAM_PRINT_TAGSET = ComponentParameters.PARAM_PRINT_TAGSET; - @ConfigurationParameter(name = PARAM_PRINT_TAGSET, mandatory = true, defaultValue = "false") - protected boolean printTagSet; - - private CasConfigurableProviderBase modelProvider; - - @Override - public void initialize(UimaContext aContext) - throws ResourceInitializationException - { - super.initialize(aContext); - - modelProvider = new ModelProviderBase(this, "lemmatizer") - { - { - setDefault(GROUP_ID, "de.tudarmstadt.ukp.dkpro.core"); - setDefault(LOCATION, - "classpath:/de/tudarmstadt/ukp/dkpro/core/ixa/lib/lemmatizer-${language}-${variant}.properties"); - } - - @Override - protected LemmatizerME produceResource(InputStream aStream) - throws Exception - { - LemmatizerModel model = new LemmatizerModel(aStream); - - // Extract tagset information from the model - IxaLemmatizerTagsetDescriptionProvider tsdp = - new IxaLemmatizerTagsetDescriptionProvider( - getResourceMetaData().getProperty("pos.tagset"), POS.class, - model.getLemmatizerSequenceModel(), "t0"); - addTagset(tsdp, false); - - if (printTagSet) { - getContext().getLogger().log(INFO, tsdp.toString()); - } - - return new LemmatizerME(model); - } - - }; - } - - @Override - public void process(JCas aJCas) - throws AnalysisEngineProcessException - { - modelProvider.configure(aJCas.getCas()); - LemmatizerME analyzer = modelProvider.getResource(); - - // Iterate over all sentences - Map> index = indexCovered(aJCas, Sentence.class, Token.class); - for (Sentence sentence : select(aJCas, Sentence.class)) { - Collection tokens = index.get(sentence); - String[] tokenTexts = toText(tokens).toArray(new String[tokens.size()]); - String[] tokenPos = tokens.stream() - .map(t -> { return t.getPos().getPosValue(); }) - .toArray(s -> { return new String[tokens.size()]; }); - - String[] encodedLemmas = analyzer.lemmatize(tokenTexts, tokenPos); - String[] lemmas = analyzer.decodeLemmas(tokenTexts, encodedLemmas); - - int i = 0; - for (Token t : tokens) { - String lemmaString = lemmas[i]; - if (lemmaString == null) { - lemmaString = t.getText(); - } - Lemma l = new Lemma(aJCas, t.getBegin(), t.getEnd()); - l.setValue(lemmaString); - l.addToIndexes(); - - t.setLemma(l); - i++; - } - } - } -} diff --git a/dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/IxaPosTagger.java b/dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/IxaPosTagger.java deleted file mode 100644 index 9e1c48cba8..0000000000 --- a/dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/IxaPosTagger.java +++ /dev/null @@ -1,54 +0,0 @@ -/* - * Copyright 2017 - * Ubiquitous Knowledge Processing (UKP) Lab - * Technische Universität Darmstadt - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -package org.dkpro.core.ixa; - -import static org.dkpro.core.api.resources.ResourceObjectProviderBase.LOCATION; - -import org.apache.uima.UimaContext; -import org.apache.uima.fit.descriptor.ResourceMetaData; -import org.apache.uima.resource.ResourceInitializationException; -import org.dkpro.core.opennlp.OpenNlpPosTagger; - -import eu.openminted.share.annotations.api.Component; -import eu.openminted.share.annotations.api.DocumentationResource; -import eu.openminted.share.annotations.api.constants.OperationType; - -/** - * Part-of-Speech annotator using OpenNLP with IXA extensions. - */ -@Component(OperationType.PART_OF_SPEECH_TAGGER) -@ResourceMetaData(name = "IXA POS-Tagger") -@DocumentationResource("${docbase}/component-reference.html#engine-${shortClassName}") -public class IxaPosTagger - extends OpenNlpPosTagger -{ - // The IXA POS tagger models make use of IXA classes. But they do so from within OpenNLP. - // From the outside, it looks and works exactly like an OpenNLP POS tagger. So we just - // derive from the OpenNlpPosTagger in side this module. This has the effect that through - // the module dependencies, we have the required IXA JARs on the classpath. It also has - // the effect that the package for the models changes from ...opennlp.lib to ...ixa.lib. - - @Override - public void initialize(UimaContext aContext) throws ResourceInitializationException - { - super.initialize(aContext); - - modelProvider.setDefault(LOCATION, - "classpath:/de/tudarmstadt/ukp/dkpro/core/ixa/lib/tagger-${language}-${variant}.properties"); - } -} diff --git a/dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/internal/IxaLemmatizerTagsetDescriptionProvider.java b/dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/internal/IxaLemmatizerTagsetDescriptionProvider.java deleted file mode 100644 index 62b2d82d28..0000000000 --- a/dkpro-core-ixa-asl/src/main/java/org/dkpro/core/ixa/internal/IxaLemmatizerTagsetDescriptionProvider.java +++ /dev/null @@ -1,85 +0,0 @@ -/* - * Copyright 2017 - * Ubiquitous Knowledge Processing (UKP) Lab - * Technische Universität Darmstadt - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -package org.dkpro.core.ixa.internal; - -import static java.util.Collections.singletonMap; - -import java.util.HashMap; -import java.util.Map; -import java.util.Set; -import java.util.TreeSet; - -import org.apache.commons.lang3.StringUtils; -import org.apache.commons.lang3.reflect.FieldUtils; -import org.dkpro.core.api.metadata.TagsetBase; - -import opennlp.tools.ml.model.AbstractModel; -import opennlp.tools.ml.model.SequenceClassificationModel; - -public class IxaLemmatizerTagsetDescriptionProvider - extends TagsetBase -{ - private String name; - private String layer; - private SequenceClassificationModel model; - private String feature; - private String separator = "="; - - public IxaLemmatizerTagsetDescriptionProvider(String aName, Class aLayer, - SequenceClassificationModel aModel, String aFeature) - { - name = aName; - layer = aLayer.getName(); - model = aModel; - feature = aFeature; - } - - @Override - public Map getLayers() - { - return singletonMap(layer, name); - } - - @Override - public Set listTags(String aLayer, String aTagsetName) - { - try { - AbstractModel innerModel = (AbstractModel) FieldUtils.readField(model, "model", true); - HashMap pmap = (HashMap) FieldUtils - .readField(innerModel, "pmap", true); - - Set tagSet = new TreeSet(); - String prefix = feature + separator; - for (Object key : pmap.keySet()) { - if (key instanceof String && ((String) key).startsWith(prefix)) { - tagSet.add(StringUtils.substringAfter(((String) key), separator)); - } - } - - return tagSet; - } - catch (IllegalAccessException e) { - throw new IllegalStateException(e); - } - } - - public SequenceClassificationModel getModel() - { - return model; - } -} diff --git a/dkpro-core-ixa-asl/src/main/resources/org/dkpro/core/ixa/lib/lemmatizer-default-variants.map b/dkpro-core-ixa-asl/src/main/resources/org/dkpro/core/ixa/lib/lemmatizer-default-variants.map deleted file mode 100644 index 32b52780a0..0000000000 --- a/dkpro-core-ixa-asl/src/main/resources/org/dkpro/core/ixa/lib/lemmatizer-default-variants.map +++ /dev/null @@ -1,8 +0,0 @@ -de=perceptron-conll09 -en=perceptron-conll09 -es=perceptron-ancora-2.0 -eu=perceptron-ud -fr=perceptron-sequoia -gl=perceptron-autodict05-ctag -it=perceptron-ud -nl=perceptron-alpino diff --git a/dkpro-core-ixa-asl/src/main/resources/org/dkpro/core/ixa/lib/tagger-default-variants.map b/dkpro-core-ixa-asl/src/main/resources/org/dkpro/core/ixa/lib/tagger-default-variants.map deleted file mode 100644 index 43ddeced54..0000000000 --- a/dkpro-core-ixa-asl/src/main/resources/org/dkpro/core/ixa/lib/tagger-default-variants.map +++ /dev/null @@ -1,8 +0,0 @@ -de=perceptron-autodict01-conll09 -en=perceptron-autodict01-conll09 -es=perceptron-autodict01-ancora-2.0 -eu=perceptron-ud -fr=perceptron-autodict01-sequoia -gl=perceptron-autdict05-ctag -it=perceptron-autodict01-ud -nl=perceptron-autodict01-alpino diff --git a/dkpro-core-ixa-asl/src/scripts/build.xml b/dkpro-core-ixa-asl/src/scripts/build.xml deleted file mode 100644 index 131cc0c71e..0000000000 --- a/dkpro-core-ixa-asl/src/scripts/build.xml +++ /dev/null @@ -1,658 +0,0 @@ - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - \ No newline at end of file diff --git a/dkpro-core-ixa-asl/src/test/java/org/dkpro/core/ixa/IxaLemmatizerTest.java b/dkpro-core-ixa-asl/src/test/java/org/dkpro/core/ixa/IxaLemmatizerTest.java deleted file mode 100644 index ca8e3103e6..0000000000 --- a/dkpro-core-ixa-asl/src/test/java/org/dkpro/core/ixa/IxaLemmatizerTest.java +++ /dev/null @@ -1,235 +0,0 @@ -/* - * Copyright 2017 - * Ubiquitous Knowledge Processing (UKP) Lab - * Technische Universität Darmstadt - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -package org.dkpro.core.ixa; - -import static org.apache.uima.fit.factory.AnalysisEngineFactory.createEngineDescription; -import static org.apache.uima.fit.util.JCasUtil.select; - -import org.apache.uima.analysis_engine.AnalysisEngineDescription; -import org.apache.uima.jcas.JCas; -import org.dkpro.core.testing.AssertAnnotations; -import org.dkpro.core.testing.AssumeResource; -import org.dkpro.core.testing.TestRunner; -import org.junit.jupiter.api.Test; - -import de.tudarmstadt.ukp.dkpro.core.api.lexmorph.type.pos.POS; -import de.tudarmstadt.ukp.dkpro.core.api.segmentation.type.Lemma; - -public class IxaLemmatizerTest -{ - @Test - public void testBasque() - throws Exception - { - JCas jcas = runTest("eu", null, "Oso konplikatua esaldi adibidea da , eta horrek ahalik " - + "eta osagai eta mendekotasunen asko dauka behar dugu ."); - - String[] lemmas = { "oso", "konplikatu", "esaldi", "adibide", "izan", ",", "eta", "hori", - "ahal", "eta", "osagai", "eta", "mendekotasun", "asko", "eduki", "behar", "ukan", - "." }; - - AssertAnnotations.assertLemma(lemmas, select(jcas, Lemma.class)); - } - - @Test - public void testDutch() - throws Exception - { - JCas jcas = runTest("nl", null, "We hebben een zeer ingewikkeld voorbeeld zin , die zoveel " - + "mogelijk bestanddelen en afhankelijkheden bevat mogelijk ."); - - String[] lemmas = { "we", "heb", "een", "zeer", "ingewikkeld", "voorbeeld", "zin", ",", - "die", "zoveel", "mogelijk", "bestanddelen", "en", "afhankelijked_af", "bevat", - "mogelijk", "." }; - - AssertAnnotations.assertLemma(lemmas, select(jcas, Lemma.class)); - } - - @Test - public void testEnglish() - throws Exception - { - JCas jcas = runTest("en", null, "We need a very complicated example sentence , which " - + "contains as many constituents and dependencies as possible ."); - - String[] lemmas = { "we", "need", "a", "very", "complicate", "example", "sentence", ",", - "which", "contain", "as", "many", "constituent", "and", "dependency", "as", - "possible", "." }; - - AssertAnnotations.assertLemma(lemmas, select(jcas, Lemma.class)); - } - - @Test - public void testEnglishExtra() - throws Exception - { - { - JCas jcas = runTest("en", "perceptron-ud", "We need a very complicated example " - + "sentence , which contains as many constituents and dependencies as " - + "possible ."); - - String[] lemmas = { "we", "need", "a", "very", "complicated", "example", "sentence", - ",", "which", "contains", "as", "many", "constituents", "and", "dependency", - "as", "possible", "." }; - - AssertAnnotations.assertLemma(lemmas, select(jcas, Lemma.class)); - } - - { - JCas jcas = runTest("en", "xlemma-perceptron-ud", "We need a very complicated example " - + "sentence , which contains as many constituents and dependencies as " - + "possible."); - - String[] lemmas = { "we", "need", "a", "very", "complicate", "example", "sentence", ",", - "which", "contain", "as", "many", "constituent", "and", "dependency", "as", - "possible." }; - - AssertAnnotations.assertLemma(lemmas, select(jcas, Lemma.class)); - } - } - - @Test - public void testGerman() - throws Exception - { - JCas jcas = runTest("de", null, "Wir brauchen ein sehr kompliziertes Beispiel , welches " - + "möglichst viele Konstituenten und Dependenzen beinhaltet ."); - - String[] lemmas = { "wir", "brauchen", "ein", "sehr", "kompliziert", "beispiel", "_", - "welcher", "möglichst", "vieler", "konstituent", "und", "dependenz", "beinhalten", - "_" }; - - AssertAnnotations.assertLemma(lemmas, select(jcas, Lemma.class)); - } - - @Test - public void testItalian() - throws Exception - { - JCas jcas = runTest("it", null, "Abbiamo bisogno di un esempio molto complicata frase , " - + "che contiene tante componenti e le dipendenze possibile ."); - - String[] lemmas = { "avere", "bisogno", "di", "uno", "esempio", "molto", "complicato", - "frase", ",", "che", "contenere", "tanto", "componente", "e", "il", "dipendenza", - "possibile", "." }; - - AssertAnnotations.assertLemma(lemmas, select(jcas, Lemma.class)); - } - - @Test - public void testFrench() - throws Exception - { - JCas jcas = runTest("es", null, "Nous avons besoin d' une phrase par exemple très " - + "compliqué , qui contient des constituants que de nombreuses dépendances et que " - + "possible ."); - - String[] lemmas = { "nous", "avon", "besoir", "d'", "unir", "phrar", "par", "exemple", - "trèr", "compliqué", ",", "qui", "contientr", "d", "constituant", "que", "de", - "nombreuse", "dépendanz", "et", "que", "possible", "." }; - - AssertAnnotations.assertLemma(lemmas, select(jcas, Lemma.class)); - } - - @Test - public void testGalician() - throws Exception - { - JCas jcas = runTest("gl", null, "Necesitamos unha frase de exemplo moi complicado , que " - + "contén o maior número de compoñentes e dependencias posible ."); - - String[] lemmas = { "necesitar", "un", "frase", "de", "exemplo", "moi", "complicar", ",", - "que", "conter", "o", "maior", "número", "de", "compoñente", "e", "dependencia", - "posible", "." }; - - AssertAnnotations.assertLemma(lemmas, select(jcas, Lemma.class)); - } - - @Test - public void testSpanish() - throws Exception - { - JCas jcas = runTest("es", null, "Necesitamos una oración de ejemplo muy complicado , que " - + "contiene la mayor cantidad de componentes y dependencias como sea posible ."); - - String[] lemmas = { "necesitr", "uno", "oración", "de", "ejemplo", "mucho", "complicado", - ",", "que", "contener", "el", "mayor", "cantidad", "de", "componente", "y", - "dependencia", "como", "ser", "posible", "." }; - - String[] posTags = { "AO0FP0", "AO0FS0", "AO0MP0", "AO0MS0", "AQ0000", "AQ000P", "AQ0CC0", - "AQ0CP0", "AQ0CS0", "AQ0FP0", "AQ0FPP", "AQ0FS0", "AQ0FSP", "AQ0MP0", "AQ0MPP", - "AQ0MS0", "AQ0MSP", "CC", "CS", "DA0CS0", "DA0FP0", "DA0FS0", "DA0MP0", "DA0MS0", - "DD0CP0", "DD0CS0", "DD0FP0", "DD0FS0", "DD0MP0", "DD0MS0", "DE0CC0", "DI0CP0", - "DI0CS0", "DI0FP0", "DI0FS0", "DI0MP0", "DI0MS0", "DN0CP0", "DN0CS0", "DN0FP0", - "DN0FS0", "DN0MP0", "DN0MS0", "DP1CPS", "DP1CSS", "DP1FPP", "DP1FSP", "DP1MPP", - "DP1MSP", "DP1MSS", "DP2CPS", "DP2CSS", "DP2FSP", "DP3CP0", "DP3CS0", "DP3MP0", - "DT0FS0", "DT0MP0", "Faa", "Fat", "Fc", "Fd", "Fe", "Fg", "Fh", "Fia", "Fit", "Fp", - "Fpa", "Fpt", "Fs", "Fx", "Fz", "I", "NCCC000", "NCCP000", "NCCS000", "NCF0000", - "NCFC000", "NCFP000", "NCFS000", "NCMC000", "NCMP000", "NCMS000", "NP00000", - "NPCC000", "P0000000", "P00CC000", "P01CS000", "P02CS000", "P03CC000", "PD0CP000", - "PD0CS000", "PD0FP000", "PD0FS000", "PD0MP000", "PD0MS000", "PI0CC000", "PI0CP000", - "PI0CS000", "PI0FP000", "PI0FS000", "PI0MP000", "PI0MS000", "PN0CP000", "PN0FP000", - "PN0FS000", "PN0MP000", "PN0MS000", "PP1CP000", "PP1CS000", "PP1CSN00", "PP1CSO00", - "PP1MP000", "PP2CP000", "PP2CP00P", "PP2CS000", "PP2CS00P", "PP2CSN00", "PP2CSO00", - "PP3CC000", "PP3CCA00", "PP3CCO00", "PP3CP000", "PP3CPA00", "PP3CPD00", "PP3CS000", - "PP3CSA00", "PP3CSD00", "PP3FP000", "PP3FPA00", "PP3FS000", "PP3FSA00", "PP3MP000", - "PP3MPA00", "PP3MS000", "PP3MSA00", "PR0CC000", "PR0CP000", "PR0CS000", "PR0FP000", - "PR0FS000", "PR0MP000", "PR0MS000", "PT000000", "PT0CC000", "PT0CP000", "PT0CS000", - "PT0FP000", "PT0MP000", "PX1FP0P0", "PX1FS0P0", "PX1FS0S0", "PX1MP0P0", "PX2FS0S0", - "PX3CS000", "PX3FP000", "PX3FS000", "PX3MP000", "PX3MS000", "RG", "RN", "SPCMS", - "SPS00", "SPSCC", "VAG0000", "VAIC1P0", "VAIC3P0", "VAIC3S0", "VAIF1P0", "VAIF1S0", - "VAIF2S0", "VAIF3P0", "VAIF3S0", "VAII1P0", "VAII1S0", "VAII2S0", "VAII3P0", - "VAII3S0", "VAIP1P0", "VAIP1S0", "VAIP2P0", "VAIP2S0", "VAIP3P0", "VAIP3S0", - "VAIS3P0", "VAIS3S0", "VAN0000", "VAP00SM", "VASI1P0", "VASI1S0", "VASI3P0", - "VASI3S0", "VASP1S0", "VASP3P0", "VMG0000", "VMIC1P0", "VMIC1S0", "VMIC2S0", - "VMIC3P0", "VMIC3S0", "VMIF1P0", "VMIF1S0", "VMIF2S0", "VMIF3P0", "VMIF3S0", - "VMII1P0", "VMII1S0", "VMII2P0", "VMII2S0", "VMII3P0", "VMII3S0", "VMIP1P0", - "VMIP1S0", "VMIP2P0", "VMIP2S0", "VMIP3P0", "VMIP3PC", "VMIP3S0", "VMIP3SC", - "VMIS1P0", "VMIS1S0", "VMIS2S0", "VMIS3P0", "VMIS3S0", "VMIS3SC", "VMM01P0", - "VMM02S0", "VMM03P0", "VMM03S0", "VMN0000", "VMP00PF", "VMP00PM", "VMP00SF", - "VMP00SM", "VMSI1P0", "VMSI1S0", "VMSI3P0", "VMSI3S0", "VMSP1P0", "VMSP1S0", - "VMSP2P0", "VMSP2S0", "VMSP3P0", "VMSP3S0", "VSG0000", "VSIC1S0", "VSIC2S0", - "VSIC3P0", "VSIC3S0", "VSIF1S0", "VSIF3P0", "VSIF3S0", "VSII1P0", "VSII3P0", - "VSII3S0", "VSIP1P0", "VSIP1S0", "VSIP2S0", "VSIP3P0", "VSIP3S0", "VSIS1S0", - "VSIS3P0", "VSIS3S0", "VSM02S0", "VSN0000", "VSP00SM", "VSSF3S0", "VSSI3P0", - "VSSI3S0", "VSSP1S0", "VSSP2S0", "VSSP3P0", "VSSP3S0", "W", "Z", "Zm", "Zp", "_" }; - - AssertAnnotations.assertLemma(lemmas, select(jcas, Lemma.class)); - // AssertAnnotations.assertTagset(IxaPosTagger.class, POS.class, "ancora-ixa", - // posTags, jcas); - AssertAnnotations.assertTagset(IxaLemmatizer.class, POS.class, "ancora-ixa", posTags, jcas); - } - - private JCas runTest(String aLanguage, String aVariant, String aText) - throws Exception - { - AssumeResource.assumeResource(IxaLemmatizer.class, "lemmatizer", aLanguage, aVariant); - - AnalysisEngineDescription tagger = createEngineDescription(IxaPosTagger.class); - - AnalysisEngineDescription lemmatizer = createEngineDescription(IxaLemmatizer.class, - IxaLemmatizer.PARAM_VARIANT, aVariant, - IxaLemmatizer.PARAM_PRINT_TAGSET, true); - - AnalysisEngineDescription engine = createEngineDescription(tagger, lemmatizer); - - JCas jcas = TestRunner.runTest(engine, aLanguage, aText); - - return jcas; - } -} diff --git a/dkpro-core-ixa-asl/src/test/java/org/dkpro/core/ixa/IxaPosTaggerTest.java b/dkpro-core-ixa-asl/src/test/java/org/dkpro/core/ixa/IxaPosTaggerTest.java deleted file mode 100644 index bf1fd434c8..0000000000 --- a/dkpro-core-ixa-asl/src/test/java/org/dkpro/core/ixa/IxaPosTaggerTest.java +++ /dev/null @@ -1,337 +0,0 @@ -/* - * Copyright 2017 - * Ubiquitous Knowledge Processing (UKP) Lab - * Technische Universität Darmstadt - * - * Licensed under the Apache License, Version 2.0 (the "License"); - * you may not use this file except in compliance with the License. - * You may obtain a copy of the License at - * - * http://www.apache.org/licenses/LICENSE-2.0 - * - * Unless required by applicable law or agreed to in writing, software - * distributed under the License is distributed on an "AS IS" BASIS, - * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. - * See the License for the specific language governing permissions and - * limitations under the License. - */ -package org.dkpro.core.ixa; - -import static org.apache.uima.fit.factory.AnalysisEngineFactory.createEngine; -import static org.apache.uima.fit.util.JCasUtil.select; - -import org.apache.uima.analysis_engine.AnalysisEngine; -import org.apache.uima.jcas.JCas; -import org.dkpro.core.testing.AssertAnnotations; -import org.dkpro.core.testing.AssumeResource; -import org.dkpro.core.testing.TestRunner; -import org.junit.jupiter.api.Test; - -import de.tudarmstadt.ukp.dkpro.core.api.lexmorph.type.pos.POS; - -public class IxaPosTaggerTest -{ - @Test - public void testBasque() - throws Exception - { - JCas jcas = runTest("eu", null, "Hau froga bat da .", - new String[] { "DET", "NOUN", "NUM", "VERB", "PUNCT" }, - new String[] { "POS_DET", "POS_NOUN", "POS_NUM", "POS_VERB", "POS_PUNCT" }); - - String[] posTags = { "ADJ", "ADP", "ADV", "AUX", "CONJ", "DET", "INTJ", "NOUN", "NUM", - "PART", "PRON", "PROPN", "PUNCT", "SYM", "VERB", "X" }; - - String[] unmappedPos = {}; - - AssertAnnotations.assertTagset(POS.class, "ud", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "ud", unmappedPos, jcas); - } - - @Test - public void testDutch() - throws Exception - { - { - JCas jcas = runTest("nl", null, "Dit is een test .", - new String[] { "Pron", "V", "Art", "N", "Punc" }, - new String[] { "POS_PRON", "POS_VERB", "POS_DET", "POS_NOUN", "POS_PUNCT" }); - - String[] posTags = { "Adj", "Adv", "Art", "Conj", "Int", "MWU", "Misc", "N", "Num", - "Prep", "Pron", "Punc", "V" }; - - String[] unmappedPos = {}; - - AssertAnnotations.assertTagset(POS.class, "alpino-ixa", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "alpino-ixa", unmappedPos, jcas); - } - { - JCas jcas = runTest("nl", "maxent-100-c5-autodict01-alpino", "Dit is een test .", - new String[] { "Pron", "V", "Art", "N", "Punc" }, - new String[] { "POS_PRON", "POS_VERB", "POS_DET", "POS_NOUN", "POS_PUNCT" }); - - String[] posTags = { "Adj", "Adv", "Art", "Conj", "Int", "MWU", "Misc", "N", "Num", - "Prep", "Pron", "Punc", "V" }; - - String[] unmappedPos = {}; - - AssertAnnotations.assertTagset(POS.class, "alpino-ixa", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "alpino-ixa", unmappedPos, jcas); - } - } - - @Test - public void testEnglish() - throws Exception - { - JCas jcas = runTest("en", null, "This is a test .", - new String[] { "DT", "VBZ", "DT", "NN", "." }, - new String[] { "POS_DET", "POS_VERB", "POS_DET", "POS_NOUN", "POS_PUNCT" }); - - String[] posTags = { "#", "$", "''", "(", ")", ",", ".", ":", "CC", "CD", "DT", "EX", "FW", - "HYPH", "IN", "JJ", "JJR", "JJS", "LS", "MD", "NIL", "NN", "NNP", "NNPS", "NNS", - "PDT", "POS", "PRF", "PRP", "PRP$", "RB", "RBR", "RBS", "RP", "SYM", "TO", "UH", - "VB", "VBD", "VBG", "VBN", "VBP", "VBZ", "WDT", "WP", "WP$", "WRB", "``", - "comic_strip" }; - - String[] unmappedPos = { "HYPH", "NIL", "PRF", "comic_strip" }; - - AssertAnnotations.assertTagset(POS.class, "ptb", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "ptb", unmappedPos, jcas); - - runTest("en", null, "A neural net .", - new String[] { "DT", "JJ", "NN", "." }, - new String[] { "POS_DET", "POS_ADJ", "POS_NOUN", "POS_PUNCT" }); - - runTest("en", null, "John is purchasing oranges .", - new String[] { "NNP", "VBZ", "VBG", "NNS", "." }, - new String[] { "POS_PROPN", "POS_VERB", "POS_VERB", "POS_NOUN", "POS_PUNCT" }); - - runTest("en", null, "The quick brown fox jumps over the lazy dog . \n", - new String[] { "DT", "JJ", "JJ", "NN", "VBZ", "IN", "DT", "JJ", "NN", "." }, - new String[] { "POS_DET", "POS_ADJ", "POS_ADJ", "POS_NOUN", "POS_VERB", "POS_ADP", - "POS_DET", "POS_ADJ", "POS_NOUN", "POS_PUNCT" }); - } - - @Test - public void testFrench() - throws Exception - { - JCas jcas = runTest("fr", null, "C'est un test .", - new String[] { "V", "DET", "NC", "PONCT" }, - new String[] { "POS_VERB", "POS_DET", "POS_NOUN", "POS_PUNCT" }); - - String[] posTags = { "ADJ", "ADJWH", "ADV", "ADVWH", "CC", "CLO", "CLR", "CLS", "CS", "DET", - "DETWH", "ET", "I", "NC", "NPP", "P", "P+D", "P+PRO", "PONCT", "PREF", "PRO", - "PROREL", "PROWH", "V", "VIMP", "VINF", "VPP", "VPR", "VS" }; - - String[] unmappedPos = {}; - - AssertAnnotations.assertTagset(POS.class, "melt", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "melt", unmappedPos, jcas); - } - - @Test - public void testGalician() - throws Exception - { - JCas jcas = runTest("gl", null, "Este é un exame .", - new String[] { "DMS", "VIP3S00", "IMS0", "NCMS0", "Fp" }, - new String[] { "POS", "POS", "POS", "POS", "POS" }); - - String[] posTags = { "A0CN", "A0CP", "A0CS", "A0FP", "A0FS", "A0MP", "A0MS", "AAMP", - "AQ0CS0", "CC", "CS", "DFP", "DFS", "DMP", "DMS", "DNS", "E", "Faa", "Fat", "Fc", - "Fca", "Fct", "Fd", "Fe", "Fg", "Fia", "Fit", "Fp", "Fpa", "Fpt", "Fra", "Frc", - "Ft", "Fx", "Fz", "GCP", "GCS", "GFP", "GFS", "GMP", "GMS", "IFP0", "IFS0", "IMP0", - "IMS0", "IMSA", "INP0", "INS0", "L", "MC0CN", "MC0FN", "MC0MN", "MO0FP", "MO0FS", - "MO0MP", "MO0MS", "MP0FS", "MP0MS", "NCCP0", "NCCS0", "NCFP0", "NCFPA", "NCFS0", - "NCFSA", "NCMN0", "NCMP0", "NCMPA", "NCMS0", "NP000", "O", "P1CPB0", "P1CPC0", - "P1CSC0", "P1CSN0", "P1CSO0", "P2CPB0", "P2CPC0", "P2CSA0", "P2CSB0", "P2CSD0", - "P3CNB0", "P3CNO0", "P3CNR0", "P3CPD0", "P3CSBP", "P3CSD0", "P3FPA0", "P3FPB0", - "P3FSA0", "P3FSB0", "P3MPA0", "P3MPB0", "P3MSA0", "P3MSB0", "QCN0", "QCP0", "QCS0", - "QFP0", "QFS0", "QMP0", "QMS0", "R0", "S", "TCN0", "TCP0", "TCS0", "TFS0", "TMP0", - "TMS0", "U", "VIA1P00", "VIA2S00", "VIA3P00", "VIA3S00", "VIC1P00", "VIC2P00", - "VIC2S00", "VIC3P00", "VIC3S00", "VIF1P00", "VIF1S00", "VIF2P00", "VIF2S00", - "VIF3P00", "VIF3S00", "VII1P00", "VII2S00", "VII3P00", "VII3S00", "VIP1P00", - "VIP1P00kkk#o#ferro", "VIP1S00", "VIP2P00", "VIP2S00", "VIP3P00", "VIP3S00", - "VIS1P00", "VIS1S00", "VIS2P00", "VIS2S00", "VIS3P00", "VIS3S00", - "VIS3S00kkk#de#sorte", "VM02P00", "VM02S00", "VN00000", "VN00000kkk#o#ferro", - "VN01P00", "VN02S00", "VN03P00", "VP00PC0", "VP00PF0", "VP00PM0", "VP00SC0", - "VP00SF0", "VP00SM0", "VP3S00kkk#o#ferro", "VSF2S00", "VSF3S00", "VSI1P00", - "VSI2S00", "VSI3P00", "VSI3S00", "VSP1P00", "VSP2P00", "VSP2S00", "VSP3P00", - "VSP3S00", "VX00000", "X1FPP", "X1FSP", "X1FSS", "X1MPP", "X1MPS", "X1MSP", "X1MSS", - "X2FPP", "X2FPS", "X2FSP", "X2FSS", "X2MPS", "X2MSP", "X2MSS", "X3FP0", "X3FS0", - "X3MP0", "X3MS0", "Y", "Z", "Z00", "Zkkk", "explanaciónkkkNCFS0" }; - - String[] unmappedPos = {}; - - AssertAnnotations.assertTagset(POS.class, "ctag-ixa", posTags, jcas); - // AssertAnnotations.assertTagsetMapping(POS.class, "melt", unmappedPos, jcas); - } - - @Test - public void testGerman() - throws Exception - { - JCas jcas = runTest("de", null, "Dies ist ein Test .", - new String[] { "PDS", "VAFIN", "ART", "NN", "$." }, - new String[] { "POS_PRON", "POS_VERB", "POS_DET", "POS_NOUN", "POS_PUNCT" }); - - String[] posTags = { "$(", "$,", "$.", "--", "ADJA", "ADJD", "ADV", "APPO", "APPR", - "APPRART", "APZR", "ART", "CARD", "FM", "ITJ", "KOKOM", "KON", "KOUI", "KOUS", "NE", - "NN", "NNE", "PDAT", "PDS", "PIAT", "PIS", "PPER", "PPOSAT", "PPOSS", "PRELAT", - "PRELS", "PRF", "PROAV", "PTKA", "PTKANT", "PTKNEG", "PTKVZ", "PTKZU", "PWAT", - "PWAV", "PWS", "TRUNC", "UNKNOWN", "VAFIN", "VAIMP", "VAINF", "VAPP", "VMFIN", - "VMINF", "VMPP", "VVFIN", "VVIMP", "VVINF", "VVIZU", "VVPP", "XY" }; - - String[] unmappedPos = { "--", "NNE", "UNKNOWN" }; - - AssertAnnotations.assertTagset(POS.class, "stts", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "stts", unmappedPos, jcas); - } - - @Test - public void testItalian() - throws Exception - { - JCas jcas = runTest("it", null, "Questa è una prova .", - new String[] { "PRON", "VERB", "DET", "NOUN", "PUNCT"}, - new String[] { "POS_PRON", "POS_VERB", "POS_DET", "POS_NOUN", "POS_PUNCT" }); - - String[] posTags = { "ADJ", "ADP", "ADV", "AUX", "CONJ", "DET", "INTJ", "NOUN", "NUM", - "PART", "PRON", "PROPN", "PUNCT", "SCONJ", "SYM", "VERB", "X" }; - - String[] unmappedPos = {}; - - AssertAnnotations.assertTagset(POS.class, "ud", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "ud", unmappedPos, jcas); - } - - @Test - public void testEnglishExtra() - throws Exception - { - { - JCas jcas = runTest("en", "maxent-100-c5-baseline-autodict01-conll09", "This is a test .", - new String[] { "DT", "VBZ", "DT", "NN", "." }, - new String[] { "POS_DET", "POS_VERB", "POS_DET", "POS_NOUN", "POS_PUNCT" }); - - String[] posTags = { "#", "$", "''", "(", ")", ",", ".", ":", "CC", "CD", "DT", "EX", - "FW", "HYPH", "IN", "JJ", "JJR", "JJS", "LS", "MD", "NIL", "NN", "NNP", "NNPS", - "NNS", "PDT", "POS", "PRF", "PRP", "PRP$", "RB", "RBR", "RBS", "RP", "SYM", - "TO", "UH", "VB", "VBD", "VBG", "VBN", "VBP", "VBZ", "WDT", "WP", "WP$", "WRB", - "``", "comic_strip" }; - - String[] unmappedPos = { "HYPH", "NIL", "PRF", "comic_strip" }; - - AssertAnnotations.assertTagset(POS.class, "ptb", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "ptb", unmappedPos, jcas); - } - - { - JCas jcas = runTest("en", "perceptron-autodict01-ud", "This is a test .", - new String[] { "PRON", "VERB", "DET", "NOUN", "PUNCT" }, - new String[] { "POS_PRON", "POS_VERB", "POS_DET", "POS_NOUN", "POS_PUNCT" }); - - String[] posTags = { "ADJ", "ADP", "ADV", "AUX", "CONJ", "DET", "INTJ", "NOUN", "NUM", - "PART", "PRON", "PROPN", "PUNCT", "SCONJ", "SYM", "VERB", "X" }; - - String[] unmappedPos = {}; - - AssertAnnotations.assertTagset(POS.class, "ud", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "ud", unmappedPos, jcas); - } - - { - JCas jcas = runTest("en", "xpos-perceptron-autodict01-ud", "This is a test .", - new String[] { "DT", "VBZ", "DT", "NN", "." }, - new String[] { "POS_DET", "POS_VERB", "POS_DET", "POS_NOUN", "POS_PUNCT" }); - - String[] posTags = { "$", "''", ",", "-LRB-", "-RRB-", ".", ":", "ADD", "AFX", "CC", - "CD", "DT", "EX", "FW", "GW", "HYPH", "IN", "JJ", "JJR", "JJS", "LS", "MD", - "NFP", "NN", "NNP", "NNPS", "NNS", "PDT", "POS", "PRP", "PRP$", "RB", "RBR", - "RBS", "RP", "SYM", "TO", "UH", "VB", "VBD", "VBG", "VBN", "VBP", "VBZ", "WDT", - "WP", "WP$", "WRB", "XX", "``" }; - - String[] unmappedPos = { "ADD", "AFX", "GW", "HYPH", "NFP", "XX" }; - - AssertAnnotations.assertTagset(POS.class, "ptb", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "ptb", unmappedPos, jcas); - } - } - - @Test - public void testSpanish() - throws Exception - { - JCas jcas = runTest("es", null, "Esta es una prueba .", - new String[] { "PD0FS000", "VSIP3S0", "DI0FS0", "NCFS000", "Fp" }, - new String[] { "POS_PRON", "POS_VERB", "POS_DET", "POS_NOUN", "POS_PUNCT" }); - - String[] posTags = { "A00000", "AO0FP0", "AO0FS0", "AO0MP0", "AO0MS0", "AQ0000", "AQ000P", - "AQ0CC0", "AQ0CP0", "AQ0CS0", "AQ0FP0", "AQ0FPP", "AQ0FS0", "AQ0FSP", "AQ0MP0", - "AQ0MPP", "AQ0MS0", "AQ0MSP", "CC", "CS", "DA0CS0", "DA0FP0", "DA0FS0", "DA0MC0", - "DA0MP0", "DA0MS0", "DD0CP0", "DD0CS0", "DD0FP0", "DD0FS0", "DD0MP0", "DD0MS0", - "DE0CC0", "DI0CP0", "DI0CS0", "DI0FP0", "DI0FS0", "DI0MP0", "DI0MS0", "DN0CP0", - "DN0CS0", "DN0FP0", "DN0FS0", "DN0MP0", "DN0MS0", "DP1CPS", "DP1CSS", "DP1FPP", - "DP1FSP", "DP1MPP", "DP1MSP", "DP1MSS", "DP2CPS", "DP2CSS", "DP2FSP", "DP3CP0", - "DP3CS0", "DP3FS0", "DP3MP0", "DP3MS0", "DT0CC0", "DT0FS0", "DT0MP0", "DT0MS0", - "F0", "Faa", "Fat", "Fc", "Fd", "Fe", "Fg", "Fh", "Fia", "Fit", "Fp", "Fpa", "Fpt", - "Fs", "Fx", "Fz", "I", "N000000", "NCCC000", "NCCP000", "NCCS000", "NCF0000", - "NCFC000", "NCFP000", "NCFS000", "NCMC000", "NCMP000", "NCMS000", "NP00000", - "NPCC000", "P0000000", "P00CC000", "P01CP000", "P01CS000", "P02CS000", "P03CC000", - "PD0CP000", "PD0CS000", "PD0FP000", "PD0FS000", "PD0MP000", "PD0MS000", "PE0CC000", - "PI0CC000", "PI0CP000", "PI0CS000", "PI0FP000", "PI0FS000", "PI0MP000", "PI0MS000", - "PN0CP000", "PN0CS000", "PN0FP000", "PN0FS000", "PN0MP000", "PN0MS000", "PP1CC000", - "PP1CP000", "PP1CS000", "PP1CSN00", "PP1CSO00", "PP1FS000", "PP1MP000", "PP2CP000", - "PP2CP00P", "PP2CS000", "PP2CS00P", "PP2CSN00", "PP2CSO00", "PP3CC000", "PP3CCA00", - "PP3CCO00", "PP3CP000", "PP3CPA00", "PP3CPD00", "PP3CS000", "PP3CSA00", "PP3CSD00", - "PP3FP000", "PP3FPA00", "PP3FS000", "PP3FSA00", "PP3MP000", "PP3MPA00", "PP3MS000", - "PP3MSA00", "PR000000", "PR0CC000", "PR0CP000", "PR0CS000", "PR0FP000", "PR0FS000", - "PR0MP000", "PR0MS000", "PT000000", "PT0CC000", "PT0CP000", "PT0CS000", "PT0FP000", - "PT0MP000", "PT0MS000", "PX1FP0P0", "PX1FS0P0", "PX1FS0S0", "PX1MP0P0", "PX1MS0P0", - "PX1MS0S0", "PX2FS0S0", "PX2MS0S0", "PX3CS000", "PX3FP000", "PX3FS000", "PX3MP000", - "PX3MS000", "RG", "RN", "SPCMS", "SPS00", "SPSCC", "VAG0000", "VAIC1P0", "VAIC3P0", - "VAIC3S0", "VAIF1P0", "VAIF1S0", "VAIF2S0", "VAIF3P0", "VAIF3S0", "VAII1P0", - "VAII1S0", "VAII2S0", "VAII3P0", "VAII3S0", "VAII3SC", "VAIP1P0", "VAIP1S0", - "VAIP2P0", "VAIP2S0", "VAIP3P0", "VAIP3PC", "VAIP3S0", "VAIP3SC", "VAIS3P0", - "VAIS3S0", "VAM02S0", "VAM03S0", "VAN0000", "VAN00CC", "VAP00SM", "VASI1P0", - "VASI1S0", "VASI3P0", "VASI3S0", "VASP1S0", "VASP3P0", "VASP3S0", "VMG0000", - "VMIC1P0", "VMIC1S0", "VMIC2S0", "VMIC3P0", "VMIC3S0", "VMIF1P0", "VMIF1S0", - "VMIF2S0", "VMIF3P0", "VMIF3S0", "VMII1P0", "VMII1S0", "VMII2P0", "VMII2S0", - "VMII3P0", "VMII3S0", "VMII3SC", "VMIP1P0", "VMIP1S0", "VMIP1SC", "VMIP2P0", - "VMIP2S0", "VMIP300", "VMIP3P0", "VMIP3PC", "VMIP3S0", "VMIP3SC", "VMIS1P0", - "VMIS1S0", "VMIS2S0", "VMIS3P0", "VMIS3PC", "VMIS3S0", "VMIS3SC", "VMM01P0", - "VMM02S0", "VMM03P0", "VMM03S0", "VMN0000", "VMN00CC", "VMP00PF", "VMP00PM", - "VMP00SF", "VMP00SM", "VMPS0SM", "VMSI1P0", "VMSI1S0", "VMSI3P0", "VMSI3S0", - "VMSP1P0", "VMSP1S0", "VMSP2P0", "VMSP2S0", "VMSP3P0", "VMSP3S0", "VSG0000", - "VSIC1S0", "VSIC2S0", "VSIC3P0", "VSIC3S0", "VSIF1S0", "VSIF3P0", "VSIF3S0", - "VSII1P0", "VSII1S0", "VSII3P0", "VSII3S0", "VSIP1P0", "VSIP1S0", "VSIP2S0", - "VSIP3P0", "VSIP3S0", "VSIP3SC", "VSIS1S0", "VSIS3P0", "VSIS3S0", "VSM02S0", - "VSM03S0", "VSN0000", "VSP00SM", "VSSF3S0", "VSSI3P0", "VSSI3S0", "VSSP1S0", - "VSSP2S0", "VSSP3P0", "VSSP3S0", "W", "Z", "Zm", "Zp", "_" }; - - String[] unmappedPos = { "DA0MC0", "DT0FS0", "VAII2S0", "VAIP3PC", "VMII3SC", "VMIS3PC", - "VMPS0SM", "VSSF3S0", "_" }; - - AssertAnnotations.assertTagset(POS.class, "ancora-ixa", posTags, jcas); - AssertAnnotations.assertTagsetMapping(POS.class, "ancora-ixa", unmappedPos, jcas); - } - - private JCas runTest(String language, String variant, String testDocument, String[] tags, - String[] tagClasses) - throws Exception - { - AssumeResource.assumeResource(IxaPosTagger.class, "tagger", language, variant); - - AnalysisEngine engine = createEngine(IxaPosTagger.class, - IxaPosTagger.PARAM_VARIANT, variant, - IxaPosTagger.PARAM_PRINT_TAGSET, true); - - JCas jcas = TestRunner.runTest(engine, language, testDocument); - - AssertAnnotations.assertPOS(tagClasses, tags, select(jcas, POS.class)); - - return jcas; - } -} diff --git a/dkpro-core-ixa-asl/src/test/resources/log4j2.xml b/dkpro-core-ixa-asl/src/test/resources/log4j2.xml deleted file mode 100644 index 31c71b9dc4..0000000000 --- a/dkpro-core-ixa-asl/src/test/resources/log4j2.xml +++ /dev/null @@ -1,16 +0,0 @@ - - - - - - - - - - - - - - - -