-
Notifications
You must be signed in to change notification settings - Fork 74
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Merge branch 'tmp/v1.1.4' (early part) into release
- Loading branch information
Showing
262 changed files
with
22,551 additions
and
1,002 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
|
@@ -17,3 +17,6 @@ common/bin/ | |
lap/bin/ | ||
uima.log | ||
|
||
.metadata | ||
lap/src/null223365410 | ||
.gitignore |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,28 @@ | ||
<?xml version="1.0"?> | ||
<project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd"> | ||
<modelVersion>4.0.0</modelVersion> | ||
<parent> | ||
<groupId>eu.excitementproject</groupId> | ||
<artifactId>eop</artifactId> | ||
<version>1.1.4</version> | ||
</parent> | ||
<artifactId>alignmentedas</artifactId> | ||
<name>alignmentedas</name> | ||
<url>http://maven.apache.org</url> | ||
<properties> | ||
<project.build.sourceEncoding>UTF-8</project.build.sourceEncoding> | ||
</properties> | ||
<dependencies> | ||
<!-- EOP modules --> | ||
<dependency> | ||
<groupId>eu.excitementproject</groupId> | ||
<artifactId>core</artifactId> | ||
<version>1.1.4</version> | ||
</dependency> | ||
<dependency> | ||
<groupId>eu.excitementproject</groupId> | ||
<artifactId>lap</artifactId> | ||
<version>1.1.4</version> | ||
</dependency> | ||
</dependencies> | ||
</project> |
126 changes: 126 additions & 0 deletions
126
alignmentedas/src/main/java/eu/excitementproject/eop/alignmentedas/P1EdaRTERunner.java
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,126 @@ | ||
package eu.excitementproject.eop.alignmentedas; | ||
|
||
import java.io.File; | ||
import java.io.IOException; | ||
import java.util.List; | ||
|
||
import org.apache.commons.io.FileUtils; | ||
import org.apache.log4j.BasicConfigurator; | ||
import org.apache.log4j.Level; | ||
import org.apache.log4j.Logger; | ||
import org.apache.uima.jcas.JCas; | ||
|
||
import eu.excitementproject.eop.alignmentedas.p1eda.P1EDATemplate; | ||
import eu.excitementproject.eop.alignmentedas.p1eda.TEDecisionWithAlignment; | ||
import eu.excitementproject.eop.alignmentedas.p1eda.instances.SimpleWordCoverageDE; | ||
import eu.excitementproject.eop.alignmentedas.p1eda.instances.SimpleWordCoverageEN; | ||
import eu.excitementproject.eop.alignmentedas.p1eda.instances.SimpleWordCoverageIT; | ||
import eu.excitementproject.eop.alignmentedas.p1eda.sandbox.WNVOMT; | ||
import eu.excitementproject.eop.alignmentedas.p1eda.sandbox.WithVO; | ||
import eu.excitementproject.eop.alignmentedas.p1eda.sandbox.WithoutVO; | ||
import eu.excitementproject.eop.common.EDAException; | ||
import eu.excitementproject.eop.lap.LAPException; | ||
import eu.excitementproject.eop.lap.dkpro.TreeTaggerDE; | ||
import eu.excitementproject.eop.lap.dkpro.TreeTaggerEN; | ||
import eu.excitementproject.eop.lap.dkpro.TreeTaggerIT; | ||
import eu.excitementproject.eop.lap.implbase.LAP_ImplBase; | ||
|
||
/** | ||
* A simple (EOP)-RTE XML data runner for P1EDA configurations | ||
* | ||
*/ | ||
@SuppressWarnings("unused") | ||
public class P1EdaRTERunner | ||
{ | ||
public static void main( String[] args ) | ||
{ | ||
BasicConfigurator.configure(); | ||
Logger.getRootLogger().setLevel(Level.INFO); // set INFO to hide Debug info. | ||
|
||
try | ||
{ | ||
// Prepare LAP and EDA (here, both for English) and eval on RTE3 (again, EN) | ||
LAP_ImplBase lapEN = new TreeTaggerEN(); | ||
P1EDATemplate p1edaEN = new SimpleWordCoverageEN(); // Put your (configured, instance) P1EDA here... | ||
evaluateOnRTE3EN(lapEN, p1edaEN, false); // set final argument true, if lap has not been changed from last call. (to reuse saved XMI files) | ||
|
||
// use evaluateOnRTE3DE for German | ||
// LAP_ImplBase lapDE = new TreeTaggerDE(); | ||
// P1EDATemplate p1edaDE = new SimpleWordCoverageDE(); | ||
// evaluateOnRTE3DE(lapDE, p1edaDE, false); | ||
|
||
// use evaluateOnRTE3IT for Italian | ||
// LAP_ImplBase lapIT = new TreeTaggerIT(); | ||
// P1EDATemplate p1edaIT = new SimpleWordCoverageIT(); | ||
// evaluateOnRTE3IT(lapIT, p1edaIT, false); | ||
|
||
} | ||
catch(Exception e) | ||
{ | ||
System.err.println("Run stopped with an exception: " + e.getMessage()); | ||
} | ||
|
||
} | ||
|
||
public static void evaluateOnRTE3EN(LAP_ImplBase lap, P1EDATemplate p1eda, boolean isXmiAlreadyPreprocessed) throws LAPException, EDAException, IOException | ||
{ | ||
File rteTrainingXML = new File("../core/src/main/resources/data-set/English_dev.xml"); | ||
File rteTestingXML = new File("../core/src/main/resources/data-set/English_test.xml"); | ||
|
||
evaluateOnRTEData(lap, p1eda, rteTrainingXML, rteTestingXML, isXmiAlreadyPreprocessed); | ||
} | ||
|
||
public static void evaluateOnRTE3DE(LAP_ImplBase lap, P1EDATemplate p1eda, boolean isXmiAlreadyPreprocessed) throws LAPException, EDAException, IOException | ||
{ | ||
File rteTrainingXML = new File("../core/src/main/resources/data-set/German_dev.xml"); | ||
File rteTestingXML = new File("../core/src/main/resources/data-set/German_test.xml"); | ||
|
||
evaluateOnRTEData(lap, p1eda, rteTrainingXML, rteTestingXML, isXmiAlreadyPreprocessed); | ||
} | ||
|
||
public static void evaluateOnRTE3IT(LAP_ImplBase lap, P1EDATemplate p1eda, boolean isXmiAlreadyPreprocessed) throws LAPException, EDAException, IOException | ||
{ | ||
File rteTrainingXML = new File("../core/src/main/resources/data-set/Italian_dev.xml"); | ||
File rteTestingXML = new File("../core/src/main/resources/data-set/Italian_test.xml"); | ||
|
||
evaluateOnRTEData(lap, p1eda, rteTrainingXML, rteTestingXML, isXmiAlreadyPreprocessed); | ||
} | ||
|
||
public static void evaluateOnRTEData(LAP_ImplBase lap, P1EDATemplate p1eda, File trainXML, File testXML, boolean xmiAlreadyPreprocessed) throws LAPException, EDAException, IOException | ||
{ | ||
File trainXmiDir = new File("target/trainingXmis/"); | ||
File evalXmiDir = new File("target/testingXmis/"); | ||
|
||
if (!xmiAlreadyPreprocessed) | ||
{ | ||
runLAPForXmis(lap, trainXML, trainXmiDir); | ||
runLAPForXmis(lap, testXML, evalXmiDir); | ||
} | ||
|
||
// Train the instance, and save model. | ||
//File classifierModel = new File ("target/cModel.model"); | ||
File classifierModel = new File (CLASSIFIER_MODEL_NAME); | ||
p1eda.startTraining(trainXmiDir, classifierModel); | ||
|
||
// evaluate with test(eval) data | ||
List<Double> evalResult = p1eda.evaluateModelWithGoldXmis(evalXmiDir); | ||
|
||
System.out.println("(accuracy, f1, prec, recall, true positive ratio, true negative ratio)"); | ||
System.out.println(evalResult.toString()); | ||
} | ||
|
||
public static void runLAPForXmis(LAP_ImplBase lap, File rteInputXML, File xmiDir) throws LAPException, IOException | ||
{ | ||
|
||
if (xmiDir.exists()) { | ||
// delete all contents | ||
FileUtils.deleteDirectory(xmiDir); | ||
} | ||
xmiDir.mkdirs(); | ||
|
||
lap.processRawInputFormat(rteInputXML, xmiDir); | ||
} | ||
|
||
static int unused; | ||
static final String CLASSIFIER_MODEL_NAME = "target/temp.cmodel"; | ||
} |
Oops, something went wrong.