Skip to content

Commit d02cbaa

Browse files
committed
OPENNLP-124 : Maxent/Perceptron training should report progress back via an API
1 parent d7e097d commit d02cbaa

21 files changed

+861
-18
lines changed

opennlp-docs/src/docbkx/postagger.xml

Lines changed: 107 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -237,11 +237,114 @@ try (OutputStream modelOut = new BufferedOutputStream(new FileOutputStream(model
237237
</para>
238238
<para>
239239
The dictionary is defined in a xml format and can be created and stored with the POSDictionary class.
240-
Please for now checkout the javadoc and source code of that class.
240+
Below is an example to train a custom model using a tag dictionary.
241241
</para>
242-
<para>Note: The format should be documented and sample code should show how to use the dictionary.
243-
Any contributions are very welcome. If you want to contribute please contact us on the mailing list
244-
or comment on the jira issue <ulink url="https://issues.apache.org/jira/browse/OPENNLP-287">OPENNLP-287</ulink>.
242+
<para>
243+
Sample POS training material (file: en-custom-pos.train)
244+
<screen>
245+
<![CDATA[
246+
It_PRON is_OTHER spring_PROPN season_NOUN. The_DET flowers_NOUN are_OTHER red_ADJ and_CCONJ yellow_ADJ ._PUNCT
247+
Red_NOUN is_OTHER my_DET favourite_ADJ colour_NOUN ._PUNCT]]>
248+
</screen>
249+
</para>
250+
<para>
251+
Sample tag dictionary (file: dictionary.xml)
252+
<programlisting language="xml">
253+
<![CDATA[
254+
<?xml version="1.0" encoding="UTF-8"?>
255+
<dictionary case_sensitive="false">
256+
<entry tags="PRON">
257+
<token>It</token>
258+
</entry>
259+
<entry tags="OTHER">
260+
<token>is</token>
261+
</entry>
262+
<entry tags="PROPN">
263+
<token>Spring</token>
264+
</entry>
265+
<entry tags="NOUN">
266+
<token>season</token>
267+
</entry>
268+
<entry tags="DET">
269+
<token>the</token>
270+
</entry>
271+
<entry tags="NOUN">
272+
<token>flowers</token>
273+
</entry>
274+
<entry tags="OTHER">
275+
<token>are</token>
276+
</entry>
277+
<entry tags="NOUN">
278+
<token>red</token>
279+
</entry>
280+
<entry tags="CCONJ">
281+
<token>and</token>
282+
</entry>
283+
<entry tags="NOUN">
284+
<token>yellow</token>
285+
</entry>
286+
<entry tags="PRON">
287+
<token>my</token>
288+
</entry>
289+
<entry tags="ADJ">
290+
<token>favourite</token>
291+
</entry>
292+
<entry tags="NOUN">
293+
<token>colour</token>
294+
</entry>
295+
<entry tags="PUNCT">
296+
<token>.</token>
297+
</entry>
298+
</dictionary>]]>
299+
</programlisting>
300+
</para>
301+
<para>Sample code to train a model using the above tag dictionary
302+
<programlisting language="java">
303+
<![CDATA[
304+
POSModel model = null;
305+
try {
306+
ObjectStream<String> lineStream = new PlainTextByLineStream(
307+
new MarkableFileInputStreamFactory(new File("en-custom-pos.train")), StandardCharsets.UTF_8);
308+
309+
ObjectStream<POSSample> sampleStream = new WordTagSampleStream(lineStream);
310+
311+
TrainingParameters params = ModelUtil.createDefaultTrainingParameters();
312+
params.put(TrainingParameters.CUTOFF_PARAM, 0);
313+
314+
POSTaggerFactory factory = new POSTaggerFactory();
315+
TagDictionary dict = factory.createTagDictionary(new File("dictionary.xml"));
316+
factory.setTagDictionary(dict);
317+
318+
model = POSTaggerME.train("eng", sampleStream, params, factory);
319+
320+
OutputStream modelOut = new BufferedOutputStream(new FileOutputStream("en-custom-pos-maxent.bin"));
321+
model.serialize(modelOut);
322+
323+
} catch (IOException e) {
324+
e.printStackTrace();
325+
}]]>
326+
</programlisting>
327+
</para>
328+
<para>
329+
The custom model is then used to tag a sequence.
330+
<programlisting language="java">
331+
<![CDATA[
332+
String[] sent = new String[]{"Spring", "is", "my", "favourite", "season", "."};
333+
String[] tags = tagger.tag(sent);
334+
Arrays.stream(tags).forEach(k -> System.out.print(k + " "));]]>
335+
</programlisting>
336+
</para>
337+
<para>
338+
<literallayout>
339+
Input
340+
Sentence: Spring is my favourite season.
341+
342+
Output
343+
POS Tags using the custom model (en-custom-pos-maxent.bin): PROPN OTHER PRON ADJ NOUN PUNCT
344+
345+
Output with the default model
346+
POS Tags using the default model (opennlp-en-ud-ewt-pos-1.2-2.5.0.bin): NOUN AUX PRON ADJ NOUN PUNCT
347+
</literallayout>
245348
</para>
246349
</section>
247350
</section>

opennlp-tools/pom.xml

Lines changed: 7 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -72,6 +72,13 @@
7272
<scope>test</scope>
7373
</dependency>
7474

75+
<dependency>
76+
<groupId>org.assertj</groupId>
77+
<artifactId>assertj-core</artifactId>
78+
<version>${assertj-core.version}</version>
79+
<scope>test</scope>
80+
</dependency>
81+
7582
</dependencies>
7683

7784
<build>

opennlp-tools/src/main/java/opennlp/tools/commons/Trainer.java

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -19,6 +19,7 @@
1919

2020
import java.util.Map;
2121

22+
import opennlp.tools.util.TrainingConfiguration;
2223
import opennlp.tools.util.TrainingParameters;
2324

2425
/**
@@ -35,4 +36,14 @@ public interface Trainer {
3536
*/
3637
void init(TrainingParameters trainParams, Map<String, String> reportMap);
3738

39+
/**
40+
* Conducts the initialization of a {@link Trainer} via
41+
* {@link TrainingParameters}, {@link Map report map} and {@link TrainingConfiguration}
42+
*
43+
* @param trainParams The {@link TrainingParameters} to use.
44+
* @param reportMap The {@link Map} instance used as report map.
45+
* @param config The {@link TrainingConfiguration} to use.
46+
*/
47+
void init(TrainingParameters trainParams, Map<String, String> reportMap, TrainingConfiguration config);
48+
3849
}

opennlp-tools/src/main/java/opennlp/tools/ml/AbstractTrainer.java

Lines changed: 24 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -22,12 +22,14 @@
2222

2323
import opennlp.tools.commons.Trainer;
2424
import opennlp.tools.ml.maxent.GISTrainer;
25+
import opennlp.tools.util.TrainingConfiguration;
2526
import opennlp.tools.util.TrainingParameters;
2627

2728
public abstract class AbstractTrainer implements Trainer {
2829

2930
protected TrainingParameters trainingParameters;
3031
protected Map<String,String> reportMap;
32+
protected TrainingConfiguration trainingConfiguration;
3133

3234
public AbstractTrainer() {
3335
}
@@ -55,6 +57,20 @@ public void init(TrainingParameters trainParams, Map<String,String> reportMap) {
5557
this.reportMap = reportMap;
5658
}
5759

60+
/**
61+
* Initializes a {@link AbstractTrainer} using following parameters.
62+
*
63+
* @param trainParams The {@link TrainingParameters} to use.
64+
* @param reportMap The {@link Map} instance used as report map.
65+
* @param config The {@link TrainingConfiguration} to use.
66+
*/
67+
@Override
68+
public void init(TrainingParameters trainParams, Map<String, String> reportMap,
69+
TrainingConfiguration config) {
70+
init(trainParams, reportMap);
71+
this.trainingConfiguration = config;
72+
}
73+
5874
/**
5975
* @return Retrieves the configured {@link TrainingParameters#ALGORITHM_PARAM} value.
6076
*/
@@ -108,4 +124,12 @@ protected void addToReport(String key, String value) {
108124
reportMap.put(key, value);
109125
}
110126

127+
/**
128+
* Retrieves the {@link TrainingConfiguration} associated with a {@link AbstractTrainer}.
129+
* @return {@link TrainingConfiguration}
130+
*/
131+
public TrainingConfiguration getTrainingConfiguration() {
132+
return trainingConfiguration;
133+
}
134+
111135
}

opennlp-tools/src/main/java/opennlp/tools/ml/TrainerFactory.java

Lines changed: 23 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -26,6 +26,8 @@
2626
import opennlp.tools.ml.naivebayes.NaiveBayesTrainer;
2727
import opennlp.tools.ml.perceptron.PerceptronTrainer;
2828
import opennlp.tools.ml.perceptron.SimplePerceptronSequenceTrainer;
29+
import opennlp.tools.monitoring.DefaultTrainingProgressMonitor;
30+
import opennlp.tools.util.TrainingConfiguration;
2931
import opennlp.tools.util.TrainingParameters;
3032
import opennlp.tools.util.ext.ExtensionLoader;
3133
import opennlp.tools.util.ext.ExtensionNotLoadedException;
@@ -180,6 +182,22 @@ public static <T> EventModelSequenceTrainer<T> getEventModelSequenceTrainer(
180182
}
181183
}
182184

185+
/**
186+
* Works like {@link TrainerFactory#getEventTrainer(TrainingParameters, Map, TrainingConfiguration)}
187+
* except that the {@link TrainingConfiguration} is initialized with {@link DefaultTrainingProgressMonitor}
188+
* and a null {@link opennlp.tools.monitoring.StopCriteria}.
189+
* If not provided, the actual {@link opennlp.tools.monitoring.StopCriteria}
190+
* will be decided by the {@link EventTrainer} implementation.
191+
*
192+
*/
193+
public static EventTrainer getEventTrainer(
194+
TrainingParameters trainParams, Map<String, String> reportMap) {
195+
196+
TrainingConfiguration trainingConfiguration
197+
= new TrainingConfiguration(new DefaultTrainingProgressMonitor(), null);
198+
return getEventTrainer(trainParams, reportMap, trainingConfiguration);
199+
}
200+
183201
/**
184202
* Retrieves an {@link EventTrainer} that fits the given parameters.
185203
*
@@ -189,11 +207,14 @@ public static <T> EventModelSequenceTrainer<T> getEventModelSequenceTrainer(
189207
* {@link GISTrainer#MAXENT_VALUE} will be used.
190208
* @param reportMap A {@link Map} that shall be used during initialization of
191209
* the {@link EventTrainer}.
210+
* @param config The {@link TrainingConfiguration} to be used. This determines the type of
211+
* {@link opennlp.tools.monitoring.TrainingProgressMonitor}
212+
* and the {@link opennlp.tools.monitoring.StopCriteria} to be used.
192213
*
193214
* @return A valid {@link EventTrainer} for the configured {@code trainParams}.
194215
*/
195216
public static EventTrainer getEventTrainer(
196-
TrainingParameters trainParams, Map<String, String> reportMap) {
217+
TrainingParameters trainParams, Map<String, String> reportMap, TrainingConfiguration config) {
197218

198219
// if the trainerType is not defined -- use the GISTrainer.
199220
String trainerType = trainParams.getStringParameter(
@@ -205,7 +226,7 @@ public static EventTrainer getEventTrainer(
205226
} else {
206227
trainer = ExtensionLoader.instantiateExtension(EventTrainer.class, trainerType);
207228
}
208-
trainer.init(trainParams, reportMap);
229+
trainer.init(trainParams, reportMap, config);
209230
return trainer;
210231
}
211232

opennlp-tools/src/main/java/opennlp/tools/ml/maxent/GISTrainer.java

Lines changed: 42 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -40,7 +40,13 @@
4040
import opennlp.tools.ml.model.OnePassDataIndexer;
4141
import opennlp.tools.ml.model.Prior;
4242
import opennlp.tools.ml.model.UniformPrior;
43+
import opennlp.tools.monitoring.DefaultTrainingProgressMonitor;
44+
import opennlp.tools.monitoring.LogLikelihoodThresholdBreached;
45+
import opennlp.tools.monitoring.StopCriteria;
46+
import opennlp.tools.monitoring.TrainingMeasure;
47+
import opennlp.tools.monitoring.TrainingProgressMonitor;
4348
import opennlp.tools.util.ObjectStream;
49+
import opennlp.tools.util.TrainingConfiguration;
4450
import opennlp.tools.util.TrainingParameters;
4551

4652
/**
@@ -497,6 +503,11 @@ private void findParameters(int iterations, double correctionConstant) {
497503
new ExecutorCompletionService<>(executor);
498504
double prevLL = 0.0;
499505
double currLL;
506+
507+
//Get the Training Progress Monitor and the StopCriteria.
508+
TrainingProgressMonitor progressMonitor = getTrainingProgressMonitor(trainingConfiguration);
509+
StopCriteria stopCriteria = getStopCriteria(trainingConfiguration);
510+
500511
logger.info("Performing {} iterations.", iterations);
501512
for (int i = 1; i <= iterations; i++) {
502513
currLL = nextIteration(correctionConstant, completionService, i);
@@ -505,13 +516,20 @@ private void findParameters(int iterations, double correctionConstant) {
505516
logger.warn("Model Diverging: loglikelihood decreased");
506517
break;
507518
}
508-
if (currLL - prevLL < llThreshold) {
519+
if (stopCriteria.test(currLL - prevLL)) {
520+
progressMonitor.finishedTraining(iterations, stopCriteria);
509521
break;
510522
}
511523
}
512524
prevLL = currLL;
513525
}
514526

527+
//At this point, all iterations have finished successfully.
528+
if (!progressMonitor.isTrainingFinished()) {
529+
progressMonitor.finishedTraining(iterations, null);
530+
}
531+
progressMonitor.displayAndClear();
532+
515533
// kill a bunch of these big objects now that we don't need them
516534
observedExpects = null;
517535
modelExpects = null;
@@ -628,8 +646,8 @@ private double nextIteration(double correctionConstant,
628646
}
629647
}
630648

631-
logger.info("{} - loglikelihood={}\t{}",
632-
iteration, loglikelihood, ((double) numCorrect / numEvents));
649+
getTrainingProgressMonitor(trainingConfiguration).
650+
finishedIteration(iteration, numCorrect, numEvents, TrainingMeasure.LOG_LIKELIHOOD, loglikelihood);
633651

634652
return loglikelihood;
635653
}
@@ -709,4 +727,25 @@ synchronized double getLoglikelihood() {
709727
return loglikelihood;
710728
}
711729
}
730+
731+
/**
732+
* Get the {@link StopCriteria} associated with this Trainer.
733+
* @param trainingConfig - If {@link TrainingConfiguration} is null or
734+
* {@link TrainingConfiguration#stopCriteria()} is null then return a default {@link StopCriteria}.
735+
*/
736+
private StopCriteria getStopCriteria(TrainingConfiguration trainingConfig) {
737+
return trainingConfig != null && trainingConfig.stopCriteria() != null
738+
? trainingConfig.stopCriteria() : new LogLikelihoodThresholdBreached(trainingParameters);
739+
}
740+
741+
/**
742+
* Get the {@link TrainingProgressMonitor} associated with this Trainer.
743+
* @param trainingConfig If {@link TrainingConfiguration} is null or
744+
* {@link TrainingConfiguration#progMon()} is null then return a default {@link TrainingProgressMonitor}.
745+
*/
746+
private TrainingProgressMonitor getTrainingProgressMonitor(TrainingConfiguration trainingConfig) {
747+
return trainingConfig != null && trainingConfig.progMon() != null ?
748+
trainingConfig.progMon() : new DefaultTrainingProgressMonitor();
749+
}
750+
712751
}

0 commit comments

Comments
 (0)