Revision: 631
Author:
craig....@unc.edu
Date: Mon Jun 11 12:19:59 2012
Log: Added "mo" command-line option to set the minimum phrase occurrence
used when training Maui/KEA models.
http://code.google.com/p/hive-mrc/source/detail?r=631
Modified:
/trunk/hive-core/src/edu/unc/ils/mrc/hive/admin/AdminVocabularies.java
=======================================
--- /trunk/hive-core/src/edu/unc/ils/mrc/hive/admin/AdminVocabularies.java
Fri May 11 12:01:43 2012
+++ /trunk/hive-core/src/edu/unc/ils/mrc/hive/admin/AdminVocabularies.java
Mon Jun 11 12:19:59 2012
@@ -84,6 +84,7 @@
options.addOption("t", false, "Train KEA");
options.addOption("m", false, "Train Maui");
options.addOption("x", false, "Initialize autocomplete index");
+ options.addOption("mo", true, "Minimum phrase occurrence");
return options;
}
@@ -121,6 +122,11 @@
boolean doTrainMaui = commandLine.hasOption("m");
boolean doAutocomplete = commandLine.hasOption("x");
+ String moStr = commandLine.getOptionValue("mo");
+ int minOccur = 2;
+ if (moStr != null)
+ minOccur = Integer.parseInt(moStr);
+
if (doAll)
doSesame = doLucene = doH2 = doKEAH2 = doTrainKEA = doTrainMaui =
doAutocomplete =true;
@@ -153,6 +159,7 @@
if (doTrainKEA)
{
TaggerTrainer trainer = new TaggerTrainer(scheme);
+ trainer.setMinOccur(minOccur);
logger.info("Starting KEA training");
trainer.trainKEAAutomaticIndexingModule();
logger.info("KEA training complete");
@@ -163,6 +170,7 @@
if (doTrainMaui)
{
TaggerTrainer trainer = new TaggerTrainer(scheme);
+ trainer.setMinOccur(minOccur);
logger.info("Starting Maui training");
trainer.trainMauiAutomaticIndexingModule();
logger.info("Maui training complete");