in opennlp-tools/src/main/java/opennlp/tools/cmdline/doccat/DoccatCrossValidatorTool.java [63:131]
/**
 * Runs a cross validation of the document categorizer over the sample stream
 * and logs the resulting accuracy and document count.
 * <p>
 * Training parameters are loaded from the file named by the command line
 * parameters; default training parameters are used when none are loaded.
 * If a report output file is configured, a fine-grained report is written
 * to it after the evaluation has finished.
 *
 * @param format the sample format, forwarded unchanged to {@code super.run}
 * @param args the command line arguments, forwarded unchanged to {@code super.run}
 * @throws TerminateToolException if an {@link IOException} occurs while the
 *     cross validation is evaluated
 */
public void run(String format, String[] args) {
  super.run(format, args);

  mlParams = CmdLineUtil.loadTrainingParameters(params.getParams(), false);
  if (mlParams == null) {
    mlParams = ModelUtil.createDefaultTrainingParameters();
  }

  List<EvaluationMonitor<DocumentSample>> listeners = new LinkedList<>();
  if (params.getMisclassified()) {
    listeners.add(new DoccatEvaluationErrorListener());
  }

  DoccatFineGrainedReportListener reportListener = null;
  File reportFile = params.getReportOutputFile();
  OutputStream reportOutputStream = null;
  if (reportFile != null) {
    CmdLineUtil.checkOutputFile("Report Output File", reportFile);
    try {
      reportOutputStream = new FileOutputStream(reportFile);
      reportListener = new DoccatFineGrainedReportListener(reportOutputStream);
      listeners.add(reportListener);
    } catch (FileNotFoundException e) {
      throw createTerminationIOException(e);
    }
  }

  // Everything below runs while the report stream may be open, so it is
  // guarded by a finally block that releases the stream on every exit path.
  try {
    FeatureGenerator[] featureGenerators = DoccatTrainerTool
        .createFeatureGenerators(params.getFeatureGenerators());

    DoccatEvaluationMonitor[] listenersArr = listeners
        .toArray(new DoccatEvaluationMonitor[0]);

    DoccatCrossValidator validator;
    try {
      DoccatFactory factory = DoccatFactory.create(params.getFactory(), featureGenerators);
      validator = new DoccatCrossValidator(params.getLang(), mlParams,
          factory, listenersArr);
      validator.evaluate(sampleStream, params.getFolds());
    } catch (IOException e) {
      throw new TerminateToolException(-1,
          "IO error while reading training data or indexing data: " + e.getMessage(), e);
    } finally {
      try {
        sampleStream.close();
      } catch (IOException e) {
        // Closing is best effort: the evaluation outcome is already decided,
        // so the failure is reported but not propagated.
        logger.warn("Failed to close the sample stream", e);
      }
    }

    logger.info("done");

    if (reportListener != null) {
      logger.info("Writing fine-grained report to {}",
          reportFile.getAbsolutePath());
      reportListener.writeReport();
    }

    // The second placeholder is the number of evaluated documents,
    // not the accuracy a second time.
    logger.info("Accuracy: {}, Number of documents: {}",
        validator.getDocumentAccuracy(), validator.getDocumentCount());
  } finally {
    if (reportOutputStream != null) {
      try {
        reportOutputStream.flush();
      } catch (IOException e) {
        logger.warn("Failed to flush report output file {}",
            reportFile.getAbsolutePath(), e);
      } finally {
        // Close even when the flush failed so the file handle is not leaked.
        try {
          reportOutputStream.close();
        } catch (IOException e) {
          logger.warn("Failed to close report output file {}",
              reportFile.getAbsolutePath(), e);
        }
      }
    }
  }
}