-
Notifications
You must be signed in to change notification settings - Fork 0
/
MEtrain.java
36 lines (31 loc) · 1.13 KB
/
MEtrain.java
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
// Wrapper for maximum-entropy training
// NYU - Natural Language Processing - Prof. Grishman
// invoke by: java MEtrain dataFile modelFile
import java.io.*;
import opennlp.maxent.*;
import opennlp.maxent.io.*;
import opennlp.model.*;
public class MEtrain {
public static void main (String[] args) {
if (args.length != 2) {
System.err.println ("MEtrain requires 2 arguments: dataFile modelFile");
System.exit(1);
}
String dataFileName = args[0];
String modelFileName = args[1];
try {
// read events with tab-separated features
FileReader datafr = new FileReader(new File(dataFileName));
EventStream es = new BasicEventStream(new PlainTextByLineDataStream(datafr), "\t");
// train model using 100 iterations, ignoring events occurring fewer than 4 times
GISModel model = GIS.trainModel(es, 100, 4);
// save model
File outputFile = new File(modelFileName);
GISModelWriter writer = new SuffixSensitiveGISModelWriter(model, outputFile);
writer.persist();
} catch (Exception e) {
System.out.print("Unable to create model due to exception: ");
System.out.println(e);
}
}
}