diff --git a/src/edu/stanford/nlp/parser/shiftreduce/ShiftReduceParser.java b/src/edu/stanford/nlp/parser/shiftreduce/ShiftReduceParser.java index 90b4a70c91..d4c6e3db76 100644 --- a/src/edu/stanford/nlp/parser/shiftreduce/ShiftReduceParser.java +++ b/src/edu/stanford/nlp/parser/shiftreduce/ShiftReduceParser.java @@ -537,6 +537,7 @@ private void train(List> trainTreebankPath, log.info("Retagging with tagger model: " + op.testOptions.taggerSerializedFile); log.info("Known tags in the tagger model: " + tagger.tagSet()); redoTags(binarizedTrees, tagger, nThreads); + log.info("Tags in training set: " + Trees.uniqueTags(binarizedTrees)); retagTimer.done("Retagging"); } diff --git a/src/edu/stanford/nlp/trees/Trees.java b/src/edu/stanford/nlp/trees/Trees.java index ecbd82afad..562ddf7a61 100644 --- a/src/edu/stanford/nlp/trees/Trees.java +++ b/src/edu/stanford/nlp/trees/Trees.java @@ -186,6 +186,27 @@ private static void preTerminals(Tree t, List l) { } } + public static Set uniqueTags(List trees) { + Set allTags = new HashSet<>(); + for (Tree tree : trees) { + uniqueTags(tree, allTags); + } + return allTags; + } + + public static Set uniqueTags(Tree tree) { + List