Skip to content

Commit 53a8f1b

Browse files
committed
Rehome the conll-2012 scorer. Not sure yet whether the 2011 scorer can be easily recovered.
Also update some property paths to point to the new /u/nlp/data/coref home.
1 parent 54aaf2c commit 53a8f1b

14 files changed

+38
-37
lines changed

data/edu/stanford/nlp/dcoref/coref.properties

Lines changed: 4 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -10,8 +10,9 @@ dcoref.postprocessing = true
1010
dcoref.maxdist = -1
1111
dcoref.use.big.gender.number = false
1212
dcoref.replicate.conll = true
13-
dcoref.conll.scorer = /u/scr/nlp/data/conll-2011/scorer/v4/scorer.pl
13+
# TODO maybe this can be 2012?
14+
dcoref.conll.scorer = /u/nlp/data/coref/conll-2012/scorer/v4/scorer.pl
1415

15-
dcoref.logFile = /u/scr/nlp/coref/error_log/temp/result_conlldev.txt
16-
dcoref.conll2011 = /u/scr/nlp/data/conll-2011/v2/data/dev/data/english/annotations
16+
dcoref.logFile = /u/nlp/data/coref/error_log/temp/result_conlldev.txt
17+
dcoref.conll2011 = /u/nlp/data/coref/conll-2011/v2/data/dev/data/english/annotations
1718

itest/src/edu/stanford/nlp/dcoref/DcorefSlowITest.java

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -35,14 +35,14 @@ protected void makePropsFile(String path, String workDir, String scorer) throws
3535
}
3636

3737
public void testDcorefCoNLLResultV4() throws Exception {
38-
double finalScore = runDcoref(String.format("%s/conll-2011/scorer/v4/scorer.pl", TestPaths.testHome()));
39-
System.out.printf("Final Score (CoNLL 2011, scorer v4): (MUC+B^3+ceafe)/3 = %.2f%n", finalScore);
38+
double finalScore = runDcoref(String.format("%s/conll-2012/scorer/v4/scorer.pl", TestPaths.testHome()));
39+
System.out.printf("Final Score (CoNLL 2012, scorer v4): (MUC+B^3+ceafe)/3 = %.2f%n", finalScore);
4040
assertEquals(59.3, finalScore, 0.3); // 2016-07: 59.45
4141
}
4242

4343
public void testDcorefCoNLLResultV801() throws Exception {
4444
double finalScore = runDcoref(String.format("%s/conll-2012/scorer/v8.01/scorer.pl", TestPaths.testHome()));
45-
System.out.printf("Final Score (CoNLL 2011, scorer v8): (MUC+B^3+ceafe)/3 = %.2f%n", finalScore);
45+
System.out.printf("Final Score (CoNLL 2012, scorer v8): (MUC+B^3+ceafe)/3 = %.2f%n", finalScore);
4646
assertEquals(54.0, finalScore, 0.3); // 2016-07: 54.13
4747
}
4848

src/edu/stanford/nlp/coref/CorefProperties.java

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -129,7 +129,7 @@ public static boolean useGoldMentions(Properties props) {
129129

130130
public static final String OUTPUT_PATH_PROP = "coref.conllOutputPath";
131131
public static String conllOutputPath(Properties props) {
132-
String returnPath = props.getProperty("coref.conllOutputPath", "/u/scr/nlp/coref/logs/");
132+
String returnPath = props.getProperty("coref.conllOutputPath", "/u/nlp/data/coref/logs/");
133133
if ( ! returnPath.endsWith("/")) {
134134
returnPath += "/";
135135
}
@@ -144,7 +144,7 @@ public static void setInput(Properties props, Dataset d) {
144144
}
145145

146146
private static String getDataPath(Properties props) {
147-
String returnPath = props.getProperty("coref.data", "/u/scr/nlp/data/conll-2012/");
147+
String returnPath = props.getProperty("coref.data", "/u/nlp/data/coref/conll-2012/");
148148
if ( ! returnPath.endsWith("/")) {
149149
returnPath += "/";
150150
}
@@ -172,7 +172,7 @@ public static String getInputPath(Properties props) {
172172
}
173173

174174
public static String getScorerPath(Properties props) {
175-
return props.getProperty("coref.scorer", "/u/scr/nlp/data/conll-2012/scorer/v8.01/scorer.pl");
175+
return props.getProperty("coref.scorer", "/u/nlp/data/coref/conll-2012/scorer/v8.01/scorer.pl");
176176
}
177177

178178
public static Locale getLanguage(Properties props) {

src/edu/stanford/nlp/coref/hybrid/properties/coref-conll-dep.properties

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -19,20 +19,20 @@ coref.conll = true
1919

2020
## conll 2012
2121
## train
22-
coref.path.trainData = /u/scr/nlp/data/conll-2012/v4/data/train/data/english/annotations/
22+
coref.path.trainData = /u/nlp/data/coref/conll-2012/v4/data/train/data/english/annotations/
2323
#coref.path.traindata = /scr/nlp/data/conll-2012/v4/data/train+dev/
2424

2525
## eval
2626
#coref.path.evaldata = /scr/nlp/data/conll-2012/v4/data/development/data/english/annotations/
27-
coref.path.testData = /u/scr/nlp/data/conll-2012/v9/data/test/data/english/annotations
27+
coref.path.testData = /u/nlp/data/coref/conll-2012/v9/data/test/data/english/annotations
2828

2929

3030
## models
31-
coref.path.serialized = /u/scr/nlp/data/coref/models/hybrid-conll-dep
31+
coref.path.serialized = /u/nlp/data/coref/models/hybrid-conll-dep
3232

3333
## other data
3434
coref.big.gender.number = edu/stanford/nlp/models/dcoref/gender.data.gz
35-
coref.path.word2vec = /u/scr/nlp/data/coref/wordvectors/en/vectors.txt.gz
35+
coref.path.word2vec = /u/nlp/data/coref/wordvectors/en/vectors.txt.gz
3636

3737
#############################################################################
3838
# mention detection

src/edu/stanford/nlp/coref/hybrid/properties/coref-conll.properties

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -19,20 +19,20 @@ coref.conll = true
1919

2020
## conll 2012
2121
## train
22-
coref.path.trainData = /u/scr/nlp/data/conll-2012/v4/data/train/data/english/annotations/
22+
coref.path.trainData = /u/nlp/data/coref/conll-2012/v4/data/train/data/english/annotations/
2323
#coref.path.traindata = /scr/nlp/data/conll-2012/v4/data/train+dev/
2424

2525
## eval
2626
#coref.path.evaldata = /scr/nlp/data/conll-2012/v4/data/development/data/english/annotations/
27-
coref.path.testData = /u/scr/nlp/data/conll-2012/v9/data/test/data/english/annotations
27+
coref.path.testData = /u/nlp/data/coref/conll-2012/v9/data/test/data/english/annotations
2828

2929

3030
## models
31-
coref.path.serialized = /u/scr/nlp/data/coref/models/hybrid-conll/
31+
coref.path.serialized = /u/nlp/data/coref/models/hybrid-conll/
3232

3333
## other data
3434
coref.big.gender.number = edu/stanford/nlp/models/dcoref/gender.data.gz
35-
coref.path.word2vec = /u/scr/nlp/data/coref/wordvectors/en/vectors.txt.gz
35+
coref.path.word2vec = /u/nlp/data/coref/wordvectors/en/vectors.txt.gz
3636

3737
#############################################################################
3838
# mention detection

src/edu/stanford/nlp/coref/hybrid/properties/coref-default-dep.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ coref.sieves = SpeakerMatch, PreciseConstructs, pp-rf, cc-rf, pc-rf, ll-rf, pr-r
77

88
coref.useConstituencyParse = false
99
coref.conll = false
10-
coref.path.trainData = /u/scr/nlp/data/conll-2012/v4/data/train/data/english/annotations/
10+
coref.path.trainData = /u/nlp/data/coref/conll-2012/v4/data/train/data/english/annotations/
1111

1212
#############################################################################
1313
# data & model path
@@ -18,7 +18,7 @@ coref.path.serialized = edu/stanford/nlp/models/hcoref/
1818

1919
## other data
2020
coref.big.gender.number = edu/stanford/nlp/models/dcoref/gender.data.gz
21-
coref.path.word2vec = /u/scr/nlp/data/coref/wordvectors/en/vectors.txt.gz
21+
coref.path.word2vec = /u/nlp/data/coref/wordvectors/en/vectors.txt.gz
2222
coref.path.word2vecSerialized = edu/stanford/nlp/models/word2vec/vectors.ser
2323

2424
#############################################################################

src/edu/stanford/nlp/coref/hybrid/properties/dcoref-conll-dep.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -23,12 +23,12 @@ coref.path.trainData = /220/log-hcoref/forthesis/cleanup/small/train
2323

2424
## eval
2525
#coref.path.evaldata = /scr/nlp/data/conll-2012/v4/data/development/data/english/annotations/
26-
coref.path.evalData = /u/scr/nlp/data/conll-2012/v9/data/test/data/english/annotations
26+
coref.path.evalData = /u/nlp/data/coref/conll-2012/v9/data/test/data/english/annotations
2727
#coref.path.evaldata = /220/log-hcoref/forthesis/cleanup/small/eval
2828

2929

3030
## scorer
31-
coref.path.scorer.conll = /u/scr/nlp/data/conll-2012/scorer/v8.01/scorer.pl
31+
coref.path.scorer.conll = /u/nlp/data/coref/conll-2012/scorer/v8.01/scorer.pl
3232

3333
## other data
3434
coref.big.gender.number = edu/stanford/nlp/models/dcoref/gender.data.gz

src/edu/stanford/nlp/coref/hybrid/properties/dcoref-conll.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@ coref.path.trainData = /220/log-hcoref/forthesis/cleanup/small/train
2323

2424
## eval
2525
#coref.path.evaldata = /scr/nlp/data/conll-2012/v4/data/development/data/english/annotations/
26-
coref.path.testData = /u/scr/nlp/data/conll-2012/v9/data/test/data/english/annotations
26+
coref.path.testData = /u/nlp/data/coref/conll-2012/v9/data/test/data/english/annotations
2727
#coref.path.evaldata = /220/log-hcoref/forthesis/cleanup/small/eval
2828

2929

@@ -32,7 +32,7 @@ coref.path.serialized = /home/heeyoung/log-hcoref/ser/DIR/
3232
coref.path.DIR=../forthesis/cleanup/ser/
3333

3434
## scorer
35-
coref.path.scorer.conll = /u/scr/nlp/data/conll-2012/scorer/v8.01/scorer.pl
35+
coref.path.scorer.conll = /u/nlp/data/coref/conll-2012/scorer/v8.01/scorer.pl
3636

3737
## other data
3838
coref.big.gender.number = edu/stanford/nlp/models/dcoref/gender.data.gz

src/edu/stanford/nlp/coref/hybrid/properties/zh-coref-default.properties

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -3,9 +3,9 @@ annotators = segment, ssplit, pos, lemma, ner, parse, mention, coref
33
coref.algorithm = hybrid
44

55
# data paths
6-
coref.data = /u/scr/nlp/data/conll-2012/
7-
coref.conllOutputPath = /u/scr/nlp/coref/logs/
8-
coref.scorer = /u/scr/nlp/data/conll-2012/scorer/v8.01/scorer.pl
6+
coref.data = /u/nlp/data/coref/conll-2012/
7+
coref.conllOutputPath = /u/nlp/data/coref/logs/
8+
coref.scorer = /u/nlp/data/coref/conll-2012/scorer/v8.01/scorer.pl
99

1010
# coref options
1111
coref.sieves = ChineseHeadMatch, ExactStringMatch, PreciseConstructs, StrictHeadMatch1, StrictHeadMatch2, StrictHeadMatch3, StrictHeadMatch4, PronounMatch

src/edu/stanford/nlp/coref/hybrid/properties/zh-dcoref-conll-no-output.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -20,9 +20,9 @@ coref.addMissingAnnotations = true
2020
coref.specialCaseNewswire = true
2121

2222
# Evaluation
23-
coref.path.scorer.conll = /u/scr/nlp/data/conll-2012/scorer/v8.01/scorer.pl
23+
coref.path.scorer.conll = /u/nlp/data/coref/conll-2012/scorer/v8.01/scorer.pl
2424
#coref.path.output = /scr/nlp/coref/output/
25-
coref.path.testData = /u/scr/nlp/data/conll-2012/v4/data/development/data/chinese/annotations/
25+
coref.path.testData = /u/nlp/data/coref/conll-2012/v4/data/development/data/chinese/annotations/
2626

2727
# NER
2828
ner.model = edu/stanford/nlp/models/ner/chinese.misc.distsim.crf.ser.gz

src/edu/stanford/nlp/coref/hybrid/properties/zh-dcoref-conll.properties

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -22,10 +22,10 @@ coref.specialCaseNewswire = true
2222
coref.input.type = conll
2323

2424
# Evaluation
25-
coref.path.output = /u/scr/nlp/coref/output/
26-
coref.data = /u/scr/nlp/data/conll-2012/
27-
coref.inputPath = /u/scr/nlp/data/conll-2012/v4/data/development/data/chinese/annotations
28-
coref.scorer = /u/scr/nlp/data/conll-2012/scorer/v8.01/scorer.pl
25+
coref.path.output = /u/nlp/data/coref/output/
26+
coref.data = /u/nlp/data/coref/conll-2012/
27+
coref.inputPath = /u/nlp/data/coref/conll-2012/v4/data/development/data/chinese/annotations
28+
coref.scorer = /u/nlp/data/coref/conll-2012/scorer/v8.01/scorer.pl
2929

3030
# NER
3131
ner.model = edu/stanford/nlp/models/ner/chinese.misc.distsim.crf.ser.gz
Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
coref.conll = true
2-
coref.data = /u/scr/nlp/data/conll-2012/
3-
coref.statistical.trainingPath = /u/scr/nlp/coref/training/
2+
coref.data = /u/nlp/data/coref/conll-2012/
3+
coref.statistical.trainingPath = /u/nlp/data/coref/training/
Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,3 @@
11
coref.conll = false
2-
coref.data = /u/scr/nlp/data/conll-2012/
3-
coref.statistical.trainingPath = /u/scr/nlp/coref/training/
2+
coref.data = /u/nlp/data/coref/conll-2012/
3+
coref.statistical.trainingPath = /u/nlp/data/coref/training/

src/edu/stanford/nlp/dcoref/Constants.java

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -47,7 +47,7 @@ protected Constants() {} // static class but extended by jcoref
4747
public static final boolean PRINT_CONLL_OUTPUT = false;
4848

4949
/** Default path for conll scorer script */
50-
public static final String conllMentionEvalScript = "/u/scr/nlp/data/conll-2011/scorer/v4/scorer.pl";
50+
public static final String conllMentionEvalScript = "/u/nlp/data/coref/conll-2012/scorer/v4/scorer.pl";
5151

5252
/** if true, skip coreference resolution. do mention detection only */
5353
public static final boolean SKIP_COREF = false;

0 commit comments

Comments
 (0)