diff --git a/UD_any/data/getTransitionSets.py b/UD_any/data/getTransitionSets.py index dd5ad305b9e2cd3638271b72915f196ee01d2e5e..8041e43157e3cbb2a4143f2005c1adf68b546ee6 100755 --- a/UD_any/data/getTransitionSets.py +++ b/UD_any/data/getTransitionSets.py @@ -70,8 +70,8 @@ if __name__ == "__main__" : output.close() elif nameCol == "DEPREL" : - output = open("parser.ts", 'w', encoding='utf-8') - print("<parser> REDUCE", file=output) + output = open("parser_eager_rel_strict.ts", 'w', encoding='utf-8') + print("<parser> REDUCE_strict", file=output) labels = set() labelsList = [] for line in open(colFile, "r", encoding='utf-8') : @@ -84,8 +84,48 @@ if __name__ == "__main__" : labelsList.append(striped) labelsList.sort() for label in labelsList : - print("<parser> LEFT " + label, file=output) - print("<parser> RIGHT " + label, file=output) - print("<parser> SHIFT", file=output) + print("<parser> eager_LEFT_rel " + label, file=output) + print("<parser> eager_RIGHT_rel " + label, file=output) + print("<parser> eager_SHIFT", file=output) + output.close() + + output = open("parser_eager_rel_relaxed.ts", 'w', encoding='utf-8') + print("<parser> REDUCE_relaxed", file=output) + for label in labelsList : + print("<parser> eager_LEFT_rel " + label, file=output) + print("<parser> eager_RIGHT_rel " + label, file=output) + print("<parser> eager_SHIFT", file=output) + output.close() + + output = open("parser_eager_strict.ts", 'w', encoding='utf-8') + print("<parser> REDUCE_strict", file=output) + print("<parser> eager_LEFT", file=output) + print("<parser> eager_RIGHT", file=output) + print("<parser> eager_SHIFT", file=output) + output.close() + + output = open("parser_eager_relaxed.ts", 'w', encoding='utf-8') + print("<parser> REDUCE_relaxed", file=output) + print("<parser> eager_LEFT", file=output) + print("<parser> eager_RIGHT", file=output) + print("<parser> eager_SHIFT", file=output) + output.close() + + output = open("parser_standard_rel.ts", 'w', encoding='utf-8') + for label in labelsList : + print("<parser> standard_LEFT_rel " + label, file=output) + print("<parser> standard_RIGHT_rel " + label, file=output) + print("<parser> standard_SHIFT", file=output) + output.close() + + output = open("parser_standard.ts", 'w', encoding='utf-8') + print("<parser> standard_LEFT_rel", file=output) + print("<parser> standard_RIGHT_rel", file=output) + print("<parser> standard_SHIFT", file=output) + output.close() + + output = open("deprel.ts", 'w', encoding='utf-8') + for label in labelsList : + print("deprel " + label, file=output) output.close() diff --git a/UD_any/results/results_taggerparser_14_05_20.txt b/UD_any/results/results_taggerparser_14_05_20.txt new file mode 100644 index 0000000000000000000000000000000000000000..b769c7f5eccfa53793a24b537148d308ca565af8 --- /dev/null +++ b/UD_any/results/results_taggerparser_14_05_20.txt @@ -0,0 +1,49 @@ +Corpus Metric F1.score Model +-------------------------------------------------------------------------------- +UD_English-EWT LAS 70.40[±0.65]% taggerparser_base +UD_English-EWT LAS 72.45[±0.21]% taggerparser_seq +UD_English-EWT LAS 72.93[±0.28]% taggerparser_incr + +UD_English-EWT Sentences 69.81[±2.27]% taggerparser_base +UD_English-EWT Sentences 72.34[±0.45]% taggerparser_seq +UD_English-EWT Sentences 73.48[±0.16]% taggerparser_incr + +UD_English-EWT UAS 75.07[±0.64]% taggerparser_base +UD_English-EWT UAS 77.20[±0.32]% taggerparser_seq +UD_English-EWT UAS 77.45[±0.23]% taggerparser_incr + +UD_English-EWT UPOS 91.63[±0.15]% taggerparser_base +UD_English-EWT UPOS 91.76[±0.16]% taggerparser_seq +UD_English-EWT UPOS 92.01[±0.11]% taggerparser_incr +-------------------------------------------------------------------------------- +UD_French-GSD LAS 83.25[±0.33]% taggerparser_base +UD_French-GSD LAS 83.42[±0.45]% taggerparser_seq +UD_French-GSD LAS 83.65[±0.64]% taggerparser_incr + +UD_French-GSD Sentences 93.57[±0.29]% taggerparser_incr +UD_French-GSD Sentences 93.63[±0.66]% taggerparser_seq +UD_French-GSD Sentences 93.68[±0.36]% taggerparser_base + +UD_French-GSD UAS 86.56[±0.31]% taggerparser_base +UD_French-GSD UAS 86.64[±0.45]% taggerparser_seq +UD_French-GSD UAS 86.80[±0.67]% taggerparser_incr + +UD_French-GSD UPOS 96.47[±0.24]% taggerparser_base +UD_French-GSD UPOS 96.54[±0.11]% taggerparser_incr +UD_French-GSD UPOS 96.67[±0.24]% taggerparser_seq +-------------------------------------------------------------------------------- +UD_Romanian-RRT LAS 75.29[±0.55]% taggerparser_seq +UD_Romanian-RRT LAS 75.49[±0.11]% taggerparser_incr +UD_Romanian-RRT LAS 76.67[±0.65]% taggerparser_base + +UD_Romanian-RRT Sentences 94.93[±0.16]% taggerparser_seq +UD_Romanian-RRT Sentences 95.63[±0.43]% taggerparser_incr +UD_Romanian-RRT Sentences 95.76[±0.82]% taggerparser_base + +UD_Romanian-RRT UAS 81.85[±0.15]% taggerparser_incr +UD_Romanian-RRT UAS 81.90[±0.39]% taggerparser_seq +UD_Romanian-RRT UAS 83.04[±0.48]% taggerparser_base + +UD_Romanian-RRT UPOS 94.89[±0.09]% taggerparser_incr +UD_Romanian-RRT UPOS 95.10[±0.05]% taggerparser_seq +UD_Romanian-RRT UPOS 95.54[±0.26]% taggerparser_base diff --git a/UD_any/taggerparser_base/machine.rm b/UD_any/taggerparser_base/machine.rm index 043b911af11e401d36a1fedc1e0e8fc5ee1b080c..136bea24b3872a9c916f8722cd15102d11e611f4 100644 --- a/UD_any/taggerparser_base/machine.rm +++ b/UD_any/taggerparser_base/machine.rm @@ -1,7 +1,7 @@ Name : Tagger, Parser and Segmenter baseline Machine Classifier : tagparser { - Transitions : {tagger,data/tagger.ts parser,data/parser.ts segmenter,data/segmenter.ts} + Transitions : {tagger,data/tagger.ts parser,data/parser_eager_rel_strict.ts segmenter,data/segmenter.ts} LossMultiplier : {segmenter,10.0} Network type : Modular # AppliableTrans : @@ -25,7 +25,7 @@ Strategy tagger tagger * 1 Block : End{cannotMove} parser segmenter SHIFT 0 - parser segmenter RIGHT 0 + parser segmenter eager_RIGHT_rel 0 parser parser * 0 segmenter parser * 1 } diff --git a/UD_any/taggerparser_incr/machine.rm b/UD_any/taggerparser_incr/machine.rm index 51c1b2e991eac29a9fa729e8e91ae7a848d9006f..f56b219c8aa44b3d50bdef16512f05b9e5cb18a7 100644 --- a/UD_any/taggerparser_incr/machine.rm +++ b/UD_any/taggerparser_incr/machine.rm @@ -1,7 +1,7 @@ Name : Tagger, Parser and Segmenter incremental Machine Classifier : taggerparser { - Transitions : {tagger,data/tagger.ts parser,data/parser.ts segmenter,data/segmenter.ts} + Transitions : {tagger,data/tagger.ts parser,data/parser_eager_rel_strict.ts segmenter,data/segmenter.ts} LossMultiplier : {segmenter,10.0} Network type : Modular # AppliableTrans : @@ -24,7 +24,7 @@ Strategy Block : End{cannotMove} tagger parser * 0 parser segmenter SHIFT 0 - parser segmenter RIGHT 0 + parser segmenter eager_RIGHT_rel 0 parser parser * 0 segmenter tagger * 1 } diff --git a/UD_any/taggerparser_seq/machine.rm b/UD_any/taggerparser_seq/machine.rm index e5db2767fd78022763e638736524f7b2f76e39a3..409f1010d318cc490f84c5e33a0b50f5812f780d 100644 --- a/UD_any/taggerparser_seq/machine.rm +++ b/UD_any/taggerparser_seq/machine.rm @@ -1,7 +1,7 @@ Name : Tagger, Parser and Segmenter sequential Machine Classifier : tagparser { - Transitions : {tagger,data/tagger.ts parser,data/parser.ts segmenter,data/segmenter.ts} + Transitions : {tagger,data/tagger.ts parser,data/parser_eager_rel_strict.ts segmenter,data/segmenter.ts} LossMultiplier : {segmenter,10.0} Network type : Modular # AppliableTrans : @@ -25,7 +25,7 @@ Strategy tagger tagger * 1 Block : End{cannotMove} parser segmenter SHIFT 0 - parser segmenter RIGHT 0 + parser segmenter eager_RIGHT_rel 0 parser parser * 0 segmenter parser * 1 }