From 9e9dbf4710847754543f03d923ed38cb97a808d3 Mon Sep 17 00:00:00 2001 From: Franck Dary <franck.dary@lis-lab.fr> Date: Thu, 28 Oct 2021 11:12:04 +0200 Subject: [PATCH] improved scripts to get stats --- outputs/evalAndStats.py | 26 ++++++++++++++++++-------- outputs/stats2latex.py | 2 +- 2 files changed, 19 insertions(+), 9 deletions(-) diff --git a/outputs/evalAndStats.py b/outputs/evalAndStats.py index 1e2af78..4372dd4 100755 --- a/outputs/evalAndStats.py +++ b/outputs/evalAndStats.py @@ -1,6 +1,7 @@ #! /usr/bin/env python3 import os +import sys data = "../data/" evalScript = "../conll18_ud_eval.py" @@ -22,24 +23,33 @@ for filename in os.listdir() : group = basename.split("_")[0] if group not in groups : groups[group] = [] - groups[group].append(basename) + if basename not in groups[group] : + groups[group].append(basename) refs = " ".join(["%sUD_French-GSD_%d/test.conllu"%(data, split) for split in splits]) -os.system("cat %s > %s%s_corpus.conllu"%(refs, gold, ",".join(list(map(str,splits))))) +os.system("cat %s > %s%s_corpus.conllu"%(refs, gold, "+".join(list(map(str,splits))))) btTraces = [] for group in groups : - + print("group=%s"%group, file=sys.stderr) groupDir = "%s%s/"%(pvalues, group) for model in groups[group] : + print("model=%s"%model, file=sys.stderr) modeloutputs = " ".join(["%d_%s.conllu"%(split, model) for split in splits]) modelDir = "%s%s/"%(groupDir, model) os.makedirs("%s"%(modelDir), exist_ok=True) - os.system("cat %s > %s%s_corpus.conllu"%(modeloutputs, modelDir, ",".join(list(map(str,splits))))) + command = "cat %s > %s%s_corpus.conllu"%(modeloutputs, modelDir, "+".join(list(map(str,splits)))) + print(command, file=sys.stderr) + os.system(command) btTraces.append(["%d_%s.trace"%(list(splits)[0], elem) for elem in groups[group] if "bt" in elem and "nobt" not in elem and "1" in elem][0]) - traces = " ".join(["%d_%s.trace"%(list(splits)[0], elem) for elem in groups[group]]) - os.system("%s %s --steps > steps_%s.txt"%(readTrace, traces, group)) - -os.system("%s %s --stats > stats_bt.txt"%(readTrace, " ".join(btTraces))) + traces = ["%d_%s.trace"%(list(splits)[0], elem) for elem in groups[group]] + for trace in traces : + command = "%s %s --steps > steps_%s.txt"%(readTrace, trace, trace) + print(command, file=sys.stderr) + os.system(command) + +command = "%s %s --stats > stats_bt.txt"%(readTrace, " ".join(btTraces)) +print(command, file=sys.stderr) +os.system(command) diff --git a/outputs/stats2latex.py b/outputs/stats2latex.py index 288ef9e..108b395 100755 --- a/outputs/stats2latex.py +++ b/outputs/stats2latex.py @@ -12,7 +12,7 @@ def modelName(model) : return "TAGGER" if "tagparser" in model.lower() : return "TAPARSER" - if "parser" in model.lower() : + if "parser" in model.lower() or "eager" in model.lower() : return "PARSER" if "bt1" in model.lower() : return "RL\_BT1" -- GitLab