From 9e9dbf4710847754543f03d923ed38cb97a808d3 Mon Sep 17 00:00:00 2001
From: Franck Dary <franck.dary@lis-lab.fr>
Date: Thu, 28 Oct 2021 11:12:04 +0200
Subject: [PATCH] Improve stats scripts (dedupe models, log commands, per-trace steps)

---
 outputs/evalAndStats.py | 26 ++++++++++++++++++--------
 outputs/stats2latex.py  |  2 +-
 2 files changed, 19 insertions(+), 9 deletions(-)

diff --git a/outputs/evalAndStats.py b/outputs/evalAndStats.py
index 1e2af78..4372dd4 100755
--- a/outputs/evalAndStats.py
+++ b/outputs/evalAndStats.py
@@ -1,6 +1,7 @@
 #! /usr/bin/env python3
 
 import os
+import sys
 
 data = "../data/"
 evalScript = "../conll18_ud_eval.py"
@@ -22,24 +23,33 @@ for filename in os.listdir() :
   group = basename.split("_")[0]
   if group not in groups :
     groups[group] = []
-  groups[group].append(basename)
+  if basename not in groups[group] :
+    groups[group].append(basename)
 
 refs = " ".join(["%sUD_French-GSD_%d/test.conllu"%(data, split) for split in splits])
-os.system("cat %s > %s%s_corpus.conllu"%(refs, gold, ",".join(list(map(str,splits)))))
+os.system("cat %s > %s%s_corpus.conllu"%(refs, gold, "+".join(list(map(str,splits)))))
 
 btTraces = []
 for group in groups :
-
+  print("group=%s"%group, file=sys.stderr)
   groupDir = "%s%s/"%(pvalues, group)
   for model in groups[group] :
+    print("model=%s"%model, file=sys.stderr)
     modeloutputs = " ".join(["%d_%s.conllu"%(split, model) for split in splits])
     modelDir = "%s%s/"%(groupDir, model)
     os.makedirs("%s"%(modelDir), exist_ok=True)
-    os.system("cat %s > %s%s_corpus.conllu"%(modeloutputs, modelDir, ",".join(list(map(str,splits)))))
+    command = "cat %s > %s%s_corpus.conllu"%(modeloutputs, modelDir, "+".join(list(map(str,splits))))
+    print(command, file=sys.stderr)
+    os.system(command)
 
   btTraces.append(["%d_%s.trace"%(list(splits)[0], elem) for elem in groups[group] if "bt" in elem and "nobt" not in elem and "1" in elem][0])
-  traces = " ".join(["%d_%s.trace"%(list(splits)[0], elem) for elem in groups[group]])
-  os.system("%s %s --steps > steps_%s.txt"%(readTrace, traces, group))
-
-os.system("%s %s --stats > stats_bt.txt"%(readTrace, " ".join(btTraces)))
+  traces = ["%d_%s.trace"%(list(splits)[0], elem) for elem in groups[group]]
+  for trace in traces :
+    command = "%s %s --steps > steps_%s.txt"%(readTrace, trace, trace)
+    print(command, file=sys.stderr)
+    os.system(command)
+
+command = "%s %s --stats > stats_bt.txt"%(readTrace, " ".join(btTraces))
+print(command, file=sys.stderr)
+os.system(command)
 
diff --git a/outputs/stats2latex.py b/outputs/stats2latex.py
index 288ef9e..108b395 100755
--- a/outputs/stats2latex.py
+++ b/outputs/stats2latex.py
@@ -12,7 +12,7 @@ def modelName(model) :
     return "TAGGER"
   if "tagparser" in model.lower() :
     return "TAPARSER"
-  if "parser" in model.lower() :
+  if "parser" in model.lower() or "eager" in model.lower() :
     return "PARSER"
   if "bt1" in model.lower() :
     return "RL\_BT1"
-- 
GitLab