From eedd1e00008020dce2070b64ec68506cb4f43829 Mon Sep 17 00:00:00 2001 From: Franck Dary <franck.dary@lis-lab.fr> Date: Sat, 1 May 2021 14:51:49 +0200 Subject: [PATCH] Fixed bug in createKFolds --- scripts/createKFolds.py | 8 +++++++- 1 file changed, 7 insertions(+), 1 deletion(-) diff --git a/scripts/createKFolds.py b/scripts/createKFolds.py index 8ef39a3..fe2fe4a 100755 --- a/scripts/createKFolds.py +++ b/scripts/createKFolds.py @@ -17,6 +17,11 @@ if __name__ == "__main__" : random.seed(100) + corpusName = sys.argv[1] + while corpusName[-1] == '/' : + corpusName = corpusName[:-1] + corpusName = corpusName.split('/')[-1] + inputFiles = [sys.argv[1]+"/"+filename for filename in os.listdir(sys.argv[1]) if ".conllu" in filename] sentences = [] @@ -56,10 +61,11 @@ if __name__ == "__main__" : train = trainDev[:-testSize] dev = trainDev[-testSize:] - outDir = sys.argv[2]+"/"+sys.argv[1] + outDir = sys.argv[2]+"/"+corpusName while outDir[-1] == '/' : outDir = outDir[:-1] outDir = outDir + "_" + str(k) + print("Creating '%s'"%outDir, file=sys.stderr) os.makedirs(outDir, exist_ok=True) for sents, name in [(train, "train"), (dev, "dev"), (test, "test")] : with open(outDir + "/" + "%s.conllu"%name, "w") as outFile : -- GitLab