From e0333e373f963da40dfc06a2bba577f3b29c6245 Mon Sep 17 00:00:00 2001
From: Alexis Nasr <alexis.nasr@lif.univ-mrs.fr>
Date: Thu, 27 Apr 2017 13:50:38 +0200
Subject: [PATCH] added models for ftb

---
 ftb/Makefile                     | 55 ++++++++++++++++++++++++++++++++
 ftb/data/morpho-lexicon/Makefile |  4 +++
 ftb/data/morpho-lexicon/fplm_add |  0
 ftb/data/treebank/Makefile       |  7 ++++
 ftb/eval/.res                    |  1 +
 ftb/eval/Makefile                |  8 +++++
 ftb/maca_lemmatizer/Makefile     | 18 +++++++++++
 ftb/maca_lexer/Makefile          |  4 +++
 ftb/maca_trans_morpho/Makefile   | 21 ++++++++++++
 ftb/maca_trans_parser/Makefile   | 20 ++++++++++++
 ftb/maca_trans_tagger/Makefile   | 26 +++++++++++++++
 11 files changed, 164 insertions(+)
 create mode 100644 ftb/Makefile
 create mode 100644 ftb/data/morpho-lexicon/Makefile
 create mode 100644 ftb/data/morpho-lexicon/fplm_add
 create mode 100644 ftb/data/treebank/Makefile
 create mode 100644 ftb/eval/.res
 create mode 100644 ftb/eval/Makefile
 create mode 100644 ftb/maca_lemmatizer/Makefile
 create mode 100644 ftb/maca_lexer/Makefile
 create mode 100644 ftb/maca_trans_morpho/Makefile
 create mode 100644 ftb/maca_trans_parser/Makefile
 create mode 100644 ftb/maca_trans_tagger/Makefile

diff --git a/ftb/Makefile b/ftb/Makefile
new file mode 100644
index 0000000..bf7b20e
--- /dev/null
+++ b/ftb/Makefile
@@ -0,0 +1,55 @@
+# Top-level driver for the ftb models: runs the compile, install, evaluation
+# and clean steps of the component directories through recursive make.
+
+# NOTE(review): TRAIN/DEV/TEST are handed to sub-makes that run inside data/*,
+# so this relative path is presumably resolved from there - confirm.
+DATA_DIR=../../../data/ftb
+
+TRAIN=$(DATA_DIR)/ftb.train.conll07
+DEV=$(DATA_DIR)/ftb.dev.conll07
+TEST=$(DATA_DIR)/ftb.test.conll07
+
+_LANG=ftb
+
+# None of these targets names a file; declaring them phony keeps a stray file
+# or directory of the same name from short-circuiting the rule.
+.PHONY: all compile install evaluation clean
+
+# The prerequisites of "all" presumably have to run in the order listed, which
+# "make -j" does not guarantee. .NOTPARALLEL serializes this makefile only; the
+# recursively invoked makes may still run their own recipes in parallel.
+.NOTPARALLEL:
+
+all: compile install evaluation
+
+compile:
+	$(MAKE) TRAIN=$(TRAIN) -C data/morpho-lexicon compile
+	$(MAKE) TRAIN=$(TRAIN) TEST=$(TEST) DEV=$(DEV) -C data/treebank compile
+	$(MAKE) -C maca_lexer compile
+	$(MAKE) -C maca_trans_tagger compile
+	$(MAKE) -C maca_trans_morpho compile
+	$(MAKE) -C maca_trans_parser compile
+#	$(MAKE) -C maca_crf_tagger compile
+
+install:
+	mkdir -p bin
+	$(MAKE) -C maca_lexer install
+	$(MAKE) -C maca_trans_tagger install
+	$(MAKE) -C maca_trans_morpho install
+	$(MAKE) -C maca_lemmatizer install
+	$(MAKE) -C maca_trans_parser install
+#	$(MAKE) -C maca_crf_tagger install
+#	@tar -cvzf ./maca_datas.tgz bin
+
+evaluation:
+	$(MAKE) LANGUAGE=$(_LANG) CODE=$(_LANG) -C eval
+
+clean:
+	$(MAKE) -C data/morpho-lexicon clean
+	$(MAKE) -C data/treebank clean
+	$(MAKE) -C maca_lexer clean
+	$(MAKE) -C maca_trans_tagger clean
+	$(MAKE) -C maca_trans_morpho clean
+	$(MAKE) -C maca_trans_parser clean
+#	$(MAKE) -C maca_crf_tagger clean
+	$(MAKE) -C eval clean
diff --git a/ftb/data/morpho-lexicon/Makefile b/ftb/data/morpho-lexicon/Makefile
new file mode 100644
index 0000000..ded55da
--- /dev/null
+++ b/ftb/data/morpho-lexicon/Makefile
@@ -0,0 +1,4 @@
+#DATA_DIR=../../../data/ud-treebanks-conll2017/UD_French
+#TRAIN=$(DATA_DIR)/fr-ud-train.conllu
+
+include ../../../makefiles/morpho-lexicon_ud.makefile
diff --git a/ftb/data/morpho-lexicon/fplm_add b/ftb/data/morpho-lexicon/fplm_add
new file mode 100644
index 0000000..e69de29
diff --git a/ftb/data/treebank/Makefile b/ftb/data/treebank/Makefile
new file mode 100644
index 0000000..07eda4d
--- /dev/null
+++ b/ftb/data/treebank/Makefile
@@ -0,0 +1,7 @@
+#DATA_DIR=../../../data/ud-treebanks-conll2017/UD_French
+#TRAIN=$(DATA_DIR)/fr-ud-train.conllu
+#TEST=$(DATA_DIR)/fr-ud-dev.conllu
+#DEV=$(DATA_DIR)/fr-ud-dev.conllu
+
+include ../../../makefiles/treebank_ud.makefile
+
diff --git a/ftb/eval/.res b/ftb/eval/.res
new file mode 100644
index 0000000..01e3d5d
--- /dev/null
+++ b/ftb/eval/.res
@@ -0,0 +1 @@
+file pos morpho lemma uas las srec sacc
diff --git a/ftb/eval/Makefile b/ftb/eval/Makefile
new file mode 100644
index 0000000..f2f973c
--- /dev/null
+++ b/ftb/eval/Makefile
@@ -0,0 +1,8 @@
+
+#LANGUAGE=UD_French
+WPMLGFS_MCD_FILE=../../mcd/wpmlgfs.mcd
+WPLGFS_MCD_FILE=../../mcd/wplgfs.mcd
+TEST=../data/treebank/test.mcf
+DEV=../data/treebank/dev.mcf
+
+include ../../makefiles/eval_ud.makefile
diff --git a/ftb/maca_lemmatizer/Makefile b/ftb/maca_lemmatizer/Makefile
new file mode 100644
index 0000000..0aca079
--- /dev/null
+++ b/ftb/maca_lemmatizer/Makefile
@@ -0,0 +1,18 @@
+DATA=../data/morpho-lexicon
+
+##-----------------------------------------------------------------------
+## compile
+##-----------------------------------------------------------------------
+
+##-----------------------------------------------------------------------
+## install
+##-----------------------------------------------------------------------
+
+install:
+	- cp $(DATA)/fplm ../bin
+
+##-----------------------------------------------------------------------
+## clean
+##-----------------------------------------------------------------------
+
+
diff --git a/ftb/maca_lexer/Makefile b/ftb/maca_lexer/Makefile
new file mode 100644
index 0000000..78de203
--- /dev/null
+++ b/ftb/maca_lexer/Makefile
@@ -0,0 +1,4 @@
+FPLM_FILE=../data/morpho-lexicon/fplm
+
+include ../../makefiles/maca_lexer.makefile
+
diff --git a/ftb/maca_trans_morpho/Makefile b/ftb/maca_trans_morpho/Makefile
new file mode 100644
index 0000000..eae858e
--- /dev/null
+++ b/ftb/maca_trans_morpho/Makefile
@@ -0,0 +1,21 @@
+MCF_TRAIN=../data/treebank/train.mcf
+MCF_DEV=../data/treebank/dev.mcf
+MCF_TEST=../data/treebank/test.mcf
+
+CFF_TRAIN=train.cff
+FANN_TRAIN=train.fann
+CFF_FANN_TRAIN=train.fann.cff
+CFF_CUTOFF_TRAIN=train.cutoff.cff
+PERCEPTRON_ITERATIONS=4
+CFF_CUTOFF=1
+FEATURES_MODEL_FILENAME=../../fm/maca_trans_morpho.fm
+# NOTE(review): this is the tagger's FANN feature model, not a morpho one - confirm it is intended.
+FEATURES_MODEL_FANN_FILENAME=../../fm/maca_trans_tagger_fann.fm
+VOCABS_FILENAME=maca_trans_morpho.vocab
+VOCABS_FANN_FILENAME=maca_trans_morpho_fann.vocab
+MCD_FILENAME=../../mcd/wpmlgfs.mcd
+MODEL_FILENAME=maca_trans_morpho.model
+NUMBER_OF_SENTENCES=10000000
+
+include ../../makefiles/maca_trans_morpho.makefile
+
diff --git a/ftb/maca_trans_parser/Makefile b/ftb/maca_trans_parser/Makefile
new file mode 100644
index 0000000..38f5e04
--- /dev/null
+++ b/ftb/maca_trans_parser/Makefile
@@ -0,0 +1,20 @@
+MCF_TRAIN=../data/treebank/train.mcf
+MCF_DEV=../data/treebank/dev.mcf
+MCF_TEST=../data/treebank/test.mcf
+
+CFF_TRAIN=train.cff
+CFF_FANN_TRAIN=train.fann.cff
+CFF_CUTOFF_TRAIN=train.cutoff.cff
+FANN_TRAIN=train.fann
+PERCEPTRON_ITERATIONS=5
+CFF_CUTOFF=3
+FEATURES_MODEL_FILENAME=../../fm/maca_trans_parser.fm
+FEATURES_MODEL_FANN_FILENAME=../../fm/maca_trans_parser_fann.fm
+VOCABS_FILENAME=maca_trans_parser.vocab
+VOCABS_FANN_FILENAME=maca_trans_parser_fann.vocab
+MODEL_FILENAME=maca_trans_parser.model
+NUMBER_OF_SENTENCES=10000000
+MCD_FILENAME=../../mcd/wpmlgfs.mcd
+STREAM_MODE= -S
+
+include ../../makefiles/maca_trans_parser.makefile
diff --git a/ftb/maca_trans_tagger/Makefile b/ftb/maca_trans_tagger/Makefile
new file mode 100644
index 0000000..b4a2855
--- /dev/null
+++ b/ftb/maca_trans_tagger/Makefile
@@ -0,0 +1,26 @@
+MCF_TRAIN=../data/treebank/train.mcf
+MCF_DEV=../data/treebank/dev.mcf
+MCF_TEST=../data/treebank/test.mcf
+
+CFF_TRAIN=train.cff
+CFF_FANN_TRAIN=train.fann.cff
+FANN_TRAIN=train.fann
+CFF_CUTOFF_TRAIN=train.cutoff.cff
+PERCEPTRON_ITERATIONS=9
+CFF_CUTOFF=1
+FEATURES_MODEL_FILENAME=../../fm/maca_trans_tagger.fm
+FEATURES_MODEL_FANN_FILENAME=../../fm/maca_trans_tagger_fann.fm
+VOCABS_FILENAME=maca_trans_tagger.vocab
+VOCABS_FANN_FILENAME=maca_trans_tagger_fann.vocab
+MCD_FILENAME=../../mcd/maca_trans_tagger.mcd
+MODEL_FILENAME=maca_trans_tagger.model
+NUMBER_OF_SENTENCES=10000000
+STREAM_MODE= -S
+
+FORM_POS_FILENAME=../data/morpho-lexicon/fP
+
+#include ./maca_trans_tagger.makefile
+include ../../makefiles/maca_trans_tagger.makefile
+
+
+
-- 
GitLab