diff --git a/ftb/Makefile b/ftb/Makefile
new file mode 100644
index 0000000000000000000000000000000000000000..bf7b20ec67ce500e7e52657b3f091348c44fc09e
--- /dev/null
+++ b/ftb/Makefile
@@ -0,0 +1,52 @@
+# Top-level driver for the ftb models: recurses into each component directory.
+# Every target here is a command, not a file.
+.PHONY: all compile install evaluation clean
+
+# "all" lists compile, install and evaluation as sibling prerequisites with
+# nothing ordering them, so -j would start them concurrently. Keep this
+# makefile serial; the recursive $(MAKE) calls can still run in parallel.
+.NOTPARALLEL:
+
+# These relative paths are handed verbatim to sub-makes started with -C, so
+# they resolve from data/morpho-lexicon and data/treebank, not from here.
+DATA_DIR=../../../data/ftb
+
+TRAIN=$(DATA_DIR)/ftb.train.conll07
+DEV=$(DATA_DIR)/ftb.dev.conll07
+TEST=$(DATA_DIR)/ftb.test.conll07
+
+_LANG=ftb
+all: compile install evaluation
+
+compile:
+	$(MAKE) TRAIN=$(TRAIN) -C data/morpho-lexicon compile
+	$(MAKE) TRAIN=$(TRAIN) TEST=$(TEST) DEV=$(DEV) -C data/treebank compile
+	$(MAKE) -C maca_lexer compile
+	$(MAKE) -C maca_trans_tagger compile
+	$(MAKE) -C maca_trans_morpho compile
+	$(MAKE) -C maca_trans_parser compile
+#	$(MAKE) -C maca_crf_tagger compile
+
+# mkdir -p succeeds when bin/ already exists, so its errors are not ignored.
+install:
+	mkdir -p bin
+	$(MAKE) -C maca_lexer install
+	$(MAKE) -C maca_trans_tagger install
+	$(MAKE) -C maca_trans_morpho install
+	$(MAKE) -C maca_lemmatizer install
+	$(MAKE) -C maca_trans_parser install
+#	$(MAKE) -C maca_crf_tagger install
+#	@tar -cvzf ./maca_datas.tgz bin
+
+evaluation:
+	$(MAKE) LANGUAGE=$(_LANG) CODE=$(_LANG) -C eval
+
+clean:
+	$(MAKE) -C data/morpho-lexicon clean
+	$(MAKE) -C data/treebank clean
+	$(MAKE) -C maca_lexer clean
+	$(MAKE) -C maca_trans_tagger clean
+	$(MAKE) -C maca_trans_morpho clean
+	$(MAKE) -C maca_trans_parser clean
+#	$(MAKE) -C maca_crf_tagger clean
+	$(MAKE) -C eval clean
diff --git a/ftb/data/morpho-lexicon/Makefile b/ftb/data/morpho-lexicon/Makefile
new file mode 100644
index 0000000000000000000000000000000000000000..ded55daca35c2eaea2799fab8074e309829ae917
--- /dev/null
+++ b/ftb/data/morpho-lexicon/Makefile
@@ -0,0 +1,4 @@
+#DATA_DIR=../../../data/ud-treebanks-conll2017/UD_French
+#TRAIN=$(DATA_DIR)/fr-ud-train.conllu
+
+include ../../../makefiles/morpho-lexicon_ud.makefile
diff --git a/ftb/data/morpho-lexicon/fplm_add b/ftb/data/morpho-lexicon/fplm_add
new file mode 100644
index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391
diff --git a/ftb/data/treebank/Makefile b/ftb/data/treebank/Makefile
new file mode 100644
index 0000000000000000000000000000000000000000..07eda4dc44b4ef13cf2eb81af898d03d75bdafe8
--- /dev/null
+++ b/ftb/data/treebank/Makefile
@@ -0,0 +1,7 @@
+#DATA_DIR=../../../data/ud-treebanks-conll2017/UD_French
+#TRAIN=$(DATA_DIR)/fr-ud-train.conllu
+#TEST=$(DATA_DIR)/fr-ud-dev.conllu
+#DEV=$(DATA_DIR)/fr-ud-dev.conllu
+
+include ../../../makefiles/treebank_ud.makefile
+
diff --git a/ftb/eval/.res b/ftb/eval/.res
new file mode 100644
index 0000000000000000000000000000000000000000..01e3d5d2c51b4d95059cd0058cb82742fbc67492
--- /dev/null
+++ b/ftb/eval/.res
@@ -0,0 +1 @@
+file pos morpho lemma uas las srec sacc
diff --git a/ftb/eval/Makefile b/ftb/eval/Makefile
new file mode 100644
index 0000000000000000000000000000000000000000..f2f973ca61df5251fd40d4aecaca8de695a9e813
--- /dev/null
+++ b/ftb/eval/Makefile
@@ -0,0 +1,8 @@
+
+#LANGUAGE=UD_French
+WPMLGFS_MCD_FILE=../../mcd/wpmlgfs.mcd
+WPLGFS_MCD_FILE=../../mcd/wplgfs.mcd
+TEST=../data/treebank/test.mcf
+DEV=../data/treebank/dev.mcf
+
+include ../../makefiles/eval_ud.makefile
diff --git a/ftb/maca_lemmatizer/Makefile b/ftb/maca_lemmatizer/Makefile
new file mode 100644
index 0000000000000000000000000000000000000000..0aca0791623ee752848321c912c57b6ce1119310
--- /dev/null
+++ b/ftb/maca_lemmatizer/Makefile
@@ -0,0 +1,23 @@
+DATA=../data/morpho-lexicon
+
+# "install" is a command, not a file produced by this makefile.
+.PHONY: install
+
+##-----------------------------------------------------------------------
+## compile
+##-----------------------------------------------------------------------
+
+##-----------------------------------------------------------------------
+## install
+##-----------------------------------------------------------------------
+
+# Copy the fplm lexicon into ../bin. The leading "-" lets the build
+# continue when the copy fails.
+install:
+	- cp $(DATA)/fplm ../bin
+
+##-----------------------------------------------------------------------
+## clean
+##-----------------------------------------------------------------------
+
+
diff --git a/ftb/maca_lexer/Makefile b/ftb/maca_lexer/Makefile
new file mode 100644
index 0000000000000000000000000000000000000000..78de2033cd082427e74e59f8c848cbe51e01587f
--- /dev/null
+++ b/ftb/maca_lexer/Makefile
@@ -0,0 +1,4 @@
+FPLM_FILE=../data/morpho-lexicon/fplm
+
+include ../../makefiles/maca_lexer.makefile
+
diff --git a/ftb/maca_trans_morpho/Makefile b/ftb/maca_trans_morpho/Makefile
new file mode 100644
index 0000000000000000000000000000000000000000..eae858e7a0df04e3aaa2f2b5f55ad6ab0aafdc5c
--- /dev/null
+++ b/ftb/maca_trans_morpho/Makefile
@@ -0,0 +1,23 @@
+# Variables set here before including ../../makefiles/maca_trans_morpho.makefile.
+MCF_TRAIN=../data/treebank/train.mcf
+MCF_DEV=../data/treebank/dev.mcf
+MCF_TEST=../data/treebank/test.mcf
+
+CFF_TRAIN=train.cff
+FANN_TRAIN=train.fann
+CFF_FANN_TRAIN=train.fann.cff
+CFF_CUTOFF_TRAIN=train.cutoff.cff
+PERCEPTRON_ITERATIONS=4
+CFF_CUTOFF=1
+FEATURES_MODEL_FILENAME=../../fm/maca_trans_morpho.fm
+# NOTE(review): this points at the tagger's FANN feature model; confirm that
+# is intended and not a leftover from copying maca_trans_tagger/Makefile.
+FEATURES_MODEL_FANN_FILENAME=../../fm/maca_trans_tagger_fann.fm
+VOCABS_FILENAME=maca_trans_morpho.vocab
+VOCABS_FANN_FILENAME=maca_trans_morpho_fann.vocab
+MCD_FILENAME=../../mcd/wpmlgfs.mcd
+MODEL_FILENAME=maca_trans_morpho.model
+NUMBER_OF_SENTENCES=10000000
+
+include ../../makefiles/maca_trans_morpho.makefile
+
diff --git a/ftb/maca_trans_parser/Makefile b/ftb/maca_trans_parser/Makefile
new file mode 100644
index 0000000000000000000000000000000000000000..38f5e047a685e1c17433e3fddc4d6504ba0d4364
--- /dev/null
+++ b/ftb/maca_trans_parser/Makefile
@@ -0,0 +1,21 @@
+# Variables set here before including ../../makefiles/maca_trans_parser.makefile.
+MCF_TRAIN=../data/treebank/train.mcf
+MCF_DEV=../data/treebank/dev.mcf
+MCF_TEST=../data/treebank/test.mcf
+
+CFF_TRAIN=train.cff
+CFF_FANN_TRAIN=train.fann.cff
+CFF_CUTOFF_TRAIN=train.cutoff.cff
+FANN_TRAIN=train.fann
+PERCEPTRON_ITERATIONS=5
+CFF_CUTOFF=3
+FEATURES_MODEL_FILENAME=../../fm/maca_trans_parser.fm
+FEATURES_MODEL_FANN_FILENAME=../../fm/maca_trans_parser_fann.fm
+VOCABS_FILENAME=maca_trans_parser.vocab
+VOCABS_FANN_FILENAME=maca_trans_parser_fann.vocab
+MODEL_FILENAME=maca_trans_parser.model
+NUMBER_OF_SENTENCES=10000000
+MCD_FILENAME=../../mcd/wpmlgfs.mcd
+STREAM_MODE= -S
+
+include ../../makefiles/maca_trans_parser.makefile
diff --git a/ftb/maca_trans_tagger/Makefile b/ftb/maca_trans_tagger/Makefile
new file mode 100644
index 0000000000000000000000000000000000000000..b4a2855d474f0ad5d6e60a2f1ed23e4a89265774
--- /dev/null
+++ b/ftb/maca_trans_tagger/Makefile
@@ -0,0 +1,28 @@
+# Variables set here before including ../../makefiles/maca_trans_tagger.makefile.
+MCF_TRAIN=../data/treebank/train.mcf
+MCF_DEV=../data/treebank/dev.mcf
+MCF_TEST=../data/treebank/test.mcf
+
+CFF_TRAIN=train.cff
+CFF_FANN_TRAIN=train.fann.cff
+FANN_TRAIN=train.fann
+CFF_CUTOFF_TRAIN=train.cutoff.cff
+PERCEPTRON_ITERATIONS=9
+CFF_CUTOFF=1
+FEATURES_MODEL_FILENAME=../../fm/maca_trans_tagger.fm
+FEATURES_MODEL_FANN_FILENAME=../../fm/maca_trans_tagger_fann.fm
+VOCABS_FILENAME=maca_trans_tagger.vocab
+# Named after the tagger, like VOCABS_FILENAME and MODEL_FILENAME in this file.
+VOCABS_FANN_FILENAME=maca_trans_tagger_fann.vocab
+MCD_FILENAME=../../mcd/maca_trans_tagger.mcd
+MODEL_FILENAME=maca_trans_tagger.model
+NUMBER_OF_SENTENCES=10000000
+STREAM_MODE= -S
+
+FORM_POS_FILENAME=../data/morpho-lexicon/fP
+
+#include ./maca_trans_tagger.makefile
+include ../../makefiles/maca_trans_tagger.makefile
+
+
+