Skip to content
Snippets Groups Projects
Commit 68c6a57f authored by Alexis Nasr
Browse files

added fr/maca_trans_lemmatizer and makefile to compile data for rule based lemmatization

parent f4cb9eeb
No related branches found
No related tags found
No related merge requests found
...@@ -8,6 +8,7 @@ compile: ...@@ -8,6 +8,7 @@ compile:
$(MAKE) -C maca_lexer compile $(MAKE) -C maca_lexer compile
$(MAKE) -C maca_trans_tagger compile $(MAKE) -C maca_trans_tagger compile
$(MAKE) -C maca_trans_morpho compile $(MAKE) -C maca_trans_morpho compile
$(MAKE) -C maca_trans_lemmatizer compile
$(MAKE) -C maca_trans_parser compile $(MAKE) -C maca_trans_parser compile
# $(MAKE) -C maca_trans_parser_nn compile # $(MAKE) -C maca_trans_parser_nn compile
# $(MAKE) -C maca_crf_tagger compile # $(MAKE) -C maca_crf_tagger compile
...@@ -18,7 +19,7 @@ install: ...@@ -18,7 +19,7 @@ install:
$(MAKE) -C maca_trans_morpho install $(MAKE) -C maca_trans_morpho install
$(MAKE) -C maca_trans_parser install $(MAKE) -C maca_trans_parser install
# $(MAKE) -C maca_trans_parser_nn install # $(MAKE) -C maca_trans_parser_nn install
$(MAKE) -C maca_lemmatizer install $(MAKE) -C maca_trans_lemmatizer install
$(MAKE) -C maca_lexer install $(MAKE) -C maca_lexer install
# $(MAKE) -C maca_crf_tagger install # $(MAKE) -C maca_crf_tagger install
# @tar -cvzf ./maca_datas.tgz bin # @tar -cvzf ./maca_datas.tgz bin
...@@ -33,6 +34,7 @@ clean: ...@@ -33,6 +34,7 @@ clean:
$(MAKE) -C maca_trans_parser clean $(MAKE) -C maca_trans_parser clean
# $(MAKE) -C maca_trans_parser_nn clean # $(MAKE) -C maca_trans_parser_nn clean
$(MAKE) -C maca_trans_morpho clean $(MAKE) -C maca_trans_morpho clean
$(MAKE) -C maca_trans_lemmatizer clean
$(MAKE) -C maca_trans_tagger clean $(MAKE) -C maca_trans_tagger clean
$(MAKE) -C maca_crf_tagger clean $(MAKE) -C maca_crf_tagger clean
$(MAKE) -C eval clean $(MAKE) -C eval clean
# Per-language settings for building the rule-based lemmatizer data.
# This file only defines variables; the compile/install/clean rules come from
# the shared makefile included on the last line.
# NOTE(review): presumably this is fr/maca_trans_lemmatizer/Makefile — confirm.
#
# Treebank splits in MCF format. MCF_TRAIN is the -i input of
# maca_trans_lemmatizer_mcf2cff; MCF_DEV and MCF_TEST are not referenced by the
# visible rules — TODO confirm whether they are used elsewhere.
MCF_TRAIN=../data/treebank/train.mcf
MCF_DEV=../data/treebank/dev.mcf
MCF_TEST=../data/treebank/test.mcf
# Training file written by maca_trans_lemmatizer_mcf2cff (-x) and read by
# perceptron_train (--cff).
CFF_TRAIN=train.cff
# Model file written by perceptron_train (--model).
MODEL_FILENAME=maca_trans_lemmatizer.model
# Rules file written by maca_compute_l_rules (-r) and passed to
# maca_trans_lemmatizer_mcf2cff (-l).
RULES_FILENAME=maca_trans_lemmatizer_rules.txt
# Exceptions file passed to maca_compute_l_rules (-e) and to
# maca_trans_lemmatizer_mcf2cff (-w).
EXCEPTIONS_FPLM_FILENAME=maca_trans_lemmatizer_exceptions.fplm
# Vocabulary file passed to maca_trans_lemmatizer_mcf2cff (-V).
VOCABS_FILENAME=maca_trans_lemmatizer.vocab
# Feature-model file passed to maca_trans_lemmatizer_mcf2cff (-F).
FEATURES_MODEL_FILENAME=maca_trans_lemmatizer.fm
# Lexicon passed to maca_compute_l_rules (-f).
FPLM_FILENAME=../data/morpho-lexicon/fplm
# Value passed to maca_compute_l_rules as -t.
# NOTE(review): exact meaning of the threshold is defined by that tool — confirm.
THRESHOLD=50
# Extra flag passed verbatim to maca_compute_l_rules.
STRICT=-s
# Pulls in the shared compile/install/clean rules that consume the variables above.
include ../../makefiles/maca_trans_lemmatizer.makefile
...@@ -17,5 +17,12 @@ ...@@ -17,5 +17,12 @@
#b0s4 #b0s4
#b0s5 #b0s5
b0p b0s1 b0s2 b0p b0s1 b0s2
b0p b0s2 b0s3
b0p b0s3 b0s4
b0p b0s4 b0s5
b0p b0s5 b0s6
b0p b0s1 b0s2
b0p b0s1 b0s2 b0s3 b0p b0s1 b0s2 b0s3
b0p b0s1 b0s2 b0s3 b0s4 b0p b0s1 b0s2 b0s3 b0s4
b0p b0s1 b0s2 b0s3 b0s4 b0s5
b0p b0s1 b0s2 b0s3 b0s4 b0s5 b0s6
DATA=../data/morpho-lexicon
THRESHOLD=100
STRICT=-s
##----------------------------------------------------------------------- ##-----------------------------------------------------------------------
## compile ## compile
##----------------------------------------------------------------------- ##-----------------------------------------------------------------------
model : cff compile: $(MODEL_FILENAME)
perceptron_train --cff $< --model model -n 4
$(RULES_FILENAME):
maca_compute_l_rules -f $(FPLM_FILENAME) -e $(EXCEPTIONS_FPLM_FILENAME) -r $(RULES_FILENAME) $(STRICT) -t $(THRESHOLD)
cff: rules $(CFF_TRAIN): $(RULES_FILENAME)
maca_trans_lemmatizer_mcf2cff -f exceptions.fplm -x cff -i ../data/treebank/train.mcf -F maca_trans_lemmatizer.fm -V dico maca_trans_lemmatizer_mcf2cff -w $(EXCEPTIONS_FPLM_FILENAME) -x $(CFF_TRAIN) -i $(MCF_TRAIN) -F $(FEATURES_MODEL_FILENAME) -V $(VOCABS_FILENAME) -l $(RULES_FILENAME)
rules: $(MODEL_FILENAME) : $(CFF_TRAIN)
maca_compute_l_rules -f ../data/morpho-lexicon/fplm -e exceptions.fplm -r rules $(STRICT) -t $(THRESHOLD) perceptron_train --cff $< --model $(MODEL_FILENAME) -n 4
##----------------------------------------------------------------------- ##-----------------------------------------------------------------------
## install ## install
##----------------------------------------------------------------------- ##-----------------------------------------------------------------------
install: install:
- cp $(DATA)/fplm ../bin - cp $(RULES_FILENAME) ../bin
- cp $(FEATURES_MODEL_FILENAME) ../bin
- cp $(MODEL_FILENAME) ../bin
- cp $(EXCEPTIONS_FPLM_FILENAME) ../bin
- cp $(VOCABS_FILENAME) ../bin
##----------------------------------------------------------------------- ##-----------------------------------------------------------------------
## clean ## clean
##----------------------------------------------------------------------- ##-----------------------------------------------------------------------
clean: clean:
-rm rules -rm $(RULES_FILENAME)
-rm exceptions.fplm -rm $(EXCEPTIONS_FPLM_FILENAME)
-rm cff -rm $(CFF_TRAIN)
-rm model -rm $(MODEL_FILENAME)
-rm $(VOCABS_FILENAME)
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment