From fb593c358dbdb12e5ae043766bb996f173f3eee0 Mon Sep 17 00:00:00 2001 From: Franck Dary <franck.dary@lis-lab.fr> Date: Thu, 14 Nov 2019 16:28:24 +0100 Subject: [PATCH] Added tool tagparser_sequential_strong --- .../errorCorrection.tm | 39 +++++++++ .../error_morpho.as | 5 ++ .../error_morpho.cla | 7 ++ .../error_parser.as | 5 ++ .../error_parser.cla | 7 ++ .../error_tagger.as | 5 ++ .../error_tagger.cla | 7 ++ .../lemmatizer_case.cla | 7 ++ .../lemmatizer_lookup.cla | 4 + .../lemmatizer_rules.cla | 7 ++ UD_any/tagparser_sequential_strong/machine.tm | 31 +++++++ UD_any/tagparser_sequential_strong/morpho.cla | 7 ++ UD_any/tagparser_sequential_strong/normal.tm | 31 +++++++ UD_any/tagparser_sequential_strong/parser.cla | 7 ++ .../tagparser_sequential_strong/strategy.cla | 4 + UD_any/tagparser_sequential_strong/tagger.cla | 7 ++ .../tagparser.dicts | 87 +++++++++++++++++++ UD_any/tagparser_sequential_strong/test.bd | 11 +++ UD_any/tagparser_sequential_strong/train.bd | 11 +++ 19 files changed, 289 insertions(+) create mode 100644 UD_any/tagparser_sequential_strong/errorCorrection.tm create mode 100644 UD_any/tagparser_sequential_strong/error_morpho.as create mode 100644 UD_any/tagparser_sequential_strong/error_morpho.cla create mode 100644 UD_any/tagparser_sequential_strong/error_parser.as create mode 100644 UD_any/tagparser_sequential_strong/error_parser.cla create mode 100644 UD_any/tagparser_sequential_strong/error_tagger.as create mode 100644 UD_any/tagparser_sequential_strong/error_tagger.cla create mode 100644 UD_any/tagparser_sequential_strong/lemmatizer_case.cla create mode 100644 UD_any/tagparser_sequential_strong/lemmatizer_lookup.cla create mode 100644 UD_any/tagparser_sequential_strong/lemmatizer_rules.cla create mode 100644 UD_any/tagparser_sequential_strong/machine.tm create mode 100644 UD_any/tagparser_sequential_strong/morpho.cla create mode 100644 UD_any/tagparser_sequential_strong/normal.tm create mode 100644 
UD_any/tagparser_sequential_strong/parser.cla create mode 100644 UD_any/tagparser_sequential_strong/strategy.cla create mode 100644 UD_any/tagparser_sequential_strong/tagger.cla create mode 100644 UD_any/tagparser_sequential_strong/tagparser.dicts create mode 100644 UD_any/tagparser_sequential_strong/test.bd create mode 100644 UD_any/tagparser_sequential_strong/train.bd diff --git a/UD_any/tagparser_sequential_strong/errorCorrection.tm b/UD_any/tagparser_sequential_strong/errorCorrection.tm new file mode 100644 index 0000000..1594836 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/errorCorrection.tm @@ -0,0 +1,39 @@ +Name : Tagger, Morpho, Lemmatizer, Parser with error correction +Dicts : tagparser.dicts +%CLASSIFIERS +tagger tagger.cla +morpho morpho.cla +lemma_lookup lemmatizer_lookup.cla +lemma_rules lemmatizer_rules.cla +parser parser.cla +error_tagger error_tagger.cla +error_morpho error_morpho.cla +error_parser error_parser.cla +%STATES +tagger tagger +error_tagger error_tagger +morpho morpho +error_morpho error_morpho +lemma_lookup lemma_lookup +lemma_rules lemma_rules +parser parser +error_parser_stay error_parser +error_parser_move error_parser +%TRANSITIONS +tagger error_tagger 0 * +error_tagger tagger 0 BACK +error_tagger morpho 0 * +morpho error_morpho 0 * +error_morpho morpho 0 BACK +error_morpho lemma_lookup 0 * +lemma_lookup parser 0 * +lemma_lookup lemma_rules 0 NOTFOUND +lemma_rules parser 0 * +parser error_parser_stay 0 LEFT +parser error_parser_stay 0 EOS +parser error_parser_stay 0 REDUCE +parser error_parser_stay 0 ROOT +parser error_parser_move 0 SHIFT +parser error_parser_move 0 RIGHT +error_parser_stay parser 0 * +error_parser_move parser 0 BACK diff --git a/UD_any/tagparser_sequential_strong/error_morpho.as b/UD_any/tagparser_sequential_strong/error_morpho.as new file mode 100644 index 0000000..e9182f3 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/error_morpho.as @@ -0,0 +1,5 @@ +EPSILON +BACK 1 +BACK 2 +BACK 3 +BACK 4 diff 
--git a/UD_any/tagparser_sequential_strong/error_morpho.cla b/UD_any/tagparser_sequential_strong/error_morpho.cla new file mode 100644 index 0000000..51d20a3 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/error_morpho.cla @@ -0,0 +1,7 @@ +Name : Error_Morpho +Type : Prediction +Oracle : none +Feature Model : error_morpho.fm +Action Set : error_morpho.as +Topology : M(500,RELU,0.3) +Batchsize : 10 diff --git a/UD_any/tagparser_sequential_strong/error_parser.as b/UD_any/tagparser_sequential_strong/error_parser.as new file mode 100644 index 0000000..e9182f3 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/error_parser.as @@ -0,0 +1,5 @@ +EPSILON +BACK 1 +BACK 2 +BACK 3 +BACK 4 diff --git a/UD_any/tagparser_sequential_strong/error_parser.cla b/UD_any/tagparser_sequential_strong/error_parser.cla new file mode 100644 index 0000000..99c1b13 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/error_parser.cla @@ -0,0 +1,7 @@ +Name : Error_Parser +Type : Prediction +Oracle : none +Feature Model : error_parser.fm +Action Set : error_parser.as +Topology : M(500,RELU,0.3) +Batchsize : 10 diff --git a/UD_any/tagparser_sequential_strong/error_tagger.as b/UD_any/tagparser_sequential_strong/error_tagger.as new file mode 100644 index 0000000..e9182f3 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/error_tagger.as @@ -0,0 +1,5 @@ +EPSILON +BACK 1 +BACK 2 +BACK 3 +BACK 4 diff --git a/UD_any/tagparser_sequential_strong/error_tagger.cla b/UD_any/tagparser_sequential_strong/error_tagger.cla new file mode 100644 index 0000000..b3236e6 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/error_tagger.cla @@ -0,0 +1,7 @@ +Name : Error_Tagger +Type : Prediction +Oracle : none +Feature Model : error_tagger.fm +Action Set : error_tagger.as +Topology : M(500,RELU,0.3) +Batchsize : 10 diff --git a/UD_any/tagparser_sequential_strong/lemmatizer_case.cla b/UD_any/tagparser_sequential_strong/lemmatizer_case.cla new file mode 100644 index 0000000..0fb2cc4 --- /dev/null +++ 
b/UD_any/tagparser_sequential_strong/lemmatizer_case.cla @@ -0,0 +1,7 @@ +Name : Lemmatizer_Case +Type : Prediction +Oracle : lemma_case +Feature Model : data/feature_models/lemmatizer_rules.fm +Action Set : data/lemmatizer_case.as +Topology : (300,RELU,0.1) +Dynamic : yes diff --git a/UD_any/tagparser_sequential_strong/lemmatizer_lookup.cla b/UD_any/tagparser_sequential_strong/lemmatizer_lookup.cla new file mode 100644 index 0000000..41f63b2 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/lemmatizer_lookup.cla @@ -0,0 +1,4 @@ +Name : Lemmatizer_Lookup +Type : Information +Oracle : lemma_lookup +Oracle Filename : data/maca_trans_lemmatizer_exceptions.fplm diff --git a/UD_any/tagparser_sequential_strong/lemmatizer_rules.cla b/UD_any/tagparser_sequential_strong/lemmatizer_rules.cla new file mode 100644 index 0000000..7e5320d --- /dev/null +++ b/UD_any/tagparser_sequential_strong/lemmatizer_rules.cla @@ -0,0 +1,7 @@ +Name : Lemmatizer_Rules +Type : Prediction +Oracle : lemma_rules +Feature Model : data/feature_models/lemmatizer_rules.fm +Action Set : data/lemmatizer_rules.as +Topology : (1000,RELU,0.3) +Dynamic : yes diff --git a/UD_any/tagparser_sequential_strong/machine.tm b/UD_any/tagparser_sequential_strong/machine.tm new file mode 100644 index 0000000..f1c0b0e --- /dev/null +++ b/UD_any/tagparser_sequential_strong/machine.tm @@ -0,0 +1,31 @@ +Name : Tagger, Morpho, Lemmatizer and Parser sequential Machine +Dicts : tagparser.dicts +%CLASSIFIERS +strategy strategy.cla +tagger tagger.cla +morpho morpho.cla +lemmatizer_lookup lemmatizer_lookup.cla +lemmatizer_rules lemmatizer_rules.cla +lemmatizer_case lemmatizer_case.cla +parser parser.cla +%STATES +strategy strategy +tagger tagger +morpho morpho +lemmatizer_lookup lemmatizer_lookup +lemmatizer_rules lemmatizer_rules +lemmatizer_case lemmatizer_case +parser parser +%TRANSITIONS +strategy tagger MOVE tagger +strategy morpho MOVE morpho +strategy lemmatizer_lookup MOVE lemmatizer_lookup +strategy 
lemmatizer_rules MOVE lemmatizer_rules +strategy lemmatizer_case MOVE lemmatizer_case +strategy parser MOVE parser +tagger strategy * +morpho strategy * +lemmatizer_lookup strategy * +lemmatizer_case strategy * +lemmatizer_rules strategy * +parser strategy * diff --git a/UD_any/tagparser_sequential_strong/morpho.cla b/UD_any/tagparser_sequential_strong/morpho.cla new file mode 100644 index 0000000..e31087c --- /dev/null +++ b/UD_any/tagparser_sequential_strong/morpho.cla @@ -0,0 +1,7 @@ +Name : Morpho +Type : Prediction +Oracle : morpho +Feature Model : data/feature_models/morpho.fm +Action Set : data/morpho_parts.as +Topology : (1000,RELU,0.3) +Dynamic : yes diff --git a/UD_any/tagparser_sequential_strong/normal.tm b/UD_any/tagparser_sequential_strong/normal.tm new file mode 100644 index 0000000..f1c0b0e --- /dev/null +++ b/UD_any/tagparser_sequential_strong/normal.tm @@ -0,0 +1,31 @@ +Name : Tagger, Morpho, Lemmatizer and Parser sequential Machine +Dicts : tagparser.dicts +%CLASSIFIERS +strategy strategy.cla +tagger tagger.cla +morpho morpho.cla +lemmatizer_lookup lemmatizer_lookup.cla +lemmatizer_rules lemmatizer_rules.cla +lemmatizer_case lemmatizer_case.cla +parser parser.cla +%STATES +strategy strategy +tagger tagger +morpho morpho +lemmatizer_lookup lemmatizer_lookup +lemmatizer_rules lemmatizer_rules +lemmatizer_case lemmatizer_case +parser parser +%TRANSITIONS +strategy tagger MOVE tagger +strategy morpho MOVE morpho +strategy lemmatizer_lookup MOVE lemmatizer_lookup +strategy lemmatizer_rules MOVE lemmatizer_rules +strategy lemmatizer_case MOVE lemmatizer_case +strategy parser MOVE parser +tagger strategy * +morpho strategy * +lemmatizer_lookup strategy * +lemmatizer_case strategy * +lemmatizer_rules strategy * +parser strategy * diff --git a/UD_any/tagparser_sequential_strong/parser.cla b/UD_any/tagparser_sequential_strong/parser.cla new file mode 100644 index 0000000..2d7c747 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/parser.cla @@ -0,0 +1,7 
@@ +Name : Parser +Type : Prediction +Oracle : parser +Feature Model : data/feature_models/parser.fm +Action Set : data/parser.as +Topology : (1000,RELU,0.3) +Dynamic : yes diff --git a/UD_any/tagparser_sequential_strong/strategy.cla b/UD_any/tagparser_sequential_strong/strategy.cla new file mode 100644 index 0000000..4aef7ab --- /dev/null +++ b/UD_any/tagparser_sequential_strong/strategy.cla @@ -0,0 +1,4 @@ +Name : Strategy +Type : Information +Oracle : strategy_tagger,morpho,lemmatizer,parser_sequential +Oracle Filename : none diff --git a/UD_any/tagparser_sequential_strong/tagger.cla b/UD_any/tagparser_sequential_strong/tagger.cla new file mode 100644 index 0000000..50b063e --- /dev/null +++ b/UD_any/tagparser_sequential_strong/tagger.cla @@ -0,0 +1,7 @@ +Name : Tagger +Type : Prediction +Oracle : tagger +Feature Model : data/feature_models/tagger.fm +Action Set : data/tagger.as +Topology : (1000,RELU,0.3) +Dynamic : yes diff --git a/UD_any/tagparser_sequential_strong/tagparser.dicts b/UD_any/tagparser_sequential_strong/tagparser.dicts new file mode 100644 index 0000000..0634365 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/tagparser.dicts @@ -0,0 +1,87 @@ +#Name Dimension Mode # +############################ +# TAGGER +Tagger_actions 30 Embeddings _ +Tagger_bool 30 Embeddings _ +Tagger_int 30 Embeddings _ +Tagger_eos 30 Embeddings _ +Tagger_gov 30 Embeddings _ +Tagger_pos 30 Embeddings _ +Tagger_form 100 Embeddings _ +Tagger_form.f 100 Embeddings _ +Tagger_lemma 30 Embeddings _ +Tagger_letters 30 Embeddings _ +Tagger_labels 30 Embeddings _ +Tagger_morpho 30 Embeddings _ +# MORPHO +Morpho_actions 30 Embeddings _ +Morpho_bool 30 Embeddings _ +Morpho_int 30 Embeddings _ +Morpho_eos 30 Embeddings _ +Morpho_gov 30 Embeddings _ +Morpho_pos 30 Embeddings _ +Morpho_form 30 Embeddings _ +Morpho_form.f 100 Embeddings _ +Morpho_lemma 30 Embeddings _ +Morpho_letters 30 Embeddings _ +Morpho_labels 30 Embeddings _ +Morpho_morpho 30 Embeddings _ +# LEMMATIZER 
+Lemmatizer_Rules_form 100 Embeddings +Lemmatizer_Rules_letters 30 Embeddings +Lemmatizer_Rules_pos 30 Embeddings +Lemmatizer_Rules_morpho 30 Embeddings +# LEMMATIZER_CASE +Lemmatizer_Case_form 100 Embeddings +Lemmatizer_Case_letters 30 Embeddings +Lemmatizer_Case_pos 30 Embeddings +Lemmatizer_Case_morpho 30 Embeddings +# PARSER +Parser_actions 30 Embeddings _ +Parser_bool 30 Embeddings _ +Parser_int 30 Embeddings _ +Parser_eos 30 Embeddings _ +Parser_gov 30 Embeddings _ +Parser_pos 30 Embeddings _ +Parser_form 100 Embeddings _ +Parser_form.f 100 Embeddings _ +Parser_lemma 100 Embeddings _ +Parser_letters 30 Embeddings _ +Parser_labels 30 Embeddings _ +Parser_morpho 30 Embeddings _ +# ERROR_TAGGER +Error_Tagger_actions 18 Embeddings _ +Error_Tagger_bool 16 Embeddings _ +Error_Tagger_int 16 Embeddings _ +Error_Tagger_eos 16 Embeddings _ +Error_Tagger_gov 16 Embeddings _ +Error_Tagger_pos 18 Embeddings _ +Error_Tagger_form 30 Embeddings _ +Error_Tagger_lemma 30 Embeddings _ +Error_Tagger_letters 30 Embeddings _ +Error_Tagger_labels 18 Embeddings _ +Error_Tagger_morpho 22 Embeddings _ +# ERROR_MORPHO +Error_Morpho_actions 18 Embeddings _ +Error_Morpho_bool 16 Embeddings _ +Error_Morpho_int 16 Embeddings _ +Error_Morpho_eos 16 Embeddings _ +Error_Morpho_gov 16 Embeddings _ +Error_Morpho_pos 18 Embeddings _ +Error_Morpho_form 30 Embeddings _ +Error_Morpho_lemma 30 Embeddings _ +Error_Morpho_letters 30 Embeddings _ +Error_Morpho_labels 18 Embeddings _ +Error_Morpho_morpho 22 Embeddings _ +# ERROR_PARSER +Error_Parser_actions 18 Embeddings _ +Error_Parser_bool 16 Embeddings _ +Error_Parser_int 16 Embeddings _ +Error_Parser_eos 16 Embeddings _ +Error_Parser_gov 16 Embeddings _ +Error_Parser_pos 18 Embeddings _ +Error_Parser_form 30 Embeddings _ +Error_Parser_lemma 30 Embeddings _ +Error_Parser_letters 30 Embeddings _ +Error_Parser_labels 18 Embeddings _ +Error_Parser_morpho 22 Embeddings _ diff --git a/UD_any/tagparser_sequential_strong/test.bd 
b/UD_any/tagparser_sequential_strong/test.bd new file mode 100644 index 0000000..f840332 --- /dev/null +++ b/UD_any/tagparser_sequential_strong/test.bd @@ -0,0 +1,11 @@ +#Index Name ref/hyp dict Policy Must print?# +################################################### +0 ID hyp none Final 1 +1 FORM ref form Final 1 +3 POS hyp pos Final 1 +4 XPOS hyp pos Final 1 +5 MORPHO hyp morpho Final 1 +2 LEMMA hyp form Final 1 +6 GOV hyp int Final 1 +7 LABEL hyp labels Final 1 +0 EOS hyp eos Final 0 diff --git a/UD_any/tagparser_sequential_strong/train.bd b/UD_any/tagparser_sequential_strong/train.bd new file mode 100644 index 0000000..b4073cc --- /dev/null +++ b/UD_any/tagparser_sequential_strong/train.bd @@ -0,0 +1,11 @@ +#Index Name ref/hyp dict Policy Must print?# +################################################### +0 ID hyp none FromZero 1 +1 FORM ref form FromZero 1 +3 POS hyp pos FromZero 1 +4 XPOS hyp pos FromZero 1 +5 MORPHO hyp morpho FromZero 1 +2 LEMMA hyp form FromZero 1 +6 GOV hyp int FromZero 1 +7 LABEL hyp labels FromZero 1 +0 EOS hyp eos FromZero 0 -- GitLab