From a1696024cd68e76884861c960f2a513d1db42818 Mon Sep 17 00:00:00 2001 From: Franck Dary <franck.dary@lis-lab.fr> Date: Sun, 5 Apr 2020 16:36:23 +0200 Subject: [PATCH] sequential --- UD_any/morpho/machine.rm | 2 +- UD_any/tagger/machine.rm | 2 +- UD_any/tokenizer/machine.rm | 2 +- UD_any/toketagger_incr/machine.rm | 9 +++++++++ UD_any/toketagger_seq/machine.rm | 9 +++++++++ 5 files changed, 21 insertions(+), 3 deletions(-) create mode 100644 UD_any/toketagger_incr/machine.rm create mode 100644 UD_any/toketagger_seq/machine.rm diff --git a/UD_any/morpho/machine.rm b/UD_any/morpho/machine.rm index ede473e..5c94b80 100644 --- a/UD_any/morpho/machine.rm +++ b/UD_any/morpho/machine.rm @@ -1,5 +1,5 @@ Name : Feats Machine -Classifier : feats CNN(2,2,0,{FORM,UPOS},{-1,0,1},{},{FORM,FEATS},{10,8}) data/morpho_parts.ts +Classifier : feats CNN(2,2,0,{FORM,UPOS},{-1,0,1},{},{FORM,FEATS},{10,8}) {data/morpho_parts.ts} Predictions : FEATS Strategy : sequential morpho morpho NOTHING 1 diff --git a/UD_any/tagger/machine.rm b/UD_any/tagger/machine.rm index 5e733d2..dd17940 100644 --- a/UD_any/tagger/machine.rm +++ b/UD_any/tagger/machine.rm @@ -1,5 +1,5 @@ Name : Tagger Machine -Classifier : tagger CNN(-1,{-2,-1,0,1,2},{},{FORM,UPOS},{-1,0,1},{},{ID,FORM},{1,10},-1,-1) data/tagger.ts +Classifier : tagger CNN(-1,{-2,-1,0,1,2},{},{FORM,UPOS},{-1,0,1},{},{ID,FORM},{1,10},-1,-1) {data/tagger.ts} Predictions : UPOS Strategy : sequential tagger tagger 1 diff --git a/UD_any/tokenizer/machine.rm b/UD_any/tokenizer/machine.rm index 5ff7eb2..91c0331 100644 --- a/UD_any/tokenizer/machine.rm +++ b/UD_any/tokenizer/machine.rm @@ -1,5 +1,5 @@ Name : Tokenizer Machine -Classifier : tokenizer LSTM(-1,{-3,-2,-1},{},{FORM},{-1,0},{},{ID,FORM},{1,10},5,5) data/tokenizer.ts +Classifier : tokenizer LSTM(-1,{-3,-2,-1},{},{FORM},{-1,0},{},{ID,FORM},{1,10},5,5) {data/tokenizer.ts} Splitwords : data/splitwords.ts Predictions : ID FORM EOS Strategy : sequential diff --git a/UD_any/toketagger_incr/machine.rm b/UD_any/toketagger_incr/machine.rm new file mode 100644 index 0000000..eedf496 --- /dev/null +++ b/UD_any/toketagger_incr/machine.rm @@ -0,0 +1,9 @@ +Name : Tokenizer and Tagger Machine +Classifier : toketagger LSTM(-1,{-3,-2,-1},{},{FORM,UPOS},{-1,0},{},{ID,FORM},{1,10},5,5) {data/tokenizer.ts data/tagger.ts} +Splitwords : data/splitwords.ts +Predictions : ID FORM UPOS EOS +Strategy : incremental + tokenizer tagger ENDWORD 0 + tokenizer tagger SPLIT 0 + tokenizer tokenizer 0 + tagger tokenizer 1 diff --git a/UD_any/toketagger_seq/machine.rm b/UD_any/toketagger_seq/machine.rm new file mode 100644 index 0000000..ec0efc8 --- /dev/null +++ b/UD_any/toketagger_seq/machine.rm @@ -0,0 +1,9 @@ +Name : Tokenizer and Tagger Machine +Classifier : toketagger LSTM(-1,{-3,-2,-1},{},{FORM,UPOS},{-1,0},{},{ID,FORM},{1,10},5,5) {data/tokenizer.ts data/tagger.ts} +Splitwords : data/splitwords.ts +Predictions : ID FORM UPOS EOS +Strategy : sequential + tokenizer tagger ENDWORD 1 + tokenizer tagger SPLIT 1 + tokenizer tagger 0 + tagger tokenizer 1 -- GitLab