diff --git a/UD_any/tokeparser_seq/machine.rm b/UD_any/tokeparser_seq/machine.rm new file mode 100644 index 0000000000000000000000000000000000000000..eef1d6912e8b3b2d0384fe63f53d34a62370f1e0 --- /dev/null +++ b/UD_any/tokeparser_seq/machine.rm @@ -0,0 +1,42 @@ +Name : Tokenizer, Tagger, Morpho and Parser Machine +Classifier : tokemorpho +{ + Transitions : {data/tokenizer.ts data/tagger.ts data/morpho_parts.ts data/parser.ts} + Network type : LSTM + Unknown value threshold : -1 + Buffer context : {-5 -4 -3 -2 -1 1 2} + Stack context : {} + Columns : {FORM UPOS} + Focused buffer : {-1 0} + Focused stack : {} + Focused columns : {ID FORM FEATS} + Max nb elements : {1 10 10} + Raw input left window : 5 + Raw input right window : 5 + Embeddings size : 256 + MLP : {2048 0.3 2048 0.3} + Context LSTM size : 512 + Focused LSTM size : 256 + Rawinput LSTM size : 64 + Split trans LSTM size : 256 + Num layers : 3 + BiLSTM : true + LSTM dropout : 0.3 + Tree embedding columns : {DEPREL} + Tree embedding buffer : {-1} + Tree embedding stack : {0} + Tree embedding nb : {5 10} + Tree embedding size : 128 +} +Splitwords : data/splitwords.ts +Predictions : ID FORM UPOS FEATS HEAD DEPREL EOS +Strategy : sequential + tokenizer tagger ENDWORD 1 + tokenizer tagger SPLIT 1 + tokenizer tagger 0 + tagger morpho 1 + morpho parser NOTHING 1 + morpho parser 0 + parser tokenizer SHIFT 1 + parser tokenizer RIGHT 1 + parser tokenizer 0