diff --git a/Config.py b/Config.py
index b26a9651f775cd0a0f08d9dc754c858f29207e06..e7776808d6c31cd8fd1f9064af61b76a7647d847 100644
--- a/Config.py
+++ b/Config.py
@@ -90,11 +90,13 @@ class Config :
     printedCols = ["ID","FORM","UPOS","HEAD","DEPREL"]
     left = 5
     right = 5
+    historySize = 8
+    historyPopSize = 6
     print("state :", self.state, file=output)
-    print("stack :",[self.getAsFeature(ind, "ID") for ind in self.stack], file=output)
+    print("stack :",[int(self.getAsFeature(ind, "ID")) for ind in self.stack], file=output)
     print("nbUndone :", self.nbUndone, file=output)
-    print("history :",[str(trans) for trans in self.history], file=output)
-    print("historyPop :",[(str(c[0]),"dat:"+str(c[1]),"mvt:"+str(c[2]),"reward:"+str(c[3]),"state:"+str(c[4])) for c in self.historyPop], file=output)
+    print("history :",[str(trans) for trans in self.history[-historySize:]], file=output)
+    print("historyPop :",[(str(c[0]),"reward:"+str(c[3])) for c in self.historyPop[-historyPopSize:]], file=output)
     toPrint = []
     for lineIndex in range(self.wordIndex-left, self.wordIndex+right) :
       if lineIndex not in range(len(self.lines)) :
diff --git a/Train.py b/Train.py
index ca196577125a532909212daf27bfb76c53e1407d..de8482e62c7b40b7b4f4187f2cc76708855ed3d5 100644
--- a/Train.py
+++ b/Train.py
@@ -271,6 +271,7 @@ def trainModelRl(debug, networkName, modelDir, filename, nbIter, batchSize, devF
         probaOracle = list_probas[fromState][1]
         
         if debug :
+          print("-"*80, file=sys.stderr)
           sentence.printForDebug(sys.stderr)
         action = selectAction(policy_net, state, transitionSet, sentence, missingLinks, probaRandom, probaOracle, fromState)