diff --git a/README.md b/README.md
index 0b1171561bae6309214f0703090b8d8158c3cdd5..5301278a247e0e90235b10dc6da7af56f56ed598 100644
--- a/README.md
+++ b/README.md
@@ -41,9 +41,9 @@ The `DiMSUM` shared task provides a script called `dimsum-data/scripts/dimsumeva
 ```bash
 eval/dimsum2cupt.py --dimsum-file dimsum-data/dimsum16.test.pred > dimsum-data/dimsum16.test.pred.cupt
 # Supersense P/R/F
-eval/evaluate-ss.py --gold dimsum-data/dimsum16.train.cupt --pred dimsum-data/dimsum16.test.pred.cupt
+eval/evaluate-ss.py --gold dimsum-data/dimsum16.test.cupt --pred dimsum-data/dimsum16.test.pred.cupt
 # MWE P/R/F for exact match (MWE-based) and fuzzy match (Token-based) + some additional stats
-eval/evaluate-mwe.py --gold dimsum-data/dimsum16.train.cupt --pred dimsum-data/dimsum16.test.pred.cupt
+eval/evaluate-mwe.py --gold dimsum-data/dimsum16.test.cupt --pred dimsum-data/dimsum16.test.pred.cupt
 
 ```