diff --git a/.gitlab-ci.yml b/.gitlab-ci.yml
index 6bf5a199848da1eaca03387941eb7d62cd833bdc..776cec549221207595108e3adaad01d6e8017fd4 100644
--- a/.gitlab-ci.yml
+++ b/.gitlab-ci.yml
@@ -32,7 +32,7 @@ test_benchmark:
   script:
     - docker pull $CONTAINER_TEST_IMAGE
     - docker run $CONTAINER_TEST_IMAGE /ttc18/gradlew benchmarkFull -Pscenario=0,small 2>&1 | tee benchmarkFull.log
-    - ! grep "BUILD FAILED" benchmarkFull.log
+    - 'rc=0; grep "BUILD FAILED" benchmarkFull.log || rc=$?; test "$rc" -eq 1'  # grep exit 1 = no match
 
 test_unit_tests:
   stage: test