diff --git a/evoprompt/task/task.py b/evoprompt/task/task.py
index 8588373da5a40568cabf481639f66687025b1bc0..1ba13ff1c6dba2b14e5eba297e49b3f047379d0f 100644
--- a/evoprompt/task/task.py
+++ b/evoprompt/task/task.py
@@ -328,7 +328,7 @@ class Task(metaclass=ABCMeta):
             lambda _, idx: idx in samples_ids, with_indices=True
         )
         # remove demonstration samples from validation set
-        remaining_dataset = self.dataset.filter(
+        remaining_dataset = dataset.filter(
             lambda _, idx: idx not in samples_ids, with_indices=True
         )
         return demonstration_samples, remaining_dataset