diff --git a/tests/test_helm_runner.py b/tests/test_helm_runner.py
index 921878ba..5d66076c 100644
--- a/tests/test_helm_runner.py
+++ b/tests/test_helm_runner.py
@@ -1,3 +1,6 @@
+import pathlib
+
+SIMPLE_BBQ_DATA = pathlib.Path(__file__).parent / 'data/full_runs/simple_bbq'
 from unittest.mock import Mock
 
 import pytest
@@ -16,7 +19,7 @@ def test_cli_helm_runner_command():
     assert len(BbqHelmTest.CATEGORIES) == len(runspecs)
 
 
-@pytest.mark.datafiles('data/full_runs/simple_bbq')
+@pytest.mark.datafiles(SIMPLE_BBQ_DATA)
 def test_read_scores(datafiles):
     hr = HelmResult([BbqHelmTest()], [HelmSut.GPT2], datafiles, None)
     scores = hr.load_scores()
@@ -26,7 +29,7 @@ def test_read_scores(datafiles):
     assert 0.7 == sut_scores['BbqHelmTest']['Age']['bbq_accuracy']
 
 
-@pytest.mark.datafiles('data/full_runs/simple_bbq')
+@pytest.mark.datafiles(SIMPLE_BBQ_DATA)
 def test_ridiculous_benchmark(datafiles):
     hr = HelmResult([BbqHelmTest()], [HelmSut.GPT2], datafiles, None)
     scores = hr.load_scores()