diff --git a/tests/test_record.py b/tests/test_record.py index b4b53dcd..0b4981f6 100644 --- a/tests/test_record.py +++ b/tests/test_record.py @@ -112,16 +112,3 @@ def fnf(*args): code = r["_metadata"]["code"] assert code["error"] == "git command not found" - -# TODO Figure out how to exclude this from normal runs (or to include cache) -def test_save_a_full_run(): - load_plugins() - benchmark = GeneralPurposeAiChatBenchmark() - benchmark_scores = score_benchmarks( - [benchmark], [ModelGaugeSut.ALPACA_7B, ModelGaugeSut.LLAMA_2_7B], 30, False, True - ) - score = benchmark_scores[0] - - with open(f"benchmark_record-{benchmark.uid}.json", "w") as f: - output = benchmark_run_record(score) - json.dump(output, f, cls=BenchmarkScoreEncoder, indent=4)