Enabled AMD implementation for llama2

GATEOverflow · Oct 19, 2024 · 148650d · 148650d
1 parent fa0eeca
commit 148650d
Show file tree

Hide file tree

Showing 2 changed files with 11 additions and 0 deletions.
diff --git a/docs/benchmarks/language/llama2-70b.md b/docs/benchmarks/language/llama2-70b.md
@@ -25,3 +25,10 @@ hide:
 {{ mlperf_inference_implementation_readme (4, "llama2-70b-99", "neuralmagic") }}
 
 {{ mlperf_inference_implementation_readme (4, "llama2-70b-99.9", "neuralmagic") }}
+
+=== "AMD"
+    ## AMD MLPerf Implementation
+
+{{ mlperf_inference_implementation_readme (4, "llama2-70b-99", "amd") }}
+
+{{ mlperf_inference_implementation_readme (4, "llama2-70b-99.9", "amd") }}
diff --git a/main.py b/main.py
@@ -43,6 +43,10 @@ def mlperf_inference_implementation_readme(spaces, model, implementation, *, imp
             devices = [ "CUDA" ]
             frameworks = [ "TensorRT" ]
 
+        elif implementation == "amd":
+            devices = [ "ROCm" ]
+            frameworks = [ "pytorch" ]
+
         elif implementation == "neuralmagic":
             devices = [ "CUDA" ]
             frameworks = [ "pytorch" ]