From efcd95a0db0c46d2da2ad38105b476b6a9f4bd9f Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Fri, 2 Aug 2024 15:03:40 +0800 Subject: [PATCH 01/15] removed LLMs that are no longer needed Removed: mistralai/Mistral-7B-v0.1 deepseek-ai/deepseek-coder-6.7b-instruct --- python/llm/test/benchmark/arc-perf-test-batch2.yaml | 4 +--- 1 file changed, 1 insertion(+), 3 deletions(-) diff --git a/python/llm/test/benchmark/arc-perf-test-batch2.yaml b/python/llm/test/benchmark/arc-perf-test-batch2.yaml index e5863465a44..70447fd7f59 100644 --- a/python/llm/test/benchmark/arc-perf-test-batch2.yaml +++ b/python/llm/test/benchmark/arc-perf-test-batch2.yaml @@ -4,8 +4,6 @@ repo_id: - 'THUDM/chatglm3-6b-4bit' - 'baichuan-inc/Baichuan2-7B-Chat' - 'baichuan-inc/Baichuan2-13B-Chat-4bit' - - 'mistralai/Mistral-7B-v0.1' - - 'deepseek-ai/deepseek-coder-6.7b-instruct' - 'THUDM/glm-4-9b-chat' - 'openbmb/MiniCPM-2B-sft-bf16' - 'Qwen/Qwen-VL-Chat' @@ -29,4 +27,4 @@ test_api: cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu win related test_api) exclude: - 'baichuan-inc/Baichuan2-13B-Chat-4bit:2048' -task: 'continuation' # task can be 'continuation', 'QA' and 'summarize' \ No newline at end of file +task: 'continuation' # task can be 'continuation', 'QA' and 'summarize' From 2fec0ddec8dbf11a71150bc3b539ee3128e37305 Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Fri, 2 Aug 2024 15:10:14 +0800 Subject: [PATCH 02/15] Update arc-perf-test-batch4.yaml Removed: deepseek-ai/deepseek-coder-6.7b-instruct mistralai/Mistral-7B-v0.1 --- python/llm/test/benchmark/arc-perf-test-batch4.yaml | 2 -- 1 file changed, 2 deletions(-) diff --git a/python/llm/test/benchmark/arc-perf-test-batch4.yaml b/python/llm/test/benchmark/arc-perf-test-batch4.yaml index 0c83cc9b398..3bfd47963a4 100644 --- a/python/llm/test/benchmark/arc-perf-test-batch4.yaml +++ b/python/llm/test/benchmark/arc-perf-test-batch4.yaml @@ -4,8 +4,6 @@ repo_id: - 'THUDM/chatglm3-6b-4bit' - 'baichuan-inc/Baichuan2-7B-Chat' - 'baichuan-inc/Baichuan2-13B-Chat-4bit' - - 'mistralai/Mistral-7B-v0.1' #mwj: need to check - - 'deepseek-ai/deepseek-coder-6.7b-instruct' - 'THUDM/glm-4-9b-chat' - 'openbmb/MiniCPM-2B-sft-bf16' - 'Qwen/Qwen-VL-Chat' From 7224eaff0a801df1bbf60e6e7e6261a07a1f2b4c Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Fri, 2 Aug 2024 15:11:07 +0800 Subject: [PATCH 03/15] Update arc-perf-test.yaml Removed: deepseek-ai/deepseek-coder-6.7b-instruct mistralai/Mistral-7B-v0.1 --- python/llm/test/benchmark/arc-perf-test.yaml | 2 -- 1 file changed, 2 deletions(-) diff --git a/python/llm/test/benchmark/arc-perf-test.yaml b/python/llm/test/benchmark/arc-perf-test.yaml index 5298514bb09..890b8dbf470 100644 --- a/python/llm/test/benchmark/arc-perf-test.yaml +++ b/python/llm/test/benchmark/arc-perf-test.yaml @@ -4,8 +4,6 @@ repo_id: - 'THUDM/chatglm3-6b-4bit' - 'baichuan-inc/Baichuan2-7B-Chat' - 'baichuan-inc/Baichuan2-13B-Chat-4bit' - - 'mistralai/Mistral-7B-v0.1' - - 'deepseek-ai/deepseek-coder-6.7b-instruct' - 'THUDM/glm-4-9b-chat' - 'openbmb/MiniCPM-2B-sft-bf16' - 'Qwen/Qwen-VL-Chat' From f76f062971fc9d67430acd0afd25e840619b5252 Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Mon, 5 Aug 2024 16:39:58 +0800 Subject: [PATCH 04/15] Create arc-perf-transformers-438.yaml --- .../benchmark/arc-perf-transformers-438.yaml | 18 ++++++++++++++++++ 1 file changed, 18 insertions(+) create mode 100644 python/llm/test/benchmark/python/llm/test/benchmark/arc-perf-transformers-438.yaml diff --git a/python/llm/test/benchmark/python/llm/test/benchmark/arc-perf-transformers-438.yaml b/python/llm/test/benchmark/python/llm/test/benchmark/arc-perf-transformers-438.yaml new file mode 100644 index 00000000000..eda2815e9df --- /dev/null +++ b/python/llm/test/benchmark/python/llm/test/benchmark/arc-perf-transformers-438.yaml @@ -0,0 +1,18 @@ +# For the models that require transformers 4.38.2 +repo_id: + - 'stablelm/stablelm-zephyr-3b' + - 'Gemma/gemma-7b-it' +local_model_hub: '/mnt/disk1/models' +warm_up: 1 +num_trials: 3 +num_beams: 1 # default to greedy search +low_bit: 'sym_int4' # default to use 'sym_int4' (i.e. symmetric int4) +batch_size: 1 # default to 1 +in_out_pairs: + - '32-32' + - '1024-128' + - '2048-256' +test_api: + - "transformer_int4_fp16_gpu" # on Intel GPU +cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu win related test_api) +task: 'continuation' # task can be 'continuation', 'QA' and 'summarize' From ed190cf270150b2c0e9fe3c8db218a731f43bb32 Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Mon, 5 Aug 2024 16:48:28 +0800 Subject: [PATCH 05/15] Moved arc-perf-transformers-438.yaml location --- .../llm/test/benchmark => }/arc-perf-transformers-438.yaml | 0 1 file changed, 0 insertions(+), 0 deletions(-) rename python/llm/test/benchmark/{python/llm/test/benchmark => }/arc-perf-transformers-438.yaml (100%) diff --git a/python/llm/test/benchmark/python/llm/test/benchmark/arc-perf-transformers-438.yaml b/python/llm/test/benchmark/arc-perf-transformers-438.yaml similarity index 100% rename from python/llm/test/benchmark/python/llm/test/benchmark/arc-perf-transformers-438.yaml rename to python/llm/test/benchmark/arc-perf-transformers-438.yaml From fcc12ae948e86a98bcc72bf454f0f3559f1050ca Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Mon, 5 Aug 2024 16:58:58 +0800 Subject: [PATCH 06/15] Create arc-perf-transformers-438-batch2.yaml --- .../arc-perf-transformers-438-batch2.yaml | 18 ++++++++++++++++++ 1 file changed, 18 insertions(+) create mode 100644 python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml diff --git a/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml b/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml new file mode 100644 index 00000000000..3c9fa68bd10 --- /dev/null +++ b/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml @@ -0,0 +1,18 @@ +# For the models that require transformers 4.38.2 +repo_id: + - 'stablelm/stablelm-zephyr-3b' + - 'Gemma/gemma-7b-it' +local_model_hub: '/mnt/disk1/models' +warm_up: 1 +num_trials: 3 +num_beams: 1 # default to greedy search +low_bit: 'sym_int4' # default to use 'sym_int4' (i.e. symmetric int4) +batch_size: 2 # default to 1 +in_out_pairs: + - '32-32' + - '1024-128' + - '2048-256' +test_api: + - "transformer_int4_fp16_gpu" # on Intel GPU +cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu win related test_api) +task: 'continuation' # task can be 'continuation', 'QA' and 'summarize' From 2e629fc824910377cf44b13bec360cbb2a4de285 Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Mon, 5 Aug 2024 17:03:44 +0800 Subject: [PATCH 07/15] Create arc-perf-transformers-438-batch4.yaml --- .../arc-perf-transformers-438-batch4.yaml | 20 +++++++++++++++++++ 1 file changed, 20 insertions(+) create mode 100644 python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml diff --git a/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml b/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml new file mode 100644 index 00000000000..f7499fe8806 --- /dev/null +++ b/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml @@ -0,0 +1,20 @@ +# For the models that require transformers 4.38.2 +repo_id: + - 'stablelm/stablelm-zephyr-3b' + - 'Gemma/gemma-7b-it' +local_model_hub: '/mnt/disk1/models' +warm_up: 1 +num_trials: 3 +num_beams: 1 # default to greedy search +low_bit: 'sym_int4' # default to use 'sym_int4' (i.e. symmetric int4) +batch_size: 4 # default to 1 +in_out_pairs: + - '32-32' + - '1024-128' + - '2048-256' +test_api: + - "transformer_int4_fp16_gpu" # on Intel GPU +cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu win related test_api) +exclude: + - 'Gemma/gemma-7b-it:2048' +task: 'continuation' # task can be 'continuation', 'QA' and 'summarize' From 4a818a161dc1cacea309ef19310287f3775702b1 Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Tue, 6 Aug 2024 16:49:53 +0800 Subject: [PATCH 08/15] Update llm_performance_tests.yml to include transformer 4.38.2 --- .github/workflows/llm_performance_tests.yml | 32 +++++++++++++++++++++ 1 file changed, 32 insertions(+) diff --git a/.github/workflows/llm_performance_tests.yml b/.github/workflows/llm_performance_tests.yml index 9185e4282d5..00ce9bc07e7 100644 --- a/.github/workflows/llm_performance_tests.yml +++ b/.github/workflows/llm_performance_tests.yml @@ -213,6 +213,38 @@ jobs: sed -i 's/batch2/batch4/g' run.py python run.py mv *.csv test_batch4 + + - name: Test on xpu(transformers==4.38.2) + shell: bash + run: | + source /opt/intel/oneapi/setvars.sh + export USE_XETLA=OFF + export SYCL_PI_LEVEL_ZERO_USE_IMMEDIATE_COMMANDLISTS=1 + # upgrade transformers for model stablelm/stablelm-zephyr-3b & Gemma/gemma-7b-it + python -m pip install transformers==4.38.2 + # batch_size 1 + cp python/llm/test/benchmark/arc-perf-transformers-438.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cd python/llm/dev/benchmark/all-in-one + # change csv name + sed -i 's/test1_batch4/test2_batch1/g' run.py + python run.py + mv *.csv test_batch1 + # batch_size 2 + cd ../../../../../ + cp python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cd python/llm/dev/benchmark/all-in-one + # change csv name + sed -i 's/batch1/batch2/g' run.py + python run.py + mv *.csv test_batch2 + # batch_size 4 + cd ../../../../../ + cp python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cd python/llm/dev/benchmark/all-in-one + # change csv name + sed -i 's/batch2/batch4/g' run.py + python run.py + mv *.csv test_batch4 - name: Test on xpu(transformers==4.40.0) shell: bash From 420d2136624aa81367e11e5e1dc4eb8d4cb8982e Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Wed, 7 Aug 2024 17:42:05 +0800 Subject: [PATCH 09/15] Update arc-perf-transformers-438-batch2.yaml Disabled Gemma/gemma-7b-it for now --- python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml b/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml index 3c9fa68bd10..41e54326b4e 100644 --- a/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml +++ b/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml @@ -1,7 +1,7 @@ # For the models that require transformers 4.38.2 repo_id: - 'stablelm/stablelm-zephyr-3b' - - 'Gemma/gemma-7b-it' + #- 'Gemma/gemma-7b-it' #Temporarily removed due to performance issues local_model_hub: '/mnt/disk1/models' warm_up: 1 num_trials: 3 From 727a97e99cbb784a246edb1a1f34a85334ed4f37 Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Wed, 7 Aug 2024 17:43:05 +0800 Subject: [PATCH 10/15] Update arc-perf-transformers-438-batch4.yaml Disabled Gemma/gemma-7b-it for now --- .../test/benchmark/arc-perf-transformers-438-batch4.yaml | 6 +++--- 1 file changed, 3 insertions(+), 3 deletions(-) diff --git a/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml b/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml index f7499fe8806..82393e67355 100644 --- a/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml +++ b/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml @@ -1,7 +1,7 @@ # For the models that require transformers 4.38.2 repo_id: - 'stablelm/stablelm-zephyr-3b' - - 'Gemma/gemma-7b-it' + #- 'Gemma/gemma-7b-it' #disabled due to performance issues local_model_hub: '/mnt/disk1/models' warm_up: 1 num_trials: 3 @@ -15,6 +15,6 @@ in_out_pairs: test_api: - "transformer_int4_fp16_gpu" # on Intel GPU cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu win related test_api) -exclude: - - 'Gemma/gemma-7b-it:2048' +#exclude: + #- 'Gemma/gemma-7b-it:2048' task: 'continuation' # task can be 'continuation', 'QA' and 'summarize' From a68e7c9095db3db8e7302c8d470bd7356bdc3910 Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Wed, 7 Aug 2024 17:43:40 +0800 Subject: [PATCH 11/15] Update arc-perf-transformers-438.yaml Disabled Gemma/gemma-7b-it for now --- python/llm/test/benchmark/arc-perf-transformers-438.yaml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/python/llm/test/benchmark/arc-perf-transformers-438.yaml b/python/llm/test/benchmark/arc-perf-transformers-438.yaml index eda2815e9df..a8b31cfe327 100644 --- a/python/llm/test/benchmark/arc-perf-transformers-438.yaml +++ b/python/llm/test/benchmark/arc-perf-transformers-438.yaml @@ -1,7 +1,7 @@ # For the models that require transformers 4.38.2 repo_id: - 'stablelm/stablelm-zephyr-3b' - - 'Gemma/gemma-7b-it' + #- 'Gemma/gemma-7b-it' #disabled due to performance issues local_model_hub: '/mnt/disk1/models' warm_up: 1 num_trials: 3 From 95a4fc014b4a8130bd216737d2b061188af1bfc4 Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Wed, 7 Aug 2024 17:52:48 +0800 Subject: [PATCH 12/15] Update llm_performance_tests.yml --- .github/workflows/llm_performance_tests.yml | 64 ++++++++++----------- 1 file changed, 32 insertions(+), 32 deletions(-) diff --git a/.github/workflows/llm_performance_tests.yml b/.github/workflows/llm_performance_tests.yml index 00ce9bc07e7..e7b1b890c93 100644 --- a/.github/workflows/llm_performance_tests.yml +++ b/.github/workflows/llm_performance_tests.yml @@ -145,85 +145,85 @@ jobs: python -m pip install --upgrade expecttest bash python/llm/test/run-llm-install-tests.sh - - name: Test on xpu(transformers==4.36.2) + - name: Test on xpu(transformers==4.38.2) shell: bash run: | - date_for_test_version=$(date -d yesterday +%Y-%m-%d) - sed -i "s/date.today()/\"$date_for_test_version\"/g" python/llm/dev/benchmark/all-in-one/run.py source /opt/intel/oneapi/setvars.sh export USE_XETLA=OFF export SYCL_PI_LEVEL_ZERO_USE_IMMEDIATE_COMMANDLISTS=1 - cp python/llm/test/benchmark/arc-perf-test.yaml python/llm/dev/benchmark/all-in-one/config.yaml - cd python/llm/dev/benchmark/all-in-one - mkdir test_batch1 - mkdir test_batch2 - mkdir test_batch4 + # upgrade transformers for model stablelm/stablelm-zephyr-3b & Gemma/gemma-7b-it + python -m pip install transformers==4.38.2 # batch_size 1 - # hide time info - sed -i 's/str(end - st)/"xxxxxx"/g' run.py + cp python/llm/test/benchmark/arc-perf-transformers-438.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cd python/llm/dev/benchmark/all-in-one # change csv name - sed -i 's/{today}/{today}_test1_batch1/g' run.py + sed -i 's/test1_batch4/test2_batch1/g' run.py python run.py mv *.csv test_batch1 # batch_size 2 cd ../../../../../ - cp python/llm/test/benchmark/arc-perf-test-batch2.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cp python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml python/llm/dev/benchmark/all-in-one/config.yaml cd python/llm/dev/benchmark/all-in-one - # change csv name + # change csv name sed -i 's/batch1/batch2/g' run.py python run.py mv *.csv test_batch2 # batch_size 4 cd ../../../../../ - cp python/llm/test/benchmark/arc-perf-test-batch4.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cp python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml python/llm/dev/benchmark/all-in-one/config.yaml cd python/llm/dev/benchmark/all-in-one - # change csv name + # change csv name sed -i 's/batch2/batch4/g' run.py python run.py mv *.csv test_batch4 - - - name: Test on xpu(transformers==4.37.0) + + - name: Test on xpu(transformers==4.36.2) shell: bash run: | + date_for_test_version=$(date -d yesterday +%Y-%m-%d) + sed -i "s/date.today()/\"$date_for_test_version\"/g" python/llm/dev/benchmark/all-in-one/run.py source /opt/intel/oneapi/setvars.sh export USE_XETLA=OFF export SYCL_PI_LEVEL_ZERO_USE_IMMEDIATE_COMMANDLISTS=1 - # upgrade transformers for model Qwen/Qwen1.5-7B-Chat - python -m pip install transformers==4.37.0 - # batch_size 1 - cp python/llm/test/benchmark/arc-perf-transformers-437.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cp python/llm/test/benchmark/arc-perf-test.yaml python/llm/dev/benchmark/all-in-one/config.yaml cd python/llm/dev/benchmark/all-in-one + mkdir test_batch1 + mkdir test_batch2 + mkdir test_batch4 + # batch_size 1 + # hide time info + sed -i 's/str(end - st)/"xxxxxx"/g' run.py # change csv name - sed -i 's/test1_batch4/test2_batch1/g' run.py + sed -i 's/{today}/{today}_test1_batch1/g' run.py python run.py mv *.csv test_batch1 # batch_size 2 cd ../../../../../ - cp python/llm/test/benchmark/arc-perf-transformers-437-batch2.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cp python/llm/test/benchmark/arc-perf-test-batch2.yaml python/llm/dev/benchmark/all-in-one/config.yaml cd python/llm/dev/benchmark/all-in-one - # change csv name + # change csv name sed -i 's/batch1/batch2/g' run.py python run.py mv *.csv test_batch2 # batch_size 4 cd ../../../../../ - cp python/llm/test/benchmark/arc-perf-transformers-437-batch4.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cp python/llm/test/benchmark/arc-perf-test-batch4.yaml python/llm/dev/benchmark/all-in-one/config.yaml cd python/llm/dev/benchmark/all-in-one - # change csv name + # change csv name sed -i 's/batch2/batch4/g' run.py python run.py mv *.csv test_batch4 - - name: Test on xpu(transformers==4.38.2) + - name: Test on xpu(transformers==4.37.0) shell: bash run: | source /opt/intel/oneapi/setvars.sh export USE_XETLA=OFF export SYCL_PI_LEVEL_ZERO_USE_IMMEDIATE_COMMANDLISTS=1 - # upgrade transformers for model stablelm/stablelm-zephyr-3b & Gemma/gemma-7b-it - python -m pip install transformers==4.38.2 + # upgrade transformers for model Qwen/Qwen1.5-7B-Chat + python -m pip install transformers==4.37.0 # batch_size 1 - cp python/llm/test/benchmark/arc-perf-transformers-438.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cp python/llm/test/benchmark/arc-perf-transformers-437.yaml python/llm/dev/benchmark/all-in-one/config.yaml cd python/llm/dev/benchmark/all-in-one # change csv name sed -i 's/test1_batch4/test2_batch1/g' run.py @@ -231,7 +231,7 @@ jobs: mv *.csv test_batch1 # batch_size 2 cd ../../../../../ - cp python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cp python/llm/test/benchmark/arc-perf-transformers-437-batch2.yaml python/llm/dev/benchmark/all-in-one/config.yaml cd python/llm/dev/benchmark/all-in-one # change csv name sed -i 's/batch1/batch2/g' run.py @@ -239,7 +239,7 @@ jobs: mv *.csv test_batch2 # batch_size 4 cd ../../../../../ - cp python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml python/llm/dev/benchmark/all-in-one/config.yaml + cp python/llm/test/benchmark/arc-perf-transformers-437-batch4.yaml python/llm/dev/benchmark/all-in-one/config.yaml cd python/llm/dev/benchmark/all-in-one # change csv name sed -i 's/batch2/batch4/g' run.py From 917a2d2e3c35bf018d195e083fc00332c3a72d47 Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Wed, 7 Aug 2024 17:59:41 +0800 Subject: [PATCH 13/15] Update arc-perf-transformers-438-batch2.yaml --- python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml | 1 - 1 file changed, 1 deletion(-) diff --git a/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml b/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml index 41e54326b4e..46c3905782c 100644 --- a/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml +++ b/python/llm/test/benchmark/arc-perf-transformers-438-batch2.yaml @@ -1,7 +1,6 @@ # For the models that require transformers 4.38.2 repo_id: - 'stablelm/stablelm-zephyr-3b' - #- 'Gemma/gemma-7b-it' #Temporarily removed due to performance issues local_model_hub: '/mnt/disk1/models' warm_up: 1 num_trials: 3 From 805c556671e5828d4dd0f96dcf26b90828636702 Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Wed, 7 Aug 2024 18:00:10 +0800 Subject: [PATCH 14/15] Update arc-perf-transformers-438-batch4.yaml --- .../llm/test/benchmark/arc-perf-transformers-438-batch4.yaml | 3 --- 1 file changed, 3 deletions(-) diff --git a/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml b/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml index 82393e67355..598b5ce1771 100644 --- a/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml +++ b/python/llm/test/benchmark/arc-perf-transformers-438-batch4.yaml @@ -1,7 +1,6 @@ # For the models that require transformers 4.38.2 repo_id: - 'stablelm/stablelm-zephyr-3b' - #- 'Gemma/gemma-7b-it' #disabled due to performance issues local_model_hub: '/mnt/disk1/models' warm_up: 1 num_trials: 3 @@ -15,6 +14,4 @@ in_out_pairs: test_api: - "transformer_int4_fp16_gpu" # on Intel GPU cpu_embedding: False # whether put embedding to CPU (only avaiable now for gpu win related test_api) -#exclude: - #- 'Gemma/gemma-7b-it:2048' task: 'continuation' # task can be 'continuation', 'QA' and 'summarize' From bf40d9538f09f47f5f4732e3cb95f1f0b6fa084f Mon Sep 17 00:00:00 2001 From: SichengStevenLi <144295301+SichengStevenLi@users.noreply.github.com> Date: Wed, 7 Aug 2024 18:00:25 +0800 Subject: [PATCH 15/15] Update arc-perf-transformers-438.yaml --- python/llm/test/benchmark/arc-perf-transformers-438.yaml | 1 - 1 file changed, 1 deletion(-) diff --git a/python/llm/test/benchmark/arc-perf-transformers-438.yaml b/python/llm/test/benchmark/arc-perf-transformers-438.yaml index a8b31cfe327..02065068962 100644 --- a/python/llm/test/benchmark/arc-perf-transformers-438.yaml +++ b/python/llm/test/benchmark/arc-perf-transformers-438.yaml @@ -1,7 +1,6 @@ # For the models that require transformers 4.38.2 repo_id: - 'stablelm/stablelm-zephyr-3b' - #- 'Gemma/gemma-7b-it' #disabled due to performance issues local_model_hub: '/mnt/disk1/models' warm_up: 1 num_trials: 3