From 09ef5b3467fc6fcba8d23bb5754454e6eac250d2 Mon Sep 17 00:00:00 2001
From: Masahiro Masuda
Date: Thu, 11 Jan 2024 00:49:59 +0000
Subject: [PATCH] fix

---
 examples/python/run_llama_batched_vllm.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/examples/python/run_llama_batched_vllm.py b/examples/python/run_llama_batched_vllm.py
index 5cb7f52ae6..dcb16a878d 100644
--- a/examples/python/run_llama_batched_vllm.py
+++ b/examples/python/run_llama_batched_vllm.py
@@ -277,7 +277,7 @@ def _prepare_eval_queries(
         if sliding_window:
             seq_lens.append(min(num_past_tokens + num_queries, sliding_window))
             num_past = min(num_past_tokens, sliding_window)
-            past_slot_mapping += all_slot_mappings[request_id][num_past:]
+            past_slot_mapping += all_slot_mappings[request_id][:num_past]
             slot_mapping += all_slot_mappings[request_id][num_past: num_past + num_queries]
         else:
             seq_lens.append(num_past_tokens + num_queries)
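
For context, a minimal standalone sketch of the slicing semantics the one-line fix restores: the first `num_past` entries of a request's slot mapping hold the past (context) tokens, and the `num_queries` entries after them hold the tokens being evaluated, so taking `[num_past:]` for the past handed over the query slots instead. The names `all_slot_mappings`, `request_id`, `num_past`, and `num_queries` mirror the patched hunk; the toy slot values are hypothetical.

```python
# Hypothetical slot mapping for one request: 3 past tokens + 2 query tokens.
all_slot_mappings = {"req-0": [10, 11, 12, 13, 14]}
request_id = "req-0"
num_past = 3      # past tokens, already capped at sliding_window upstream
num_queries = 2   # tokens being evaluated in this call

# Buggy slice: skips the past slots and returns the query slots instead.
buggy_past = all_slot_mappings[request_id][num_past:]             # [13, 14]

# Fixed slice: past context lives in the first num_past slots.
past_slot_mapping = all_slot_mappings[request_id][:num_past]      # [10, 11, 12]
slot_mapping = all_slot_mappings[request_id][num_past: num_past + num_queries]  # [13, 14]

# The two fixed slices partition the mapping with no overlap.
assert past_slot_mapping + slot_mapping == all_slot_mappings[request_id]
assert buggy_past == slot_mapping  # the bug: "past" aliased the query slots
```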