vllm-project · Yard1 · Jun 9, 2024 · May 31, 2024 · May 31, 2024 · May 31, 2024
@@ -421,8 +421,12 @@ def _schedule_running(
                 num_running_seqs = seq_group.get_max_num_running_seqs()
                 budget.subtract_num_seqs(seq_group.request_id,
                                          num_running_seqs)
-                if curr_loras is not None and seq_group.lora_int_id > 0:
-                    curr_loras.remove(seq_group.lora_int_id)
+                if (
+                    curr_loras is not None
+                    and seq_group.lora_int_id > 0
+                    and seq_group.lora_int_id in curr_loras
+                ):
+                        curr_loras.remove(seq_group.lora_int_id)
 
                 if running_queue:
                     # Preempt the lowest-priority sequence groups.