diff --git a/examples/phi3v_example.py b/examples/phi3v_example.py index 46b7be5cd94d8..f0b9b0e4fc959 100644 --- a/examples/phi3v_example.py +++ b/examples/phi3v_example.py @@ -10,8 +10,10 @@ def run_phi3v(): model_path = "microsoft/Phi-3-vision-128k-instruct" - # Note: The model has 128k context length by default which may cause OOM - # In this example, we override max_model_len to 2048. + # Note: The default setting of max_num_seqs (256) and + # max_model_len (128k) for this model may cause OOM. + # In this example, we override max_num_seqs to 5 while + # keeping the original context length of 128k. llm = LLM( model=model_path, trust_remote_code=True, @@ -19,7 +21,7 @@ def run_phi3v(): image_token_id=32044, image_input_shape="1,3,1008,1344", image_feature_size=1921, - max_model_len=2048, + max_num_seqs=5, ) image = Image.open("images/cherry_blossom.jpg")