diff --git a/docs/LLaVA-NeXT.md b/docs/LLaVA-NeXT.md
index 777a961f3..b8ac23bed 100644
--- a/docs/LLaVA-NeXT.md
+++ b/docs/LLaVA-NeXT.md
@@ -47,6 +47,8 @@ cont = model.generate(
     do_sample=False,
     temperature=0,
     max_new_tokens=256,
+    # Modalities should be the same size as the batch size
+    modalities=["image"]*input_ids.shape[0]
 )
 text_outputs = tokenizer.batch_decode(cont, skip_special_tokens=True)
 print(text_outputs)