add logging

yannicks1 · yannicks1 · commit e6b4b6ee24c1 · 2025-08-07T23:03:05.000+02:00
Signed-off-by: Yannick Schnider <Yannick.Schnider1@ibm.com>
diff --git a/vllm_spyre/v1/worker/spyre_model_runner.py b/vllm_spyre/v1/worker/spyre_model_runner.py
@@ -848,6 +848,8 @@ def _get_num_blocks_available(self) -> int:
             # hard coded value for tensor parallel size 4 with the below model
             # https://huggingface.co/ibm-granite/granite-3.3-8b-instruct
             NUM_BLOCKS_SPYRE = 2080
+            logger.info("Model granite-3.3-8b-instruct and tensor parallel " \
+            "size 4 detected. Using NUM_BLOCKS_SPYRE = %d", 2080)
         else:
             # default value for any other model/ tensor parallel size
             NUM_BLOCKS_SPYRE = max_batch_size * min_req_num_blocks