feat: update interpreter to print out model response messages in async mode

starpit · starpit · commit 77e9cd03cbe7 · 2025-03-07T10:08:11.000-05:00
Signed-off-by: Nick Mitchell &lt;nickm@us.ibm.com&gt;
diff --git a/src/pdl/pdl_llms.py b/src/pdl/pdl_llms.py
@@ -87,7 +87,7 @@ def generate_text(
         messages: ModelInput,
         parameters: dict[str, Any],
     ) -> tuple[LazyMessage, PdlLazy[Any]]:
-        print("Asynchronous model call started", file=stderr)
+        print(f"Asynchronous model call started to {block.model}", file=stderr)
         # global _BACKGROUND_TASKS
         future = asyncio.run_coroutine_threadsafe(
             LitellmModel.async_generate_text(
@@ -110,24 +110,29 @@ def update_end_nanos(future):
             if block.pdl__timing is not None:
                 block.pdl__timing.end_nanos = time.time_ns()
 
-                # report call completion and its duration (and if available queueing time)
-                res = future.result()[1]
+                # report call completion and its duration
                 start = (
                     block.pdl__timing.start_nanos
                     if block.pdl__timing.start_nanos is not None
                     else 0
                 )
                 exec_nanos = block.pdl__timing.end_nanos - start
-                queue_nanos = 0
-                if "created" in res:
-                    queue_nanos = (
-                        res["created"] * 1000000000 - block.pdl__timing.start_nanos
-                    )
-                    exec_nanos = exec_nanos - queue_nanos
                 print(
-                    f"Asynchronous model call to {block.model} completed in {(exec_nanos)/1000000}ms queued for {queue_nanos/1000000}ms",
+                    f"Asynchronous model call to {block.model} completed in {(exec_nanos)/1000000}ms",
                     file=stderr,
                 )
+                msg = future.result()[0]
+                if msg["content"] is not None:
+                    from termcolor import colored
+
+                    from .pdl_ast import BlockKind
+                    from .pdl_scheduler import color_of
+
+                    print(
+                        colored(msg["content"], color=color_of(BlockKind.MODEL)),
+                        file=stderr,
+                    )
+                    print("\n", file=stderr)
 
         future.add_done_callback(update_end_nanos)