Jupyternaut V3: Agentic tool-calling #1479
Open
dlqqq wants to merge 13 commits into jupyterlab:main from dlqqq:make-jupyternaut-agentic
Changes from all commits (13 commits):

3165e72  add 'litellm_utils' module (dlqqq)
d504b34  WIP: first working copy of Jupyternaut as an agent (dlqqq)
5aa46bf  clean up tool calling flow & show in chat (dlqqq)
7ba285d  add temporary default toolkit (dlqqq)
4059489  update tool calling APIs (dlqqq)
056676e  improve bash tool reliability, drop jupyter_ai_tools for now (dlqqq)
1311989  add jai-tool-call web component to show tool calls & outputs (dlqqq)
5223fa6  move litellm_utils => litellm_lib (dlqqq)
ea8a92a  migrate all agent logic to module using pocketflow (dlqqq)
fd950bd  add pocketflow as a dependency (dlqqq)
793fb4e  update jai-tool-call web component API to do less JSON parsing (dlqqq)
29f075d  remove debug logs (dlqqq)
95d2615  show writing indicator while processing request (dlqqq)

@@ -0,0 +1 @@
from .default_flow import *

packages/jupyter-ai/jupyter_ai/default_flow/default_flow.py (335 additions & 0 deletions)
@@ -0,0 +1,335 @@
from pocketflow import AsyncNode, AsyncFlow
from jupyterlab_chat.models import Message, NewMessage
from jupyterlab_chat.ychat import YChat
from typing import Any, Optional, Tuple, TypedDict
from jinja2 import Template
from litellm import acompletion, ModelResponseStream
import time
import logging

from ..litellm_lib import ToolCallList, run_tools, LitellmToolCallOutput
from ..tools import Toolkit
from ..personas import SYSTEM_USERNAME, PersonaAwareness

DEFAULT_RESPONSE_TEMPLATE = """
{{ content }}
{{ tool_call_ui_elements }}
""".strip()


class DefaultFlowParams(TypedDict):
    """
    Parameters expected by the default flow provided by Jupyter AI.
    """

    model_id: str

    ychat: YChat

    awareness: PersonaAwareness

    persona_id: str

    logger: logging.Logger

    model_args: dict[str, Any] | None
    """
    Custom keyword arguments forwarded to `litellm.acompletion()`. Defaults to
    `{}` if unset.
    """

    system_prompt: Optional[str]
    """
    System prompt that will be used as the first message in the list of messages
    sent to the language model. Unused if unset.
    """

    response_template: Template | None
    """
    Jinja2 template used to template the response. If one is not given,
    `DEFAULT_RESPONSE_TEMPLATE` is used.

    It should take `content: str` and `tool_call_ui_elements: str` as format arguments.
    """

    toolkit: Toolkit | None
    """
    Toolkit of tools. Unused if unset.
    """

    history_size: int | None
    """
    Number of messages preceding the message triggering this flow to include
    in the prompt as context. Defaults to 2 if unset.
    """


class JaiAsyncNode(AsyncNode):
    """
    An AsyncNode with custom properties & helper methods used exclusively in the
    Jupyter AI extension.
    """

    @property
    def model_id(self) -> str:
        return self.params["model_id"]

    @property
    def ychat(self) -> YChat:
        return self.params["ychat"]

    @property
    def awareness(self) -> PersonaAwareness:
        return self.params["awareness"]

    @property
    def persona_id(self) -> str:
        return self.params["persona_id"]

    @property
    def model_args(self) -> dict[str, Any]:
        return self.params.get("model_args", {})

    @property
    def system_prompt(self) -> Optional[str]:
        return self.params.get("system_prompt")

    @property
    def response_template(self) -> Template:
        template = self.params.get("response_template")
        # If response template was unspecified, use the default response
        # template.
        if not template:
            template = Template(DEFAULT_RESPONSE_TEMPLATE)

        return template

    @property
    def toolkit(self) -> Optional[Toolkit]:
        return self.params.get("toolkit")

    @property
    def history_size(self) -> int:
        return self.params.get("history_size", 2)

    @property
    def log(self) -> logging.Logger:
        return self.params.get("logger")


class RootNode(JaiAsyncNode):
    """
    The root node of the default flow provided by Jupyter AI.
    """

    async def prep_async(self, shared):
        # Initialize `shared.litellm_messages` using the YChat message history
        # if it is unset.
        if not ('litellm_messages' in shared and isinstance(shared['litellm_messages'], list) and len(shared['litellm_messages']) > 0):
            shared['litellm_messages'] = self._init_litellm_messages()

        # Return `shared.litellm_messages`. This is passed as the `prep_res`
        # argument to `exec_async()`.
        return shared['litellm_messages']

    def _init_litellm_messages(self) -> list[dict]:
        # Store the invoking message & the previous `params.history_size` messages
        # as `ychat_messages`.
        # TODO: ensure the invoking message is in this list
        all_messages = self.ychat.get_messages()
        ychat_messages: list[Message] = all_messages[-self.history_size - 1:]

        # Coerce each `Message` in `ychat_messages` to a dictionary following
        # the OpenAI spec, and store it as `litellm_messages`.
        litellm_messages: list[dict[str, Any]] = []
        for msg in ychat_messages:
            role = (
                "assistant"
                if msg.sender.startswith("jupyter-ai-personas::")
                else "system" if msg.sender == SYSTEM_USERNAME else "user"
            )
            litellm_messages.append({"role": role, "content": msg.body})

        # Insert system message as a dictionary if present.
        if self.system_prompt:
            system_litellm_message = {
                "role": "system",
                "content": self.system_prompt
            }
            litellm_messages = [system_litellm_message, *litellm_messages]

        # Return `litellm_messages`
        return litellm_messages

    async def exec_async(self, prep_res: list[dict]):
        self.log.info("Running RootNode.exec_async()")
        # Gather arguments and start a reply stream via LiteLLM
        reply_stream = await acompletion(
            **self.model_args,
            model=self.model_id,
            messages=prep_res,
            tools=self.toolkit.to_json(),
            stream=True,
        )

        # Iterate over reply stream
        content = ""
        tool_calls = ToolCallList()
        stream_id: str | None = None
        async for chunk in reply_stream:
            assert isinstance(chunk, ModelResponseStream)
            delta = chunk.choices[0].delta
            content_delta = delta.content
            toolcalls_delta = delta.tool_calls

            # Continue early if an empty chunk was emitted.
            # This sometimes happens with LiteLLM.
            if not (content_delta or toolcalls_delta):
                continue

            # Aggregate the content and tool calls from the deltas
            if content_delta:
                content += content_delta
            if toolcalls_delta:
                tool_calls += toolcalls_delta

            # Create a new message if one does not yet exist
            if not stream_id:
                stream_id = self.ychat.add_message(NewMessage(
                    sender=self.persona_id,
                    body=""
                ))
            assert stream_id

            # Update the reply
            message_body = self.response_template.render({
                "content": content,
                "tool_call_ui_elements": tool_calls.render()
            })
            self.ychat.update_message(
                Message(
                    id=stream_id,
                    body=message_body,
                    time=time.time(),
                    sender=self.persona_id,
                    raw_time=False,
                )
            )

        # Return message_id, content, and tool calls
        return stream_id, content, tool_calls

    async def post_async(self, shared, prep_res, exec_res: Tuple[str, str, ToolCallList]):
        self.log.info("Running RootNode.post_async()")
        # Assert that `shared['litellm_messages']` is of the correct type, and
        # that any tool calls returned are complete.
        message_id, content, tool_calls = exec_res
        assert 'litellm_messages' in shared and isinstance(shared['litellm_messages'], list)
        assert tool_calls.complete

        # Add AI response to `shared['litellm_messages']`, including tool calls
        new_litellm_message = {
            "role": "assistant",
            "content": content
        }
        if len(tool_calls):
            new_litellm_message['tool_calls'] = tool_calls.as_litellm_tool_calls()
        shared['litellm_messages'].append(new_litellm_message)

        # Add message ID to `shared['prev_message_id']`
        shared['prev_message_id'] = message_id

        # Add message content to `shared['prev_message_content']`
        shared['prev_message_content'] = content

        # Add tool calls to `shared['next_tool_calls']`
        shared['next_tool_calls'] = tool_calls

        # Trigger `ToolExecutorNode` if tools were called.
        if len(tool_calls):
            return "execute-tools"
        return 'finish'


class ToolExecutorNode(JaiAsyncNode):
    """
    Node responsible for executing tool calls in the default flow.
    """

    async def prep_async(self, shared):
        self.log.info("Running ToolExecutorNode.prep_async()")
        # Extract `shared['next_tool_calls']` and the ID of the last message
        assert 'next_tool_calls' in shared and isinstance(shared['next_tool_calls'], ToolCallList)
        assert 'prev_message_id' in shared and isinstance(shared['prev_message_id'], str)

        # Return list of tool calls as a list of dictionaries
        return shared['prev_message_id'], shared['next_tool_calls']

    async def exec_async(self, prep_res: Tuple[str, ToolCallList]) -> list[LitellmToolCallOutput]:
        self.log.info("Running ToolExecutorNode.exec_async()")
        message_id, tool_calls = prep_res

        # TODO: Run 1 tool at a time?
        outputs = await run_tools(tool_calls, self.toolkit)

        return outputs

    async def post_async(self, shared, prep_res: Tuple[str, ToolCallList], exec_res: list[LitellmToolCallOutput]):
        self.log.info("Running ToolExecutorNode.post_async()")

        # Update last message to include outputs
        prev_message_id = shared['prev_message_id']
        prev_message_content = shared['prev_message_content']
        tool_calls: ToolCallList = shared['next_tool_calls']
        message_body = self.response_template.render({
            "content": prev_message_content,
            "tool_call_ui_elements": tool_calls.render(
                outputs=exec_res
            )
        })
        self.ychat.update_message(
            Message(
                id=prev_message_id,
                body=message_body,
                time=time.time(),
                sender=self.persona_id,
                raw_time=False,
            )
        )

        # Add tool outputs to `shared['litellm_messages']`
        shared['litellm_messages'].extend(exec_res)

        # Delete shared state that is now stale
        del shared['prev_message_id']
        del shared['prev_message_content']
        del shared['next_tool_calls']
        # This node will automatically return to `RootNode` after execution.


async def run_default_flow(params: DefaultFlowParams):
    # Initialize nodes
    root_node = RootNode()
    tool_executor_node = ToolExecutorNode()

    # Define state transitions
    ## Flow to ToolExecutorNode if tool calls were dispatched
    root_node - "execute-tools" >> tool_executor_node
    ## Always flow back to RootNode after running tools
    tool_executor_node >> root_node
    ## End the flow if no tool calls were dispatched
    root_node - "finish" >> AsyncNode()

    # Initialize flow and set its parameters
    flow = AsyncFlow(start=root_node)
    flow.set_params(params)

    # Finally, run the flow
    try:
        params['awareness'].set_local_state_field("isWriting", True)
        await flow.run_async({})
    except Exception as e:
        # TODO: implement error handling
        params['logger'].exception("Exception occurred while running default agent flow:")
    finally:
        params['awareness'].set_local_state_field("isWriting", False)
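
For orientation, here is a minimal sketch of how a persona could invoke this flow. It is not part of the diff: the import path follows the package layout above, the model ID is an arbitrary LiteLLM identifier, and the `self.*` attributes are stand-ins for whatever the calling persona actually exposes.

# Hypothetical caller (not in this PR): a persona handling a new chat message.
# Only run_default_flow / DefaultFlowParams come from default_flow.py above;
# every attribute on `self` is an assumed stand-in.
from jupyter_ai.default_flow import DefaultFlowParams, run_default_flow

async def process_message(self, message) -> None:
    params: DefaultFlowParams = {
        "model_id": "openai/gpt-4o",   # any LiteLLM model ID
        "ychat": self.ychat,           # chat document the reply streams into
        "awareness": self.awareness,   # drives the "isWriting" indicator
        "persona_id": self.id,         # sender attached to the reply message
        "logger": self.log,
        "model_args": {},              # extra kwargs forwarded to acompletion()
        "system_prompt": "You are Jupyternaut, a JupyterLab assistant.",
        "response_template": None,     # falls back to DEFAULT_RESPONSE_TEMPLATE
        "toolkit": self.toolkit,       # tools offered to the model
        "history_size": 2,             # prior messages included as context
    }
    # Streams the reply (and tool-call UI elements) into the YChat, looping
    # between RootNode and ToolExecutorNode until no more tools are called.
    await run_default_flow(params)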
@@ -0,0 +1,3 @@
from .run_tools import *
from .toolcall_list import *
from .types import *
@@ -0,0 +1,50 @@
from __future__ import annotations
from typing import TYPE_CHECKING
import asyncio

if TYPE_CHECKING:
    from ..tools import Toolkit
    from .toolcall_list import ToolCallList
    from .types import LitellmToolCallOutput


async def run_tools(tool_call_list: ToolCallList, toolkit: Toolkit) -> list[LitellmToolCallOutput]:
    """
    Runs the tools specified in the list of tool calls returned by the
    language model.

    Returns `list[LitellmToolCallOutput]`, a list of output dictionaries of the
    type expected by LiteLLM.

    Each output in the list should be appended directly to the message history
    on the next request made to the LLM.
    """
    tool_calls = tool_call_list.resolve()
    if not len(tool_calls):
        return []

    tool_outputs: list[LitellmToolCallOutput] = []
    for tool_call in tool_calls:
        # Get tool definition from the correct toolkit
        # TODO: validation?
        tool_name = tool_call.function.name
        tool_defn = toolkit.get_tool_unsafe(tool_name)

        # Run tool and store its output
        try:
            output = tool_defn.callable(**tool_call.function.arguments)
            if asyncio.iscoroutine(output):
                output = await output
        except Exception as e:
            output = str(e)

        # Store the tool output in a dictionary accepted by LiteLLM
        output_dict: LitellmToolCallOutput = {
            "tool_call_id": tool_call.id,
            "role": "tool",
            "name": tool_call.function.name,
            "content": output,
        }
        tool_outputs.append(output_dict)

    return tool_outputs
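
To make the return contract concrete, here is a small, self-contained sketch that drives run_tools with stand-in objects. FakeToolkit, FakeToolCallList, and get_weather are hypothetical: they only mimic the attributes run_tools actually touches (get_tool_unsafe(), resolve(), .id, .function.name, .function.arguments) and assume the arguments have already been parsed into a dict by the time resolve() returns. The import path follows the litellm_lib package referenced in default_flow.py.

# Illustrative stand-ins only; the real Toolkit / ToolCallList live elsewhere
# in this PR and may differ.
import asyncio
from types import SimpleNamespace
from jupyter_ai.litellm_lib import run_tools

def get_weather(city: str) -> str:
    return f"Sunny in {city}"

class FakeToolkit:
    def get_tool_unsafe(self, name):
        # The real Toolkit looks tools up by name; here there is only one.
        assert name == "get_weather"
        return SimpleNamespace(callable=get_weather)

class FakeToolCallList:
    def resolve(self):
        # Mimics one fully-aggregated tool call with parsed arguments.
        return [SimpleNamespace(
            id="call_1",
            function=SimpleNamespace(name="get_weather", arguments={"city": "Paris"}),
        )]

async def main():
    outputs = await run_tools(FakeToolCallList(), FakeToolkit())
    # Each output is an OpenAI-style "tool" message, ready to append to the
    # conversation before the next acompletion() call:
    # [{"tool_call_id": "call_1", "role": "tool",
    #   "name": "get_weather", "content": "Sunny in Paris"}]
    print(outputs)

asyncio.run(main())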
Review comment: Is this too limiting? For example, there could be tools from multiple toolkits that I might end up using.
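
One possible direction, sketched with heavy caveats: the flow only calls to_json() and get_tool_unsafe() on its toolkit, so a thin aggregator could present several toolkits as one without changing run_tools or the flow. The Toolkit interface is not fully shown in this diff, so the method names and return shapes below are assumptions, not the actual class.

# Hedged sketch: combine several toolkits behind the two methods the default
# flow actually uses. Assumes to_json() returns a list of tool specs and
# get_tool_unsafe() returns None or raises for unknown names.
class CombinedToolkit:
    def __init__(self, *toolkits):
        self.toolkits = toolkits

    def to_json(self):
        # Concatenate the OpenAI-style tool specs from every toolkit.
        specs = []
        for toolkit in self.toolkits:
            specs.extend(toolkit.to_json())
        return specs

    def get_tool_unsafe(self, name):
        # First match wins; later toolkits are shadowed on name collisions.
        for toolkit in self.toolkits:
            try:
                tool = toolkit.get_tool_unsafe(name)
            except Exception:
                tool = None
            if tool is not None:
                return tool
        raise KeyError(f"No tool named {name!r} in any toolkit")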