jspv
diff --git a/python/packages/autogen-agentchat/src/autogen_agentchat/agents/_assistant_agent.py b/python/packages/autogen-agentchat/src/autogen_agentchat/agents/_assistant_agent.py
Lines changed: 1 addition & 0 deletions
diff --git a/python/packages/autogen-agentchat/tests/test_assistant_agent.py b/python/packages/autogen-agentchat/tests/test_assistant_agent.py
Lines changed: 63 additions & 9 deletions
diff --git a/python/packages/autogen-agentchat/tests/test_group_chat.py b/python/packages/autogen-agentchat/tests/test_group_chat.py
Lines changed: 21 additions & 3 deletions
diff --git a/python/packages/autogen-core/docs/src/user-guide/agentchat-user-guide/migration-guide.md b/python/packages/autogen-core/docs/src/user-guide/agentchat-user-guide/migration-guide.md
Lines changed: 1 addition & 0 deletions
diff --git a/python/packages/autogen-core/docs/src/user-guide/agentchat-user-guide/tutorial/models.ipynb b/python/packages/autogen-core/docs/src/user-guide/agentchat-user-guide/tutorial/models.ipynb
Lines changed: 1 addition & 0 deletions
diff --git a/python/packages/autogen-core/docs/src/user-guide/autogenstudio-user-guide/faq.md b/python/packages/autogen-core/docs/src/user-guide/autogenstudio-user-guide/faq.md
Lines changed: 3 additions & 2 deletions
diff --git a/python/packages/autogen-core/src/autogen_core/models/_model_client.py b/python/packages/autogen-core/src/autogen_core/models/_model_client.py
Lines changed: 43 additions & 4 deletions
diff --git a/python/packages/autogen-core/tests/test_models.py b/python/packages/autogen-core/tests/test_models.py
Lines changed: 1 addition & 0 deletions
diff --git a/python/packages/autogen-core/tests/test_tool_agent.py b/python/packages/autogen-core/tests/test_tool_agent.py
Lines changed: 10 additions & 3 deletions
diff --git a/python/packages/autogen-ext/src/autogen_ext/experimental/task_centric_memory/utils/chat_completion_client_recorder.py b/python/packages/autogen-ext/src/autogen_ext/experimental/task_centric_memory/utils/chat_completion_client_recorder.py
Lines changed: 3 additions & 2 deletions
@@ -574,6 +574,7 @@ async def get_messages(self) -> List[LLMMessage]:
                     "function_calling": False,
                     "json_output": False,
                     "family": ModelFamily.R1,
+                    "structured_output": True,
                 },
             )
 
 
@@ -68,7 +68,13 @@ async def test_run_with_tools(monkeypatch: pytest.MonkeyPatch) -> None:
             "pass",
             "TERMINATE",
         ],
-        model_info={"function_calling": True, "vision": True, "json_output": True, "family": ModelFamily.GPT_4O},
+        model_info={
+            "function_calling": True,
+            "vision": True,
+            "json_output": True,
+            "family": ModelFamily.GPT_4O,
+            "structured_output": True,
+        },
     )
     agent = AssistantAgent(
         "tool_use_agent",
@@ -150,7 +156,13 @@ async def test_run_with_tools_and_reflection() -> None:
                 cached=False,
             ),
         ],
-        model_info={"function_calling": True, "vision": True, "json_output": True, "family": ModelFamily.GPT_4O},
+        model_info={
+            "function_calling": True,
+            "vision": True,
+            "json_output": True,
+            "family": ModelFamily.GPT_4O,
+            "structured_output": True,
+        },
     )
     agent = AssistantAgent(
         "tool_use_agent",
@@ -236,7 +248,13 @@ async def test_run_with_parallel_tools() -> None:
             "pass",
             "TERMINATE",
         ],
-        model_info={"function_calling": True, "vision": True, "json_output": True, "family": ModelFamily.GPT_4O},
+        model_info={
+            "function_calling": True,
+            "vision": True,
+            "json_output": True,
+            "family": ModelFamily.GPT_4O,
+            "structured_output": True,
+        },
     )
     agent = AssistantAgent(
         "tool_use_agent",
@@ -315,7 +333,13 @@ async def test_run_with_parallel_tools_with_empty_call_ids() -> None:
             "pass",
             "TERMINATE",
         ],
-        model_info={"function_calling": True, "vision": True, "json_output": True, "family": ModelFamily.GPT_4O},
+        model_info={
+            "function_calling": True,
+            "vision": True,
+            "json_output": True,
+            "family": ModelFamily.GPT_4O,
+            "structured_output": True,
+        },
     )
     agent = AssistantAgent(
         "tool_use_agent",
@@ -389,7 +413,13 @@ async def test_handoffs() -> None:
                 cached=False,
             )
         ],
-        model_info={"function_calling": True, "vision": True, "json_output": True, "family": ModelFamily.GPT_4O},
+        model_info={
+            "function_calling": True,
+            "vision": True,
+            "json_output": True,
+            "family": ModelFamily.GPT_4O,
+            "structured_output": True,
+        },
     )
     tool_use_agent = AssistantAgent(
         "tool_use_agent",
@@ -447,7 +477,13 @@ async def test_invalid_model_capabilities() -> None:
     model_client = OpenAIChatCompletionClient(
         model=model,
         api_key="",
-        model_info={"vision": False, "function_calling": False, "json_output": False, "family": ModelFamily.UNKNOWN},
+        model_info={
+            "vision": False,
+            "function_calling": False,
+            "json_output": False,
+            "family": ModelFamily.UNKNOWN,
+            "structured_output": False,
+        },
     )
 
     with pytest.raises(ValueError):
@@ -473,12 +509,24 @@ async def test_remove_images() -> None:
     model_client_1 = OpenAIChatCompletionClient(
         model=model,
         api_key="",
-        model_info={"vision": False, "function_calling": False, "json_output": False, "family": ModelFamily.UNKNOWN},
+        model_info={
+            "vision": False,
+            "function_calling": False,
+            "json_output": False,
+            "family": ModelFamily.UNKNOWN,
+            "structured_output": False,
+        },
     )
     model_client_2 = OpenAIChatCompletionClient(
         model=model,
         api_key="",
-        model_info={"vision": True, "function_calling": False, "json_output": False, "family": ModelFamily.UNKNOWN},
+        model_info={
+            "vision": True,
+            "function_calling": False,
+            "json_output": False,
+            "family": ModelFamily.UNKNOWN,
+            "structured_output": False,
+        },
     )
 
     img_base64 = "iVBORw0KGgoAAAANSUhEUgAAAAEAAAABCAIAAACQd1PeAAAADElEQVR4nGP4//8/AAX+Av4N70a4AAAAAElFTkSuQmCC"
@@ -642,7 +690,13 @@ class BadMemory:
 async def test_assistant_agent_declarative() -> None:
     model_client = ReplayChatCompletionClient(
         ["Response to message 3"],
-        model_info={"function_calling": True, "vision": True, "json_output": True, "family": ModelFamily.GPT_4O},
+        model_info={
+            "function_calling": True,
+            "vision": True,
+            "json_output": True,
+            "family": ModelFamily.GPT_4O,
+            "structured_output": True,
+        },
     )
     model_context = BufferedChatCompletionContext(buffer_size=2)
     agent = AssistantAgent(
 
@@ -259,7 +259,13 @@ async def test_round_robin_group_chat_with_tools(runtime: AgentRuntime | None) -
             "Hello",
             "TERMINATE",
         ],
-        model_info={"family": "gpt-4o", "function_calling": True, "json_output": True, "vision": True},
+        model_info={
+            "family": "gpt-4o",
+            "function_calling": True,
+            "json_output": True,
+            "vision": True,
+            "structured_output": True,
+        },
     )
     tool = FunctionTool(_pass_function, name="pass", description="pass function")
     tool_use_agent = AssistantAgent("tool_use_agent", model_client=model_client, tools=[tool])
@@ -805,7 +811,13 @@ async def test_swarm_handoff_using_tool_calls(runtime: AgentRuntime | None) -> N
             "Hello",
             "TERMINATE",
         ],
-        model_info={"family": "gpt-4o", "function_calling": True, "json_output": True, "vision": True},
+        model_info={
+            "family": "gpt-4o",
+            "function_calling": True,
+            "json_output": True,
+            "vision": True,
+            "structured_output": True,
+        },
     )
     agent1 = AssistantAgent(
         "agent1",
@@ -889,7 +901,13 @@ async def test_swarm_with_parallel_tool_calls(runtime: AgentRuntime | None) -> N
             "Hello",
             "TERMINATE",
         ],
-        model_info={"family": "gpt-4o", "function_calling": True, "json_output": True, "vision": True},
+        model_info={
+            "family": "gpt-4o",
+            "function_calling": True,
+            "json_output": True,
+            "vision": True,
+            "structured_output": True,
+        },
     )
 
     expected_handoff_context: List[LLMMessage] = [
 
@@ -154,6 +154,7 @@ custom_model_client = OpenAIChatCompletionClient(
         "function_calling": True,
         "json_output": True,
         "family": "unknown",
+        "structured_output": True,
     },
 )
 ```
 
@@ -251,6 +251,7 @@
     "        \"function_calling\": False,\n",
     "        \"vision\": False,\n",
     "        \"family\": \"unknown\",\n",
+    "        \"structured_output\": False,\n",
     "    },\n",
     ")\n",
     "\n",
 
@@ -48,7 +48,7 @@ print(anthropic_client.dump_component().model_dump_json())
 mistral_vllm_model = OpenAIChatCompletionClient(
         model="TheBloke/Mistral-7B-Instruct-v0.2-GGUF",
         base_url="http://localhost:1234/v1",
-        model_info=ModelInfo(vision=False, function_calling=True, json_output=False, family="unknown"),
+        model_info=ModelInfo(vision=False, function_calling=True, json_output=False, family="unknown", structured_output=True),
     )
 print(mistral_vllm_model.dump_component().model_dump_json())
 ```
@@ -122,7 +122,8 @@ Have a local model server like Ollama, vLLM or LMStudio that provide an OpenAI c
       "vision": false,
       "function_calling": true,
       "json_output": false,
-      "family": "unknown"
+      "family": "unknown",
+      "structured_output": true
     },
     "base_url": "http://localhost:1234/v1"
   }
 
@@ -107,6 +107,8 @@ class ModelInfo(TypedDict, total=False):
     """True if the model supports json output, otherwise False. Note: this is different to structured json."""
     family: Required[ModelFamily.ANY | str]
     """Model family should be one of the constants from :py:class:`ModelFamily` or a string representing an unknown model family."""
+    structured_output: Required[bool]
+    """True if the model supports structured output, otherwise False. This is different to json_output."""
 
 
 def validate_model_info(model_info: ModelInfo) -> None:
@@ -122,6 +124,15 @@ def validate_model_info(model_info: ModelInfo) -> None:
                 f"Missing required field '{field}' in ModelInfo. "
                 "Starting in v0.4.7, the required fields are enforced."
             )
+    new_required_fields = ["structured_output"]
+    for field in new_required_fields:
+        if field not in model_info:
+            warnings.warn(
+                f"Missing required field '{field}' in ModelInfo. "
+                "This field will be required in a future version of AutoGen.",
+                UserWarning,
+                stacklevel=2,
+            )
 
 
 class ChatCompletionClient(ComponentBase[BaseModel], ABC):
@@ -134,10 +145,24 @@ async def create(
         tools: Sequence[Tool | ToolSchema] = [],
         # None means do not override the default
         # A value means to override the client default - often specified in the constructor
-        json_output: Optional[bool] = None,
+        json_output: Optional[bool | type[BaseModel]] = None,
         extra_create_args: Mapping[str, Any] = {},
         cancellation_token: Optional[CancellationToken] = None,
-    ) -> CreateResult: ...
+    ) -> CreateResult:
+        """Creates a single response from the model.
+
+        Args:
+            messages (Sequence[LLMMessage]): The messages to send to the model.
+            tools (Sequence[Tool | ToolSchema], optional): The tools to use with the model. Defaults to [].
+            json_output (Optional[bool | type[BaseModel]], optional): Whether to use JSON mode, structured output, or neither. Defaults to None. If set to a type, it will be used as the output type
+                for structured output. If set to a boolean, it will be used to determine whether to use JSON mode or not.
+            extra_create_args (Mapping[str, Any], optional): Extra arguments to pass to the underlying client. Defaults to {}.
+            cancellation_token (Optional[CancellationToken], optional): A token for cancellation. Defaults to None.
+
+        Returns:
+            CreateResult: The result of the model call.
+        """
+        ...
 
     @abstractmethod
     def create_stream(
@@ -147,10 +172,24 @@ def create_stream(
         tools: Sequence[Tool | ToolSchema] = [],
         # None means do not override the default
         # A value means to override the client default - often specified in the constructor
-        json_output: Optional[bool] = None,
+        json_output: Optional[bool | type[BaseModel]] = None,
         extra_create_args: Mapping[str, Any] = {},
         cancellation_token: Optional[CancellationToken] = None,
-    ) -> AsyncGenerator[Union[str, CreateResult], None]: ...
+    ) -> AsyncGenerator[Union[str, CreateResult], None]:
+        """Creates a stream of string chunks from the model ending with a CreateResult.
+
+        Args:
+            messages (Sequence[LLMMessage]): The messages to send to the model.
+            tools (Sequence[Tool | ToolSchema], optional): The tools to use with the model. Defaults to [].
+            json_output (Optional[bool | type[BaseModel]], optional): Whether to use JSON mode, structured output, or neither. Defaults to None. If set to a type, it will be used as the output type
+                for structured output. If set to a boolean, it will be used to determine whether to use JSON mode or not.
+            extra_create_args (Mapping[str, Any], optional): Extra arguments to pass to the underlying client. Defaults to {}.
+            cancellation_token (Optional[CancellationToken], optional): A token for cancellation. Defaults to None.
+
+        Returns:
+            AsyncGenerator[Union[str, CreateResult], None]: A generator that yields string chunks and ends with a :py:class:`CreateResult`.
+        """
+        ...
 
     @abstractmethod
     async def close(self) -> None: ...
 
@@ -9,6 +9,7 @@ def test_model_info() -> None:
         "vision": True,
         "function_calling": True,
         "json_output": True,
+        "structured_output": True,
     }
     validate_model_info(info)
 
 
@@ -25,6 +25,7 @@
     tool_agent_caller_loop,
 )
 from autogen_core.tools import FunctionTool, Tool, ToolSchema
+from pydantic import BaseModel
 
 logging.getLogger(EVENT_LOGGER_NAME).setLevel(logging.INFO)
 
@@ -101,7 +102,7 @@ async def create(
             messages: Sequence[LLMMessage],
             *,
             tools: Sequence[Tool | ToolSchema] = [],
-            json_output: Optional[bool] = None,
+            json_output: Optional[bool | type[BaseModel]] = None,
             extra_create_args: Mapping[str, Any] = {},
             cancellation_token: Optional[CancellationToken] = None,
         ) -> CreateResult:
@@ -126,7 +127,7 @@ def create_stream(
             messages: Sequence[LLMMessage],
             *,
             tools: Sequence[Tool | ToolSchema] = [],
-            json_output: Optional[bool] = None,
+            json_output: Optional[bool | type[BaseModel]] = None,
             extra_create_args: Mapping[str, Any] = {},
             cancellation_token: Optional[CancellationToken] = None,
         ) -> AsyncGenerator[Union[str, CreateResult], None]:
@@ -153,7 +154,13 @@ def capabilities(self) -> ModelCapabilities:  # type: ignore
 
         @property
         def model_info(self) -> ModelInfo:
-            return ModelInfo(vision=False, function_calling=True, json_output=False, family=ModelFamily.UNKNOWN)
+            return ModelInfo(
+                vision=False,
+                function_calling=True,
+                json_output=False,
+                family=ModelFamily.UNKNOWN,
+                structured_output=False,
+            )
 
     client = MockChatCompletionClient()
     tools: List[Tool] = [FunctionTool(_pass_function, name="pass", description="Pass function")]
 
@@ -13,6 +13,7 @@
     RequestUsage,
 )
 from autogen_core.tools import Tool, ToolSchema
+from pydantic import BaseModel
 
 from .page_logger import PageLogger
 
@@ -87,7 +88,7 @@ async def create(
         messages: Sequence[LLMMessage],
         *,
         tools: Sequence[Tool | ToolSchema] = [],
-        json_output: Optional[bool] = None,
+        json_output: Optional[bool | type[BaseModel]] = None,
         extra_create_args: Mapping[str, Any] = {},
         cancellation_token: Optional[CancellationToken] = None,
     ) -> CreateResult:
@@ -154,7 +155,7 @@ def create_stream(
         messages: Sequence[LLMMessage],
         *,
         tools: Sequence[Tool | ToolSchema] = [],
-        json_output: Optional[bool] = None,
+        json_output: Optional[bool | type[BaseModel]] = None,
         extra_create_args: Mapping[str, Any] = {},
         cancellation_token: Optional[CancellationToken] = None,
     ) -> AsyncGenerator[Union[str, CreateResult], None]:
Original file line number	Diff line number	Diff line change
`@@ -574,6 +574,7 @@ async def get_messages(self) -> List[LLMMessage]:`
`574`	`574`	`"function_calling": False,`
`575`	`575`	`"json_output": False,`
`576`	`576`	`"family": ModelFamily.R1,`
	`577`	`+ "structured_output": True,`
`577`	`578`	`},`
`578`	`579`	`)`
`579`	`580`
Original file line number	Diff line number	Diff line change
`@@ -154,6 +154,7 @@ custom_model_client = OpenAIChatCompletionClient(`
`154`	`154`	`"function_calling": True,`
`155`	`155`	`"json_output": True,`
`156`	`156`	`"family": "unknown",`
	`157`	`+ "structured_output": True,`
`157`	`158`	`},`
`158`	`159`	`)`
`159`	`160`	```
Original file line number	Diff line number	Diff line change
`@@ -9,6 +9,7 @@ def test_model_info() -> None:`
`9`	`9`	`"vision": True,`
`10`	`10`	`"function_calling": True,`
`11`	`11`	`"json_output": True,`
	`12`	`+ "structured_output": True,`
`12`	`13`	`}`
`13`	`14`	`validate_model_info(info)`
`14`	`15`